-
Notifications
You must be signed in to change notification settings - Fork 55
/
Copy pathllama3-1_finetune_remote.yaml
84 lines (75 loc) · 2.41 KB
/
llama3-1_finetune_remote.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
# Apache Software License 2.0
#
# Copyright (c) ZenML GmbH 2024. All rights reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#
model:
name: llm-peft-llama-3-1
description: "Fine-tune `llama-3.1`."
tags:
- llm
- peft
- llama-3.1
version: 300_steps
settings:
docker:
parent_image: pytorch/pytorch:2.2.2-cuda11.8-cudnn8-runtime
requirements: requirements.txt
python_package_installer: uv
python_package_installer_args:
system: null
apt_packages:
- git
environment:
PJRT_DEVICE: CUDA
USE_TORCH_XLA: "false"
MKL_SERVICE_FORCE_INTEL: "1"
parameters:
base_model_id: meta-llama/Meta-Llama-3.1-8B
use_fast: False
load_in_4bit: True
system_prompt: |
Given a target sentence construct the underlying meaning representation of the input sentence as a single function with attributes and attribute values.
This function should describe the target string accurately and the function must be one of the following ['inform', 'request', 'give_opinion', 'confirm', 'verify_attribute', 'suggest', 'request_explanation', 'recommend', 'request_attribute'].
The attributes must be one of the following: ['name', 'exp_release_date', 'release_year', 'developer', 'esrb', 'rating', 'genres', 'player_perspective', 'has_multiplayer', 'platforms', 'available_on_steam', 'has_linux_release', 'has_mac_release', 'specifier']
steps:
prepare_data:
parameters:
dataset_name: gem/viggo
finetune:
step_operator: gcp_a100
retry:
max_retries: 3
delay: 10
backoff: 2
parameters:
max_steps: 300
eval_steps: 30
bf16: True
evaluate_finetuned:
step_operator: gcp_a100
retry:
max_retries: 3
delay: 10
backoff: 2
evaluate_base:
step_operator: gcp_a100
retry:
max_retries: 3
delay: 10
backoff: 2
promote:
parameters:
metric: rouge2
target_stage: staging