Skip to content

Commit 213f386

Browse files
authored
Add eval config for QWEN2_5 model using 0.5B variant (meta-pytorch#2230)
1 parent 9fd1ead commit 213f386

File tree

2 files changed

+45
-0
lines changed

2 files changed

+45
-0
lines changed
Lines changed: 41 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,41 @@
1+
# Config for EleutherEvalRecipe in eleuther_eval.py, evaluating the Qwen2.5 0.5B model
2+
#
3+
# To launch, run the following command from root torchtune directory:
4+
# tune run eleuther_eval --config qwen2_5/evaluation tasks=["truthfulqa_mc2","hellaswag"]
5+
6+
output_dir: ./ # Not needed for evaluation itself; only interpolated into checkpointer.output_dir below
7+
8+
# Model Arguments
9+
model:
10+
_component_: torchtune.models.qwen2_5.qwen2_5_0_5b
11+
12+
checkpointer:
13+
_component_: torchtune.training.FullModelHFCheckpointer
14+
checkpoint_dir: /tmp/Qwen2_5-0_5B-Instruct
15+
checkpoint_files: [
16+
model.safetensors,
17+
]
18+
output_dir: ${output_dir}
19+
model_type: QWEN2
20+
21+
# Tokenizer
22+
tokenizer:
23+
_component_: torchtune.models.qwen2_5.qwen2_5_tokenizer
24+
path: /tmp/Qwen2_5-0_5B-Instruct/vocab.json
25+
merges_file: /tmp/Qwen2_5-0_5B-Instruct/merges.txt
26+
max_seq_len: null
27+
28+
# Environment
29+
device: cuda
30+
dtype: bf16
31+
seed: 1234 # Changing this seed is not recommended, because it matches EleutherAI's default seed
32+
33+
# EleutherAI specific eval args
34+
tasks: ["truthfulqa_mc2"]
35+
limit: null
36+
max_seq_length: 4096
37+
batch_size: 8
38+
enable_kv_cache: True
39+
40+
# Quantization specific args
41+
quantizer: null

torchtune/_recipe_registry.py

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -457,6 +457,10 @@ class Recipe:
457457
name="qwen2/evaluation",
458458
file_path="qwen2/evaluation.yaml",
459459
),
460+
Config(
461+
name="qwen2_5/evaluation",
462+
file_path="qwen2_5/evaluation.yaml",
463+
),
460464
Config(
461465
name="gemma/evaluation",
462466
file_path="gemma/evaluation.yaml",

0 commit comments

Comments
 (0)