# cot_fix_plus_gpq_triviaqa.yaml
# Forked from mlfoundations/dclm.
# Top-level run settings.
# NOTE(review): `epoch`, `dataset` and `num_params` look like descriptive
# labels for the model being evaluated -- confirm against the consumer.
# The number-looking labels are quoted so they are always read as strings.
epoch: '1.25T'
dataset: bigdata
num_params: '1B'
# Same value as tokenizer.kwargs.model_max_length below.
max_seq_len: 2048
seed: 1
precision: fp32
# Tokenizer
# The keys below belong to the `tokenizer` mapping; `model_max_length` is an
# entry of `tokenizer.kwargs`.
tokenizer:
  # name: [Add name from memory]
  # Placeholder: no tokenizer path is set in this file (explicit null).
  pretrained_model_name_or_path: null
  kwargs:
    # Same value as the top-level max_seq_len.
    model_max_length: 2048
# Model settings; every key below is a child of `model`.
model:
  name: open_lm
  # pretrained_model_name_or_path: [add name from memory]
  init_device: cpu
  pretrained: true
# Add your (optional) Composer checkpoint path here!
# No path is set in this file, so the value is null.
load_path: null
# NOTE(review): presumably the per-device batch size used during
# evaluation -- confirm against the consumer.
device_eval_batch_size: 2
# FSDP config for model sharding
# Both settings are children of `fsdp_config`.
fsdp_config:
  sharding_strategy: FULL_SHARD
  mixed_precision: FULL
# Evaluation task list. Each `-` entry is one task mapping; the list uses the
# flush style (dash at the same column as the parent key).
icl_tasks:
-
  # GSM8K question answering, 3 few-shot examples; the continuation
  # delimiter is a step-by-step prompt.
  label: gsm8k_cot
  dataset_uri: local_data/symbolic_problem_solving/gsm8k.jsonl
  num_fewshot: [3]
  icl_task_type: question_answering
  # Single-quoted so the ' #' is not read as the start of a YAML comment.
  cot_delimiter: ' #### '
  # Double-quoted so that \n is an actual newline.
  continuation_delimiter: "\nA: Let's think step by step. "
  question_prelimiter: "Q: "
  # NOTE(review): presumably strings that end generation when produced --
  # confirm against the consumer.
  early_stopping_criteria:
  - "\n\n"
  - "Q:"
  - "Q: "
-
  # AGI Eval SAT math question answering, 3 few-shot examples; same prompt
  # delimiters as the gsm8k_cot task.
  label: agi_eval_sat_math_cot
  dataset_uri: local_data/symbolic_problem_solving/agi_eval_sat_math.jsonl
  num_fewshot: [3]
  icl_task_type: question_answering
  # Single-quoted so the ' #' is not read as the start of a YAML comment.
  cot_delimiter: ' #### '
  # Double-quoted so that \n is an actual newline.
  continuation_delimiter: "\nA: Let's think step by step. "
  question_prelimiter: "Q: "
  # NOTE(review): presumably strings that end generation when produced --
  # confirm against the consumer.
  early_stopping_criteria:
  - "\n\n"
  - "Q:"
  - "Q: "
-
  # AQuA question answering, 3 few-shot examples; same prompt delimiters as
  # the gsm8k_cot task.
  label: aqua_cot
  dataset_uri: local_data/symbolic_problem_solving/aqua.jsonl
  num_fewshot: [3]
  icl_task_type: question_answering
  # Single-quoted so the ' #' is not read as the start of a YAML comment.
  cot_delimiter: ' #### '
  # Double-quoted so that \n is an actual newline.
  continuation_delimiter: "\nA: Let's think step by step. "
  question_prelimiter: "Q: "
  # NOTE(review): presumably strings that end generation when produced --
  # confirm against the consumer.
  early_stopping_criteria:
  - "\n\n"
  - "Q:"
  - "Q: "
-
  # SVAMP question answering, 3 few-shot examples. Unlike the other *_cot
  # tasks in this file, the continuation delimiter is a formula prompt.
  label: svamp_cot
  dataset_uri: local_data/symbolic_problem_solving/svamp.jsonl
  num_fewshot: [3]
  icl_task_type: question_answering
  # Double-quoted so that \n is an actual newline.
  continuation_delimiter: "\nUsing the formula below:\n"
  # Single-quoted so the ' #' is not read as the start of a YAML comment.
  cot_delimiter: ' #### '
  question_prelimiter: "Q: "
  # NOTE(review): presumably strings that end generation when produced --
  # confirm against the consumer.
  early_stopping_criteria:
  - "\n\n"
  - "Q:"
  - "Q: "
-
  # GPQA (main set) as a multiple-choice task, 5 few-shot examples.
  # NOTE(review): this dataset lives under gpqa_data/ rather than
  # local_data/ like the other tasks -- confirm the path is intended.
  label: gpqa_main
  dataset_uri: gpqa_data/gpqa_main.jsonl
  num_fewshot: [5]
  icl_task_type: multiple_choice
  # Double-quoted so that \n is an actual newline.
  continuation_delimiter: "\nAnswer: "
-
  # GPQA (diamond set) as a multiple-choice task, 5 few-shot examples.
  # NOTE(review): this dataset lives under gpqa_data/ rather than
  # local_data/ like the other tasks -- confirm the path is intended.
  label: gpqa_diamond
  dataset_uri: gpqa_data/gpqa_diamond.jsonl
  num_fewshot: [5]
  icl_task_type: multiple_choice
  # Double-quoted so that \n is an actual newline.
  continuation_delimiter: "\nAnswer: "
-
  # TriviaQA subset as a question-answering task, 3 few-shot examples.
  # No delimiters or stopping criteria are set for this task in this file.
  label: triviaqa_sm_sub
  dataset_uri: local_data/world_knowledge/triviaqa_sm_sub.jsonl
  num_fewshot: [3]
  icl_task_type: question_answering