Skip to content

Commit

Permalink
drat-drat
Browse files Browse the repository at this point in the history
  • Loading branch information
dchaplinsky committed Sep 13, 2023
1 parent 3a6ee1d commit b54e931
Show file tree
Hide file tree
Showing 2 changed files with 3 additions and 2 deletions.
Original file line number Diff line number Diff line change
Expand Up @@ -23,7 +23,7 @@
"warmup_steps": 2000,
"model_name_or_path": "exps/gpt2-small.malyuk.nofilter.wechsel.largedict.sophia.tpu.run1",
"preprocessing_num_workers": 96,
- "bf6": true,
+ "bf16": true,
"adam_beta1": 0.965,
"adam_beta2": 0.99,
"optimizer": "sophia"
Expand Down
3 changes: 2 additions & 1 deletion run_clm.py
Original file line number Diff line number Diff line change
Expand Up @@ -262,7 +262,8 @@ def main():

for (name, path) in [("train", data_args.train_file), ("validation", data_args.validation_file)]:
if path.endswith(".txt"):
- raw_datasets[name] = datasets.Dataset.from_dict({"text": [open(path).read()], "id": [0]})
+ # raw_datasets[name] = datasets.Dataset.from_dict({"text": [open(path).read()], "id": [0]})
+ raw_datasets[name] = datasets.Dataset.from_dict({"text": [open(path).read()], "compound_id": [0], "id": [0]})
else:
raw_datasets[name] = datasets.load_from_disk(data_args.train_file)

Expand Down

0 comments on commit b54e931

Please sign in to comment.