Skip to content

Commit b5f0e8c

Browse files
author
Vincent Moens
committed
Update
[ghstack-poisoned]
1 parent 0a10089 commit b5f0e8c

File tree

1 file changed

+2
-1
lines changed

1 file changed

+2
-1
lines changed

sota-implementations/llm/grpo_mlgym_singlegpu.py

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -39,7 +39,7 @@
 39  39    parser.add_argument("--batch_size", type=int, default=1)
 40  40    parser.add_argument("--epochs", type=int, default=1)
 41  41    parser.add_argument("--repeats", type=int, default=16)
 42      - parser.add_argument("--num_envs", type=int, default=32)
     42  + parser.add_argument("--num_envs", type=int, default=1)
 43  43    parser.add_argument("--steps_per_batch", type=int, default=64)
 44  44    parser.add_argument("--optim_batch_size", type=int, default=4)
 45  45    # parser.add_argument("--model_name", type=str, default="gpt2")
# parser.add_argument("--model_name", type=str, default="gpt2")
@@ -106,6 +106,7 @@ def make_env(tasks: list[str], tokenizer: PreTrainedTokenizer, transform: Transf
106 106    total_dialog_turns=1_000_000,
107 107    async_envs=True,
108 108    replay_buffer=rb,
    109  + yield_completed_trajectories=True,
109 110    )
110 111    for d in collector:
111 112    print(d)

0 commit comments

Comments
 (0)