Skip to content

Commit 60db2a9

Browse files
[GRPO] Make dataloader deterministic (#609)
Co-authored-by: Felipe Mello <fmellomascarenhas@gmail.com>
1 parent 9a05f62 commit 60db2a9

File tree

1 file changed

+3
-1
lines changed

1 file changed

+3
-1
lines changed

apps/grpo/main.py

Lines changed: 3 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -262,6 +262,7 @@ class DatasetActor(ForgeActor):
262 262       data_split: str = "train"
263 263       streaming: bool = True
264 264       model: str = "Qwen/Qwen3-1.7B"
    265 +     seed: int = 36
265 266
266 267       @endpoint
267 268       async def setup(self):
@@ -291,7 +292,8 @@ def gsm8k_transform(sample):
291 292               self.path, self.revision, split=self.data_split, streaming=self.streaming
292 293           )
293 294           self._base_dataset = self._base_dataset.map(gsm8k_transform)
294     -         self._base_dataset = self._base_dataset.shuffle()
    295 +         self._base_dataset = self._base_dataset.shuffle(seed=self.seed)
    296 +         self._base_dataset.set_epoch(self._epoch)
295 297           self._iterator = iter(self._base_dataset)
296 298
297 299       @endpoint

0 commit comments

Comments
 (0)