We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent b247526 commit 0b57642 Copy full SHA for 0b57642
.github/unittest/linux_libs/scripts_llm/run_test.sh
@@ -27,13 +27,10 @@ python -c "import transformers, datasets"
27
28
pytest test/test_rlhf.py --instafail -v --durations 200 --capture no --error-for-skips
29
30
-pytest examples/rlhf/train_rlhf.py \
+python examples/rlhf/train_rlhf.py \
31
sys.device=cuda:0 sys.ref_device=cuda:0 \
32
model.name_or_path=gpt2 train.max_epochs=2 \
33
data.batch_size=2 train.ppo.ppo_batch_size=2 \
34
train.ppo.ppo_num_epochs=1 reward_model.name_or_path= \
35
train.ppo.episode_length=8 train.ppo.num_rollouts_per_epoch=4 \
36
data.block_size=110 io.logger=csv
37
-
38
-coverage combine
39
-coverage xml -i
0 commit comments