diff --git a/examples/megatron/scripts/train_rlhf_llama.sh b/examples/megatron/scripts/train_rlhf_llama.sh index 93778d28..82ad5d15 100644 --- a/examples/megatron/scripts/train_rlhf_llama.sh +++ b/examples/megatron/scripts/train_rlhf_llama.sh @@ -115,4 +115,4 @@ num_gpu=${num_gpu} \ data_path=${DATASET_PATH} \ eval_data_path=${EVAL_DATASET_PATH} \ sample_per_episode=${sample_per_episode} \ -python entry/train_rlhf.py -c $configs 2>&1 | tee -a ${log_file} ; exit ${PIPESTATUS[0]} \ No newline at end of file +python entry/train_rlhf.py -c $configs 2>&1 | tee -a ${log_file} ; exit ${PIPESTATUS[0]} diff --git a/examples/megatron/tests/test_unbalanced_param_sync.sh b/examples/megatron/tests/test_unbalanced_param_sync.sh index 19f2bcdc..d207c282 100644 --- a/examples/megatron/tests/test_unbalanced_param_sync.sh +++ b/examples/megatron/tests/test_unbalanced_param_sync.sh @@ -55,4 +55,4 @@ num_episode=${num_ppo_episode:-0} \ data_path=${DATASET_PATH} \ eval_data_path=${EVAL_DATASET_PATH} \ sample_per_episode=${sample_per_episode} \ -python tests/test_unbalanced_param_sync.py -c $config_file 2>&1 | tee ${output_dir}/log_${RANK}.log ; exit ${PIPESTATUS[0]} \ No newline at end of file +python tests/test_unbalanced_param_sync.py -c $config_file 2>&1 | tee ${output_dir}/log_${RANK}.log ; exit ${PIPESTATUS[0]}