diff --git a/.github/CODEOWNERS b/.github/CODEOWNERS new file mode 100644 index 0000000..0e93827 --- /dev/null +++ b/.github/CODEOWNERS @@ -0,0 +1,2 @@ +# Default owner for all paths. +* @haizhongzheng diff --git a/examples/code-multi-agent/qwen3-8b-codegen-verifier-m2po-full-2node/scripts/run_qwen3-8b-codegen-verifier-m2po-full-2node.sh b/examples/code-multi-agent/qwen3-8b-codegen-verifier-m2po-full-2node/scripts/run_qwen3-8b-codegen-verifier-m2po-full-2node.sh index 1224ba2..2db8220 100755 --- a/examples/code-multi-agent/qwen3-8b-codegen-verifier-m2po-full-2node/scripts/run_qwen3-8b-codegen-verifier-m2po-full-2node.sh +++ b/examples/code-multi-agent/qwen3-8b-codegen-verifier-m2po-full-2node/scripts/run_qwen3-8b-codegen-verifier-m2po-full-2node.sh @@ -146,6 +146,7 @@ WEIGHT_TRANSFER_HTTP_PORT="${WEIGHT_TRANSFER_HTTP_PORT_MODEL0}" \ examples/launch_trainer.py \ --config "${EXPERIMENT_CONFIG}" \ --trainer trainer_model0 \ + "$@" \ 2>&1 | tee "${LOG_DIR}/trainer_model0.log" & sleep 3 @@ -158,4 +159,5 @@ WEIGHT_TRANSFER_HTTP_PORT="${WEIGHT_TRANSFER_HTTP_PORT_MODEL1}" \ examples/launch_trainer.py \ --config "${EXPERIMENT_CONFIG}" \ --trainer trainer_model1 \ + "$@" \ 2>&1 | tee "${LOG_DIR}/trainer_model1.log" diff --git a/examples/search/qwen2.5-7b-instruct-m2po-delta/scripts/run_qwen2.5-7b-instruct-m2po-delta.sh b/examples/search/qwen2.5-7b-instruct-m2po-delta/scripts/run_qwen2.5-7b-instruct-m2po-delta.sh index 706009b..629b89f 100755 --- a/examples/search/qwen2.5-7b-instruct-m2po-delta/scripts/run_qwen2.5-7b-instruct-m2po-delta.sh +++ b/examples/search/qwen2.5-7b-instruct-m2po-delta/scripts/run_qwen2.5-7b-instruct-m2po-delta.sh @@ -134,4 +134,5 @@ WEIGHT_TRANSFER_HTTP_PORT="${WEIGHT_TRANSFER_HTTP_PORT_MODEL0}" \ examples/launch_trainer.py \ --config "${EXPERIMENT_CONFIG}" \ --trainer trainer_model0 \ + "$@" \ 2>&1 | tee "${LOG_DIR}/trainer_model0.log" diff --git a/examples/search/qwen2.5-7b-instruct-m2po-full/scripts/run_qwen2.5-7b-instruct-m2po-full.sh b/examples/search/qwen2.5-7b-instruct-m2po-full/scripts/run_qwen2.5-7b-instruct-m2po-full.sh index 318bffb..66fdc06 100755 --- a/examples/search/qwen2.5-7b-instruct-m2po-full/scripts/run_qwen2.5-7b-instruct-m2po-full.sh +++ b/examples/search/qwen2.5-7b-instruct-m2po-full/scripts/run_qwen2.5-7b-instruct-m2po-full.sh @@ -134,4 +134,5 @@ WEIGHT_TRANSFER_HTTP_PORT="${WEIGHT_TRANSFER_HTTP_PORT_MODEL0}" \ examples/launch_trainer.py \ --config "${EXPERIMENT_CONFIG}" \ --trainer trainer_model0 \ + "$@" \ 2>&1 | tee "${LOG_DIR}/trainer_model0.log"