File tree Expand file tree Collapse file tree
tutorial/example_deep_finance Expand file tree Collapse file tree Original file line number Diff line number Diff line change @@ -22,11 +22,16 @@ NUM_REPEAT=4 # group size,每个query rollout NUM_REPEAT次
2222TRAIN_BATCH_SIZE=32 # 训练batchsize
2323NUM_STEPS=6 # 每个样本step轮数
2424DEEPFINANCE_TOOL_RESULT_MAX_CHARS=10000
25+
2526# 主目录
2627export AJET_ROOT=" /mnt/data_cpfs/taoshuchang.tsc/deepresearch/AgentJet"
28+
29+ NNODES=${WORLD_SIZE}
30+
2731# 涉密的配置(API_KEY以及模型、数据位置)从.env读取
2832cd ${AJET_ROOT}
2933source .venv/bin/activate
34+
3035# API密钥配置 - 从 .env 文件加载
3136ENV_FILE=" ${AJET_ROOT} /.env"
3237if [ -f " $ENV_FILE " ]; then
@@ -112,12 +117,6 @@ ENV_SERVICE_LOG="${LOG_DIR}/env_service_${SUFFIX}_${CURRENT_TIME}.log"
112117TRAIN_LOG=" ${LOG_DIR} /train_${SUFFIX} _${CURRENT_TIME} .log"
113118
114119# 多机训练参数配置
115- if [ -z " ${WORLD_SIZE} " ]; then
116- echo " ERROR: WORLD_SIZE environment variable is not set!"
117- echo " Please ensure this script is run in a multi-node environment (e.g., PAI-DLC, SLURM)"
118- exit 1
119- fi
120- NNODES=${WORLD_SIZE}
121120GPUS_PER_NODE=8
122121EXPECTED_WORKERS=$WORLD_SIZE
123122
You can’t perform that action at this time.
0 commit comments