Skip to content

Commit 460318f

Browse files
committed
chore(config): update experiment suffix, prefix, and weight parameters
1 parent 1bb7f60 commit 460318f

File tree

1 file changed

+10
-58
lines changed

1 file changed

+10
-58
lines changed

tutorial/example_deep_finance/deep_finance_single.sh

Lines changed: 10 additions & 58 deletions
Original file line number | Diff line number | Diff line change
@@ -3,27 +3,27 @@ set -e
3 3
#===============================================================================
4 4
# 1. 配置区域 - 用户只需修改这里
5 5
#===============================================================================
6-
SUFFIX="ajet_deep_finance" # 实验后缀,影响所有日志和实验名称
7-
PREFIX="open" # 实验前缀,影响日志和实验所在文件夹
6+
SUFFIX="newjudge" # 实验后缀,影响所有日志和实验名称
7+
PREFIX="ajet_newjudge" # 实验前缀,影响日志和实验所在文件夹
8 8

9 9
# OpenJudge 模型配置
10 10
OPENJUDGE_LLM='qwen-flash' # OpenJudge 评分模型
11 11
RM_LLM='qwen-max' # RM Gallery 评分模型
12 12
JUDGE_CONCURRENCY=10
13 13

14 14
# 奖励权重配置
15-
RM_WEIGHT=0.4
16-
CITATION_AUDIT_WEIGHT=0.2
17-
REPORT_RESOLUTION_WEIGHT=0.2
18-
TRAJECTORY_FAITHFULNESS_WEIGHT=0.2
15+
RM_WEIGHT=0.5
16+
PRESENTATION_QUALITY_WEIGHT=0.25
17+
GROUNDING_WEIGHT=0.25
19 18

20 19
# 训练参数配置
21 20
NUM_REPEAT=4 # group size,每个query rollout NUM_REPEAT次
22 21
TRAIN_BATCH_SIZE=32 # 训练batchsize
23 22
NUM_STEPS=6 # 每个样本step轮数
24 23
DEEPFINANCE_TOOL_RESULT_MAX_CHARS=10000
25 24

26-
# 主目录
25+
# 主目录(需要更改)
26+
export AJET_ROOT="/mnt/data_cpfs/taoshuchang.tsc/deepresearch/AgentJet_new"
27 27

28 28
NNODES=${WORLD_SIZE}
29 29

@@ -55,70 +55,23 @@ sed -e "s|{{SUFFIX}}|${SUFFIX}|g" \
55 55
-e "s|{{MODEL_PATH}}|${MODEL_PATH}|g" \
56 56
-e "s|{{NNODES}}|${NNODES}|g" \
57 57
-e "s|{{RM_WEIGHT}}|${RM_WEIGHT}|g" \
58-
-e "s|{{CITATION_AUDIT_WEIGHT}}|${CITATION_AUDIT_WEIGHT}|g" \
58+
-e "s|{{PRESENTATION_QUALITY_WEIGHT}}|${PRESENTATION_QUALITY_WEIGHT}|g" \
59+
-e "s|{{GROUNDING_WEIGHT}}|${GROUNDING_WEIGHT}|g" \
59 60
-e "s|{{OPENJUDGE_LLM}}|${OPENJUDGE_LLM}|g" \
60 61
-e "s|{{RM_LLM}}|${RM_LLM}|g" \
61 62
-e "s|{{JUDGE_CONCURRENCY}}|${JUDGE_CONCURRENCY}|g" \
62-
-e "s|{{REPORT_RESOLUTION_WEIGHT}}|${REPORT_RESOLUTION_WEIGHT}|g" \
63-
-e "s|{{TRAJECTORY_FAITHFULNESS_WEIGHT}}|${TRAJECTORY_FAITHFULNESS_WEIGHT}|g" \
64 63
-e "s|{{NUM_REPEAT}}|${NUM_REPEAT}|g" \
65 64
-e "s|{{NUM_STEPS}}|${NUM_STEPS}|g" \
66 65
-e "s|{{TRAIN_BATCH_SIZE}}|${TRAIN_BATCH_SIZE}|g" \
67 66
-e "s|{{TRAIN_DATA_PATH}}|${TRAIN_DATA_PATH}|g" \
68 67
-e "s|{{VAL_DATA_PATH}}|${VAL_DATA_PATH}|g" \
69-
-e "s|{{ENV_SERVICE_URL}}|${ENV_SERVICE_URL}|g" \
70 68
-e "s|{{TRAIN_REF_ANS_PATH}}|${TRAIN_REF_ANS_PATH}|g" \
71 69
-e "s|{{VAL_REF_ANS_PATH}}|${VAL_REF_ANS_PATH}|g" \
72 70
-e "s|{{CKPT_SAVE_PATH}}|${CKPT_SAVE_PATH}|g" \
73 71
${AJET_ROOT}/${CONFIG_TEMPLATE} > ${CONFIG_FILE}
74 72

75 73
echo "配置文件已生成: ${CONFIG_FILE}"
76-
echo "参数确认: RM=${RM_WEIGHT}, Citation=${CITATION_AUDIT_WEIGHT}, OpenJudge=${OPENJUDGE_LLM}, RM_LLM=${RM_LLM}"
77-
78-
#===============================================================================
79-
# 3. 环境配置
80-
#===============================================================================
81-
# MongoDB 缓存配置
82-
CACHE_TYPE="mongodb"
83-
MONGO_URI="mongodb://${ADDR}:27117/"
84-
MONGO_DB_NAME="finworld_cache"
85-
MONGO_COLLECTION_NAME="tool_cache"
86-
export CACHE_TYPE MONGO_URI MONGO_DB_NAME MONGO_COLLECTION_NAME
87-
88-
# DeepFinance MCP 配置
89-
DEEPFINANCE_MCP_CONFIG="${AJET_ROOT}/tutorial/example_deep_finance/config/mcp_finance_tool_generated.json"
90-
91-
# 动态生成 MCP 配置文件
92-
mkdir -p $(dirname ${DEEPFINANCE_MCP_CONFIG})
93-
cat > ${DEEPFINANCE_MCP_CONFIG} << EOF
94-
{
95-
"mcpServers": {
96-
"flowllm": {
97-
"transport": "sse",
98-
"url": "http://${ADDR}:${MCP_PORT}/sse",
99-
"timeout": 600,
100-
"sse_read_timeout": 1200
101-
}
102-
}
103-
}
104-
EOF
105-
export DEEPFINANCE_MCP_CONFIG DEEPFINANCE_TOOL_RESULT_MAX_CHARS
106-
107-
# 其他服务配置
108-
HF_ENDPOINT="https://hf-mirror.com"
109-
ES_HOSTS="http://11.160.132.46:8200"
110-
export HF_ENDPOINT ES_HOSTS
111-
112-
# log 文件位置
113-
CURRENT_TIME=$(date "+%Y%m%d_%H%M%S")
114-
LOG_DIR="${AJET_ROOT}/logs/${PREFIX}"
115-
MASTER_IP_FILE="${LOG_DIR}/master-ip_${SUFFIX}.log"
116-
ENV_SERVICE_LOG="${LOG_DIR}/env_service_${SUFFIX}_${CURRENT_TIME}.log"
117-
TRAIN_LOG="${LOG_DIR}/train_${SUFFIX}_${CURRENT_TIME}.log"
118-
119-
# 多机训练参数配置
120-
GPUS_PER_NODE=8
121-
EXPECTED_WORKERS=$WORLD_SIZE
74+
echo "参数确认: RM=${RM_WEIGHT}, PresentationQuality=${PRESENTATION_QUALITY_WEIGHT}, Grounding=${GROUNDING_WEIGHT}, OpenJudge=${OPENJUDGE_LLM}, RM_LLM=${RM_LLM}"
122 75

123 76

124 77
#===============================================================================
@@ -162,7 +115,6 @@ export RAY_CLUSTER_MODE="multi_node"
162 115
#===============================================================================
163 116
# 6. 主流程
164 117
#===============================================================================
165-
log "开始多机多卡训练: ${SUFFIX}"
166 118
log "节点数: ${NNODES}, 每节点GPU数: ${GPUS_PER_NODE}"
167 119
mkdir -p ${LOG_DIR}
168 120
mkdir -p $(dirname ${CONFIG_FILE})

0 commit comments

Comments
 (0)