-
Notifications
You must be signed in to change notification settings - Fork 17
# Pull Request: Deep Finance Judge System Enhancement #10
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
Changes from all commits
bac05b5
ba41164
c7ca8c7
7f2b017
9dd3c42
757f8a1
079e4bd
bcce8f0
4662d63
de81c1d
248acc4
9d651fd
7475ecc
b95d491
f20ab91
ea87d4b
3082bca
ef44b63
0889483
db7114c
5a25550
623b7d9
0aaab86
04f4959
d0ff68b
1c356d7
37dcbcc
529ae7e
f4eb231
1e07515
08ba184
3d55692
a478827
88be3e4
fb41962
a1f909b
8d2e5d7
3c85960
9b541c5
06fda5f
63cc682
c9b87ac
3bd4c7d
8a18d40
835bdd8
11ed325
a500e90
d9cbdc0
4538f5a
6f0c420
818a4f7
1bb7f60
460318f
57a3a54
beaa540
13d7d82
eb6e2af
4722a79
55d0ad1
68e25ae
3fb724a
6b9eb50
efa7fac
9e73442
f785b22
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1,38 @@ | ||
| *.7z filter=lfs diff=lfs merge=lfs -text | ||
| *.arrow filter=lfs diff=lfs merge=lfs -text | ||
| *.bin filter=lfs diff=lfs merge=lfs -text | ||
| *.bin.* filter=lfs diff=lfs merge=lfs -text | ||
| *.bz2 filter=lfs diff=lfs merge=lfs -text | ||
| *.ftz filter=lfs diff=lfs merge=lfs -text | ||
| *.gz filter=lfs diff=lfs merge=lfs -text | ||
| *.h5 filter=lfs diff=lfs merge=lfs -text | ||
| *.joblib filter=lfs diff=lfs merge=lfs -text | ||
| *.lfs.* filter=lfs diff=lfs merge=lfs -text | ||
| *.model filter=lfs diff=lfs merge=lfs -text | ||
| *.msgpack filter=lfs diff=lfs merge=lfs -text | ||
| *.onnx filter=lfs diff=lfs merge=lfs -text | ||
| *.ot filter=lfs diff=lfs merge=lfs -text | ||
| *.parquet filter=lfs diff=lfs merge=lfs -text | ||
| *.pb filter=lfs diff=lfs merge=lfs -text | ||
| *.pt filter=lfs diff=lfs merge=lfs -text | ||
| *.pth filter=lfs diff=lfs merge=lfs -text | ||
| *.rar filter=lfs diff=lfs merge=lfs -text | ||
| saved_model/**/* filter=lfs diff=lfs merge=lfs -text | ||
| *.tar.* filter=lfs diff=lfs merge=lfs -text | ||
| *.tflite filter=lfs diff=lfs merge=lfs -text | ||
| *.tgz filter=lfs diff=lfs merge=lfs -text | ||
| *.wasm filter=lfs diff=lfs merge=lfs -text | ||
| *.xz filter=lfs diff=lfs merge=lfs -text | ||
| *.zip filter=lfs diff=lfs merge=lfs -text | ||
| *.zstandard filter=lfs diff=lfs merge=lfs -text | ||
| *tfevents* filter=lfs diff=lfs merge=lfs -text | ||
| # Audio files - uncompressed | ||
| *.pcm filter=lfs diff=lfs merge=lfs -text | ||
| *.sam filter=lfs diff=lfs merge=lfs -text | ||
| *.raw filter=lfs diff=lfs merge=lfs -text | ||
| # Audio files - compressed | ||
| *.aac filter=lfs diff=lfs merge=lfs -text | ||
| *.flac filter=lfs diff=lfs merge=lfs -text | ||
| *.mp3 filter=lfs diff=lfs merge=lfs -text | ||
| *.ogg filter=lfs diff=lfs merge=lfs -text | ||
| *.wav filter=lfs diff=lfs merge=lfs -text |
Large diffs are not rendered by default.
| Original file line number | Diff line number | Diff line change |
|---|---|---|
|
|
@@ -15,17 +15,30 @@ JUDGE_CONCURRENCY=10 | |
| RM_WEIGHT=0.5 | ||
| PRESENTATION_QUALITY_WEIGHT=0.25 | ||
| GROUNDING_WEIGHT=0.25 | ||
| CGCV_WEIGHT=0.0 # 不使用 CGCV,设为 0 | ||
| AUDIT_WEIGHT=0.0 # 不使用 Audit,设为 0 | ||
| TRACEABILITY_WEIGHT=0.0 # 不使用 Traceability,设为 0 | ||
| EBTU_WEIGHT=0.0 # 不使用 EBTU,设为 0 | ||
|
|
||
| # 训练参数配置 | ||
| NUM_REPEAT=4 # group size,每个query rollout NUM_REPEAT次 | ||
| TRAIN_BATCH_SIZE=32 # 训练batchsize | ||
| NUM_STEPS=6 # 每个样本step轮数 | ||
| DEEPFINANCE_TOOL_RESULT_MAX_CHARS=10000 | ||
|
|
||
| # Env Service URL 配置 | ||
| ENV_SERVICE_URL="http://127.0.0.1:8080" # 环境服务地址 | ||
|
|
||
| # 主目录(需要更改) | ||
| export AJET_ROOT="/mnt/data_cpfs/taoshuchang.tsc/deepresearch/AgentJet_new" | ||
|
|
||
| NNODES=${WORLD_SIZE} | ||
| # 单机调试配置(默认值) | ||
| NNODES=${WORLD_SIZE:-1} | ||
| GPUS_PER_NODE=8 | ||
| CURRENT_TIME=$(date "+%Y%m%d_%H%M%S") | ||
| LOG_DIR="${AJET_ROOT}/logs/${PREFIX}" | ||
| TRAIN_LOG="${LOG_DIR}/train_${SUFFIX}_${CURRENT_TIME}.log" | ||
| mkdir -p ${LOG_DIR} | ||
|
|
||
| # 涉密的配置(API_KEY以及模型、数据位置)从.env读取 | ||
| cd ${AJET_ROOT} | ||
|
|
@@ -42,6 +55,9 @@ else | |
| echo -e "\033[31m警告: 找不到 .env 文件: $ENV_FILE\033[0m" | ||
| fi | ||
|
|
||
| export MODEL_PATH="/mnt/data_cpfs/taoshuchang.tsc/models/Qwen3-8B" | ||
|
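There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. The `MODEL_PATH` export is hard-coded here, after the `.env` file has been loaded. It would be more robust to rely on the value from the `.env` file. |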
||
|
|
||
|
|
||
| #=============================================================================== | ||
| # 2. 动态生成配置文件 (从yaml template生成yaml) | ||
| #=============================================================================== | ||
|
|
@@ -57,6 +73,10 @@ sed -e "s|{{SUFFIX}}|${SUFFIX}|g" \ | |
| -e "s|{{RM_WEIGHT}}|${RM_WEIGHT}|g" \ | ||
| -e "s|{{PRESENTATION_QUALITY_WEIGHT}}|${PRESENTATION_QUALITY_WEIGHT}|g" \ | ||
| -e "s|{{GROUNDING_WEIGHT}}|${GROUNDING_WEIGHT}|g" \ | ||
| -e "s|{{CGCV_WEIGHT}}|${CGCV_WEIGHT}|g" \ | ||
| -e "s|{{AUDIT_WEIGHT}}|${AUDIT_WEIGHT}|g" \ | ||
| -e "s|{{TRACEABILITY_WEIGHT}}|${TRACEABILITY_WEIGHT}|g" \ | ||
| -e "s|{{EBTU_WEIGHT}}|${EBTU_WEIGHT}|g" \ | ||
| -e "s|{{OPENJUDGE_LLM}}|${OPENJUDGE_LLM}|g" \ | ||
| -e "s|{{RM_LLM}}|${RM_LLM}|g" \ | ||
| -e "s|{{JUDGE_CONCURRENCY}}|${JUDGE_CONCURRENCY}|g" \ | ||
|
|
@@ -68,10 +88,11 @@ sed -e "s|{{SUFFIX}}|${SUFFIX}|g" \ | |
| -e "s|{{TRAIN_REF_ANS_PATH}}|${TRAIN_REF_ANS_PATH}|g" \ | ||
| -e "s|{{VAL_REF_ANS_PATH}}|${VAL_REF_ANS_PATH}|g" \ | ||
| -e "s|{{CKPT_SAVE_PATH}}|${CKPT_SAVE_PATH}|g" \ | ||
| -e "s|{{ENV_SERVICE_URL}}|${ENV_SERVICE_URL}|g" \ | ||
| ${AJET_ROOT}/${CONFIG_TEMPLATE} > ${CONFIG_FILE} | ||
|
|
||
| echo "配置文件已生成: ${CONFIG_FILE}" | ||
| echo "参数确认: RM=${RM_WEIGHT}, PresentationQuality=${PRESENTATION_QUALITY_WEIGHT}, Grounding=${GROUNDING_WEIGHT}, OpenJudge=${OPENJUDGE_LLM}, RM_LLM=${RM_LLM}" | ||
| echo "参数确认: RM=${RM_WEIGHT}, PresentationQuality=${PRESENTATION_QUALITY_WEIGHT}, Grounding=${GROUNDING_WEIGHT}, CGCV=${CGCV_WEIGHT}, Audit=${AUDIT_WEIGHT}, Traceability=${TRACEABILITY_WEIGHT}, EBTU=${EBTU_WEIGHT}, OpenJudge=${OPENJUDGE_LLM}, RM_LLM=${RM_LLM}" | ||
|
|
||
|
|
||
| #=============================================================================== | ||
|
|
@@ -115,15 +136,16 @@ export RAY_CLUSTER_MODE="multi_node" | |
| #=============================================================================== | ||
| # 6. 主流程 | ||
| #=============================================================================== | ||
| log "节点数: ${NNODES}, 每节点GPU数: ${GPUS_PER_NODE}" | ||
| mkdir -p ${LOG_DIR} | ||
| mkdir -p $(dirname ${CONFIG_FILE}) | ||
| log "单机调试模式: NNODES=${NNODES}, GPUS_PER_NODE=${GPUS_PER_NODE}" | ||
|
|
||
| #=============================================================================== | ||
| # 6.1 Master 节点启动流程 | ||
| #=============================================================================== | ||
| # 启动训练任务(最核心) | ||
| # 请注意只有单节点需要--with-ray 多节点应该删除 | ||
| python ajet/launcher.py \ | ||
| --conf ${CONFIG_FILE} \ | ||
| --with-deepfinance \ | ||
| --with-ray \ | ||
| --backbone="debug" \ | ||
| 2>&1 | tee ${TRAIN_LOG} | ||
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -1,11 +1,15 @@ | ||
| # 使得可以通过 from judge import PresentationQualityGrader 直接引用 | ||
| from .grounding.grader import GroundingGrader | ||
| from .presentation_quality.grader import PresentationQualityGrader | ||
| from .cgcv.grader import CGCVGrader | ||
| from .audit.grader import AuditGrader | ||
| from .traceability.grader import TraceabilityRewardGrader | ||
| from .ebtu.grader import EBTUTraceabilityGrader | ||
| # from .research_depth.grader import ResearchDepthGrader | ||
| # from .research_breadth.grader import ResearchBreadthGrader | ||
|
|
||
| # 以后添加了其他 grader 也可以加在这里 | ||
| # from .grounding.grader import GroundingGrader | ||
| # from .research_breadth.grader import ResearchBreadthGrader | ||
| # __all__ = ["PresentationQualityGrader", "GroundingGrader", "ResearchDepthGrader", "ResearchBreadthGrader"] | ||
| __all__ = ["PresentationQualityGrader", "GroundingGrader"] | ||
| __all__ = ["PresentationQualityGrader", "GroundingGrader", "CGCVGrader", "AuditGrader", "TraceabilityRewardGrader", "EBTUTraceabilityGrader"] |
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1,4 @@ | ||
| """Audit Grader - 引用逻辑审计""" | ||
| from .grader import AuditGrader | ||
|
|
||
| __all__ = ["AuditGrader"] |
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
This logging statement for tool statistics has been commented out. While this reduces log verbosity, it's generally better to control logging output through configuration or log levels rather than commenting out code. This allows for easily re-enabling detailed logs for debugging without code changes.
For example, you could use a logger with a configurable level, like
logger.debug(...), or wrap the log statement in a conditional check based on a configuration flag.