From 654fa1792379d5fff3dc036dcb1445cf0f365fd4 Mon Sep 17 00:00:00 2001
From: Aurora
Date: Sat, 6 Sep 2025 16:17:22 +0800
Subject: [PATCH] update

---
 run_file/experiment_1_4_10.sh | 14 +++++++-------
 1 file changed, 7 insertions(+), 7 deletions(-)

diff --git a/run_file/experiment_1_4_10.sh b/run_file/experiment_1_4_10.sh
index d0aa2ed..e32733d 100644
--- a/run_file/experiment_1_4_10.sh
+++ b/run_file/experiment_1_4_10.sh
@@ -40,8 +40,8 @@ LOG_FILE="$LOG_DIR/experiment.log"
 # ----------------------------------------------------------------------------
 # 🤖 硬件配置
 # ----------------------------------------------------------------------------
-CUDA_VISIBLE_DEVICES="0,1,2,3"
-NUM_PROCESSES="4"
+CUDA_VISIBLE_DEVICES="0,1"
+NUM_PROCESSES="2"
 MIXED_PRECISION="bf16"
 MAIN_PROCESS_PORT="29500"
 
@@ -66,9 +66,9 @@ DISABLE_DB="false"
 # 🤖 训练超参数
 # ----------------------------------------------------------------------------
 EPOCHS="3"
-EMBEDDING_EPOCH="42"
-BATCH_SIZE="4" # 🔥 降低批次大小以适应更复杂的计算
-ACCUMULATION_STEPS="4" # 🔥 增加累积步数保持有效批次大小
+EMBEDDING_EPOCH="2"
+BATCH_SIZE="42" # 🔥 降低批次大小以适应更复杂的计算
+ACCUMULATION_STEPS="8" # 🔥 增加累积步数保持有效批次大小
 LEARNING_RATE="2e-4" # 🔥 适度降低学习率提升稳定性
 DTYPE="bfloat16"
 GRAD_CLIP="1.0"
@@ -80,8 +80,8 @@ SIMILARITY_LOSS_COEF="0.15" # 🔥 相似度损失系数(核心损失)
 DIVERSITY_LOSS_COEF="0.08" # 🔥 多样性损失系数(避免候选重复)
 
 # 数据和缓存路径
-DATA_PATH="/home/zym/Code/stable/merged_pretrain.jsonl"
-DATABASE_INIT_PATH="/home/zym/Code/stable/sentence_trex_data.json"
+DATA_PATH="dataset/stable/merged_pretrain.jsonl"
+DATABASE_INIT_PATH="dataset/stable/sentence_trex_data.json"
 CLUSTER_CACHE_PATH="None" # 禁用聚类缓存
 VAL_DATA_PATH="dataset/stable/eval_data.json"