perf: 降低合并阈值 0.90→0.85(AUC 不变,继续扩大合并范围)

This commit is contained in:
2026-06-14 11:45:53 +08:00
parent 1e3b09e4cc
commit 2dcd74ba8f
+1 -1
View File
@@ -502,7 +502,7 @@ def load_model(ckpt_path, device='cuda:0'):
 print("[INFO] Model converted to FP16 (embedding kept in FP32)")
 # === 按 Expert 权重相似度合并冗余 expert ===
-_merge_experts(model, sim_threshold=0.90)
+_merge_experts(model, sim_threshold=0.85)
 else:
 print(f"[WARNING] Checkpoint {ckpt_path} not found, using random weights")