fix: 降低 expert 合并阈值 0.97→0.90(过高导致几乎无合并)

This commit is contained in:
2026-06-14 11:32:19 +08:00
parent 3e1d5b8e59
commit 1e3b09e4cc
+1 -1
View File
@@ -502,7 +502,7 @@ def load_model(ckpt_path, device='cuda:0'):
 print("[INFO] Model converted to FP16 (embedding kept in FP32)")
 # === 按 Expert 权重相似度合并冗余 expert ===
-_merge_experts(model, sim_threshold=0.97)
+_merge_experts(model, sim_threshold=0.90)
 else:
 print(f"[WARNING] Checkpoint {ckpt_path} not found, using random weights")