fix: 回退合并阈值到 0.90(甜点值,58.86 最优)

This commit is contained in:
2026-06-14 12:24:10 +08:00
parent e3590e6bda
commit 2ebb336e27
+1 -1
View File
@@ -502,7 +502,7 @@ def load_model(ckpt_path, device='cuda:0'):
print("[INFO] Model converted to FP16 (embedding kept in FP32)")
# === 按 Expert 权重相似度合并冗余 expert ===
-_merge_experts(model, sim_threshold=0.80)
+_merge_experts(model, sim_threshold=0.90)
else:
print(f"[WARNING] Checkpoint {ckpt_path} not found, using random weights")