perf: 降低合并阈值 0.85→0.80(继续探底)
This commit is contained in:
+1
-1
@@ -502,7 +502,7 @@ def load_model(ckpt_path, device='cuda:0'):
|
||||
print("[INFO] Model converted to FP16 (embedding kept in FP32)")
|
||||
|
||||
# === 按 Expert 权重相似度合并冗余 expert ===
|
||||
-_merge_experts(model, sim_threshold=0.85)
|
||||
+_merge_experts(model, sim_threshold=0.80)
|
||||
else:
|
||||
print(f"[WARNING] Checkpoint {ckpt_path} not found, using random weights")
|
||||
|
||||
|
||||
Reference in New Issue
Block a user