fix: 降低 expert 合并阈值 0.97→0.90(过高导致几乎无合并)
This commit is contained in:
+1
-1
@@ -502,7 +502,7 @@ def load_model(ckpt_path, device='cuda:0'):
|
|||||||
print("[INFO] Model converted to FP16 (embedding kept in FP32)")
|
print("[INFO] Model converted to FP16 (embedding kept in FP32)")
|
||||||
|
|
||||||
# === 按 Expert 权重相似度合并冗余 expert ===
|
# === 按 Expert 权重相似度合并冗余 expert ===
|
||||||
_merge_experts(model, sim_threshold=0.97)
|
_merge_experts(model, sim_threshold=0.90)
|
||||||
else:
|
else:
|
||||||
print(f"[WARNING] Checkpoint {ckpt_path} not found, using random weights")
|
print(f"[WARNING] Checkpoint {ckpt_path} not found, using random weights")
|
||||||
|
|
||||||
|
|||||||
Reference in New Issue
Block a user