diff --git a/代码/code/infer.py b/代码/code/infer.py index 6df0dd4..1745d7d 100644 --- a/代码/code/infer.py +++ b/代码/code/infer.py @@ -502,7 +502,7 @@ def load_model(ckpt_path, device='cuda:0'): print("[INFO] Model converted to FP16 (embedding kept in FP32)") # === 按 Expert 权重相似度合并冗余 expert === - _merge_experts(model, sim_threshold=0.97) + _merge_experts(model, sim_threshold=0.90) else: print(f"[WARNING] Checkpoint {ckpt_path} not found, using random weights")