From 2dcd74ba8fc9c9ec6c73575a3058838e004c1fbc Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=E5=88=98=E8=88=AA=E5=AE=87?= <3364451258@qq.com> Date: Sun, 14 Jun 2026 11:45:53 +0800 Subject: [PATCH] =?UTF-8?q?perf:=20=E9=99=8D=E4=BD=8E=E5=90=88=E5=B9=B6?= =?UTF-8?q?=E9=98=88=E5=80=BC=200.90=E2=86=920.85=EF=BC=88AUC=20=E4=B8=8D?= =?UTF-8?q?=E5=8F=98=EF=BC=8C=E7=BB=A7=E7=BB=AD=E6=89=A9=E5=A4=A7=E5=90=88?= =?UTF-8?q?=E5=B9=B6=E8=8C=83=E5=9B=B4=EF=BC=89?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- 代码/code/infer.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/代码/code/infer.py b/代码/code/infer.py index 1745d7d..c24fb58 100644 --- a/代码/code/infer.py +++ b/代码/code/infer.py @@ -502,7 +502,7 @@ def load_model(ckpt_path, device='cuda:0'): print("[INFO] Model converted to FP16 (embedding kept in FP32)") # === 按 Expert 权重相似度合并冗余 expert === - _merge_experts(model, sim_threshold=0.90) + _merge_experts(model, sim_threshold=0.85) else: print(f"[WARNING] Checkpoint {ckpt_path} not found, using random weights")