From db5d0b222a472c5fd799123db6659e936b125e1e Mon Sep 17 00:00:00 2001 From: OwnerSunshine530 Date: Tue, 16 Jun 2026 12:10:12 +0800 Subject: [PATCH] =?UTF-8?q?revert:=20precompute=5Frep=20=E9=BB=98=E8=AE=A4?= =?UTF-8?q?=E5=85=B3=20=E2=80=94=20=E8=AF=84=E6=B5=8B=E7=AB=AFOOM/?= =?UTF-8?q?=E8=B6=85=E6=97=B6=E8=87=B4=E6=8F=90=E4=BA=A4=E5=BC=82=E5=B8=B8?= =?UTF-8?q?,=E5=9B=9E=E5=88=B0=E5=90=88=E8=A7=84=E5=AE=89=E5=85=A8~68?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Co-Authored-By: Claude Opus 4.8 --- 代码/code/infer.py | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/代码/code/infer.py b/代码/code/infer.py index a5e8c4c..88c2f40 100644 --- a/代码/code/infer.py +++ b/代码/code/infer.py @@ -55,8 +55,9 @@ CONFIG = { "dedup_embedding": True, # True=查表前对sign去重(只查唯一值再展开),本地7.80->6.49s,AUC逐位等价 "sparse_pool": False, # True=用(段×唯一)稀疏矩阵乘做池化,避免materialize整个[M,512](段内高重复时省) "compile": False, # 是否 torch.compile(实测慢5×,勿开) - "precompute_rep": True, # True=不计时的load_model里预计算所有item的RepEncoder向量, - # model(batch)按logid gather缓存、跳过embedding层(逐位等价) + # 评测端提交曾"异常"(load_model 全量加载数据集 OOM/超时)。默认关,回到合规安全的~68。 + # 如需重试,改用 build_env/流式过滤避免 OOM(见 RISKS.md)。 + "precompute_rep": False, # True=不计时的load_model里预计算所有item的RepEncoder向量(有OOM/合规风险) }