alibaba
diff --git a/.github/workflows/codestyle_ci.yml
+1-1 b/.github/workflows/codestyle_ci.yml
+1-1
diff --git a/.github/workflows/pytyping_ci.yml
+1-1 b/.github/workflows/pytyping_ci.yml
+1-1
diff --git a/.github/workflows/unittest_ci.yml
+1-1 b/.github/workflows/unittest_ci.yml
+1-1
diff --git a/.github/workflows/unittest_cpu_ci.yml
+1-1 b/.github/workflows/unittest_cpu_ci.yml
+1-1
diff --git a/.pre-commit-config.yaml
+3-4 b/.pre-commit-config.yaml
+3-4
diff --git a/.pyre_configuration
+3-3 b/.pyre_configuration
+3-3
diff --git a/docker/Dockerfile
+6-6 b/docker/Dockerfile
+6-6
diff --git a/docs/source/feature/feature.md
+2-2 b/docs/source/feature/feature.md
+2-2
diff --git a/docs/source/models/deepfm.md
+1-1 b/docs/source/models/deepfm.md
+1-1
diff --git a/docs/source/models/dssm.md
+1-1 b/docs/source/models/dssm.md
+1-1
diff --git a/docs/source/models/multi_tower.md
+1-1 b/docs/source/models/multi_tower.md
+1-1
diff --git a/docs/source/quick_start/dlc_odps_dataset_tutorial.md
+1-1 b/docs/source/quick_start/dlc_odps_dataset_tutorial.md
+1-1
diff --git a/docs/source/quick_start/dlc_tutorial.md
+1-1 b/docs/source/quick_start/dlc_tutorial.md
+1-1
diff --git a/docs/source/quick_start/local_tutorial.md
+5-5 b/docs/source/quick_start/local_tutorial.md
+5-5
diff --git a/docs/source/quick_start/local_tutorial_u2i_vec.md
+2-2 b/docs/source/quick_start/local_tutorial_u2i_vec.md
+2-2
diff --git a/docs/source/usage/train.md
+1-1 b/docs/source/usage/train.md
+1-1
diff --git a/requirements/gpu.txt
+1-2 b/requirements/gpu.txt
+1-2
diff --git a/requirements/runtime.txt
+4-3 b/requirements/runtime.txt
+4-3
diff --git a/requirements/test.txt
+1-1 b/requirements/test.txt
+1-1
diff --git a/scripts/build_docker.sh
+5-5 b/scripts/build_docker.sh
+5-5
diff --git a/scripts/ci_test.sh
-4 b/scripts/ci_test.sh
-4
diff --git a/scripts/pyre_check.py
+8 b/scripts/pyre_check.py
+8
@@ -9,7 +9,7 @@ jobs:
   ci-test:
     runs-on: tzrec-codestyle-runner
     container:
-      image: mybigpai-public-registry.cn-beijing.cr.aliyuncs.com/easyrec/tzrec-devel:0.6
+      image: mybigpai-public-registry.cn-beijing.cr.aliyuncs.com/easyrec/tzrec-devel:0.7
     steps:
       - name: FetchCommit ${{ github.event.pull_request.head.sha }}
         uses: actions/checkout@v2
 
@@ -9,7 +9,7 @@ jobs:
   ci-test:
     runs-on: tzrec-codestyle-runner
     container:
-      image: mybigpai-public-registry.cn-beijing.cr.aliyuncs.com/easyrec/tzrec-devel:0.6
+      image: mybigpai-public-registry.cn-beijing.cr.aliyuncs.com/easyrec/tzrec-devel:0.7
     steps:
       - name: FetchCommit ${{ github.event.pull_request.head.sha }}
         uses: actions/checkout@v2
 
@@ -9,7 +9,7 @@ jobs:
   ci-test:
     runs-on: tzrec-runner
     container:
-      image: mybigpai-public-registry.cn-beijing.cr.aliyuncs.com/easyrec/tzrec-devel:0.6
+      image: mybigpai-public-registry.cn-beijing.cr.aliyuncs.com/easyrec/tzrec-devel:0.7
       options: --gpus all --ipc host
     steps:
       - name: FetchCommit ${{ github.event.pull_request.head.sha }}
 
@@ -9,7 +9,7 @@ jobs:
   ci-test:
     runs-on: tzrec-cpu-runner
     container:
-      image: mybigpai-public-registry.cn-beijing.cr.aliyuncs.com/easyrec/tzrec-devel:0.6-cpu
+      image: mybigpai-public-registry.cn-beijing.cr.aliyuncs.com/easyrec/tzrec-devel:0.7-cpu
       options: --ipc host
     steps:
       - name: FetchCommit ${{ github.event.pull_request.head.sha }}
 
@@ -6,11 +6,10 @@ repos:
         files: \.py$
         args: ["--license-filepath", "data/.license_header.txt", "--allow-past-years"]
   - repo: https://github.com/astral-sh/ruff-pre-commit
-    rev: v0.7.1
+    rev: v0.8.6
     hooks:
       - id: ruff
         args: [ --fix ]
-        exclude: tzrec/acc/_decompositions.py|tzrec/acc/_aten_lowering_pass.py
       - id: ruff-format
   - repo: https://github.com/pre-commit/pre-commit-hooks
     rev: v5.0.0
@@ -25,12 +24,12 @@ repos:
       - id: mixed-line-ending
         args: ["--fix=lf"]
   - repo: https://github.com/codespell-project/codespell
-    rev: v2.3.0
+    rev: v2.4.1
     hooks:
       - id: codespell
         args: ["--skip", "*.json", "-L", "TBE"]
   - repo: https://github.com/executablebooks/mdformat
-    rev: 0.7.18
+    rev: 0.7.22
     hooks:
     - id: mdformat
       additional_dependencies:
 
@@ -4,9 +4,9 @@
     "tzrec/*/*_test.py",
     "tzrec/tests/*.py",
     "tzrec/utils/load_class.py",
-    "tzrec/acc/_*.py",
     "tzrec/tools/convert_easyrec_config_to_tzrec_config.py",
-    "tzrec/*/*_test_tmp.py"
+    "tzrec/*/*_test_tmp.py",
+    "tzrec/acc/export_utils.py"
   ],
   "site_package_search_strategy": "all",
   "source_directories": [
@@ -16,5 +16,5 @@
     }
   ],
   "strict": true,
-  "version": "0.9.21"
+  "version": "0.9.23"
 }
@@ -26,14 +26,14 @@ ENV PATH /opt/conda/bin:$PATH
 
 ARG DEVICE
 RUN case ${DEVICE} in \
-        "cu121") pip install torch==2.5.0 fbgemm-gpu==1.0.0 --index-url https://download.pytorch.org/whl/cu121 && \
+        "cu124") pip install torch==2.6.0 fbgemm-gpu==1.1.0 --index-url https://download.pytorch.org/whl/cu124 && \
                  pip uninstall -y nvidia-cuda-cupti-cu12 nvidia-cuda-nvrtc-cu12 nvidia-cufft-cu12 nvidia-curand-cu12 nvidia-cusolver-cu12 nvidia-cusparse-cu12 nvidia-nvjitlink-cu12 nvidia-nvtx-cu12 && \
-                 sed -i '/^Requires-Dist: nvidia-/d' /opt/conda/lib/python3.11/site-packages/torch-2.5.0+cu121.dist-info/METADATA && \
-                 pip install torchmetrics==1.0.3 torch_tensorrt==2.5.0 && \
-                 pip install torchrec==1.0.0 --index-url https://download.pytorch.org/whl/cu121 ;; \
-        * )      pip install torch==2.5.0 fbgemm-gpu==1.0.0 --index-url https://download.pytorch.org/whl/cpu && \
+                 sed -i '/^Requires-Dist: nvidia-/d' /opt/conda/lib/python3.11/site-packages/torch-2.6.0+cu124.dist-info/METADATA && \
+                 pip install torchmetrics==1.0.3 torch_tensorrt==2.6.0 --extra-index-url https://download.pytorch.org/whl/cu124 && \
+                 pip install torchrec==1.1.0 --index-url https://download.pytorch.org/whl/cu124 ;; \
+        * )      pip install torch==2.6.0 fbgemm-gpu==1.1.0 --index-url https://download.pytorch.org/whl/cpu && \
                  pip install torchmetrics==1.0.3 && \
-                 pip install torchrec==1.0.0 --index-url https://download.pytorch.org/whl/cpu ;; \
+                 pip install torchrec==1.1.0 --index-url https://download.pytorch.org/whl/cpu ;; \
     esac && \
     /opt/conda/bin/conda clean -ya
 
 
@@ -402,8 +402,8 @@ feature_configs: {
 
   | 方式               | 描述                                          | 备注                           |
   | ------------------ | --------------------------------------------- | ------------------------------ |
-  | query_common_ratio | 计算query与title间重复term数占query中term比例 | 取值为\[0,1\]                  |
-  | title_common_ratio | 计算query与title间重复term数占title中term比例 | 取值为\[0,1\]                  |
+  | query_common_ratio | 计算query与title间重复term数占query中term比例 | 取值为[0,1]                    |
+  | title_common_ratio | 计算query与title间重复term数占title中term比例 | 取值为[0,1]                    |
   | is_contain         | 计算query是否全部包含在title中，保持顺序      | 0表示未包含，1表示包含         |
   | is_equal           | 计算query是否与title完全相同                  | 0表示不完全相同，1表示完全相同 |
 
 
@@ -55,7 +55,7 @@ model_config {
 ```
 
 - feature_groups: 需要至少两个feature_group: wide和deep, fm可选
-- deepfm:  deepfm相关的参数
+- deepfm: deepfm相关的参数
   - deep: deep mlp的参数配置
     - hidden_units: mlp每一层的channel数目，即神经元的数目
   - wide_embedding_dim: wide部分输出的大小
 
@@ -97,7 +97,7 @@ model_config {
         - input: 输入feature_group名
         - hidden_units: mlp每一层的channel数目，即神经元的数目
     - output_dim: user/item输出embedding维度
-    - similarity: 向量相似度函数，包括\[COSINE, INNER_PRODUCT\]，默认INNER_PRODUCT
+    - similarity: 向量相似度函数，包括[COSINE, INNER_PRODUCT]，默认INNER_PRODUCT
   - dssm_v2: 参数同dssm
     - dssm_v2可以支持user与item塔 跨塔share embedding，但训练速度相对dssm_v1稍慢
     - 注意如果使用dssm_v2，data_config.force_base_data_group需要设置为true
 
@@ -51,7 +51,7 @@ model_config {
 }
 ```
 
-- feature_groups:  可配置多个feature_group，group name可以变
+- feature_groups: 可配置多个feature_group，group name可以变
 - multi_tower: multi_tower相关的参数
   - towers: 每个deep feature_group对应了一个tower。
     - input: 跟feature_group的group_name对应
 
@@ -34,7 +34,7 @@ bash upload_data.sh ${ODPS_PROJECT_NAME}
 
 进入[PAI控制台](https://pai.console.aliyun.com)，并选择需要使用的工作空间，点击 **模型开发与训练-分布式训练(DLC)**，点击创建任务。
 
-**节点镜像** 选择官方镜像`torcheasyrec:0.6.0-pytorch2.5.0-gpu-py311-cu121-ubuntu22.04`
+**节点镜像** 选择官方镜像`torcheasyrec:0.7.0-pytorch2.6.0-gpu-py311-cu124-ubuntu22.04`
 
 **数据集配置** 选择刚新建的NAS数据集
 
 
@@ -31,7 +31,7 @@ pip index versions tzrec -f http://tzrec.oss-cn-beijing.aliyuncs.com/release/nig
 
 进入[PAI控制台](https://pai.console.aliyun.com)，并选择需要使用的工作空间，点击 **模型开发与训练-分布式训练(DLC)**，点击创建任务。
 
-**节点镜像** 选择官方镜像`torcheasyrec:0.6.0-pytorch2.5.0-gpu-py311-cu121-ubuntu22.04`
+**节点镜像** 选择官方镜像`torcheasyrec:0.7.0-pytorch2.6.0-gpu-py311-cu124-ubuntu22.04`
 
 **数据集配置** 选择刚新建的NAS数据集
 
 
@@ -15,10 +15,10 @@ pip index versions tzrec -f http://tzrec.oss-cn-beijing.aliyuncs.com/release/nig
 ```bash
 conda create -n tzrec python=3.11
 conda activate tzrec
-pip install torch==2.5.0 --index-url https://download.pytorch.org/whl/cu121
-pip install fbgemm-gpu==1.0.0 --index-url https://download.pytorch.org/whl/cu121
+pip install torch==2.6.0 --index-url https://download.pytorch.org/whl/cu124
+pip install fbgemm-gpu==1.1.0 --index-url https://download.pytorch.org/whl/cu124
 pip install torchmetrics==1.0.3
-pip install torchrec==1.0.0 --index-url https://download.pytorch.org/whl/cu121
+pip install torchrec==1.1.0 --index-url https://download.pytorch.org/whl/cu124
 pip install tzrec==${TZREC_NIGHTLY_VERSION} -f http://tzrec.oss-cn-beijing.aliyuncs.com/release/nightly/repo.html --trusted-host tzrec.oss-cn-beijing.aliyuncs.com
 ```
 
@@ -33,8 +33,8 @@ pip install tzrec==${TZREC_NIGHTLY_VERSION} -f http://tzrec.oss-cn-beijing.aliyu
 注：
 
 ```
-GPU版本（CUDA 12.1) 镜像地址：
-  mybigpai-public-registry.cn-beijing.cr.aliyuncs.com/easyrec/tzrec-devel:${TZREC_DOCKER_VERSION}-cu121
+GPU版本（CUDA 12.4）镜像地址：
+  mybigpai-public-registry.cn-beijing.cr.aliyuncs.com/easyrec/tzrec-devel:${TZREC_DOCKER_VERSION}-cu124
 CPU版本 镜像地址:
   mybigpai-public-registry.cn-beijing.cr.aliyuncs.com/easyrec/tzrec-devel:${TZREC_DOCKER_VERSION}-cpu
 ```
 
@@ -126,7 +126,7 @@ OMP_NUM_THREADS=16 torchrun --master_addr=localhost --master_port=32555 \
 - --hitrate_details_output: （可选）hitrate详情输出表，会包含id | topk_ids | topk_dists
   | hitrate | hit_ids 五列
 - --batch_size: 评估batch_size，默认为1024
-- --index_type: 评估检索方式，默认为IVFFlatIP，可以选 \[IVFFlatIP, IVFFlatL2\]
+- --index_type: 评估检索方式，默认为IVFFlatIP，可以选 [IVFFlatIP, IVFFlatL2]
 - --top_k: 评估TopK召回的Hitrate，默认200
 - --ivf_nlist: IVFFlat索引的聚簇中心个数，默认为1000
 - --ivf_nprobe: IVFFlat索引的检索中心个数，默认为800
@@ -151,7 +151,7 @@ python -m tzrec.tools.create_faiss_index \
 - --embedding_input_path: 物品池向量表，需包含item_id | item_tower_emb两列
 - --index_output_dir: 物品池索引输出目录，一般指定用户塔目录，以保证模型版本和索引版本同时切换
 - --batch_size: 索引构建batch_size，默认为1024
-- --index_type: 评估检索方式，默认为IVFFlatIP，可以选 \[IVFFlatIP, HNSWFlatIP, IVFFlatL2, HNSWFlatL2\]
+- --index_type: 评估检索方式，默认为IVFFlatIP，可以选 [IVFFlatIP, HNSWFlatIP, IVFFlatL2, HNSWFlatL2]
 - --ivf_nlist: IVFFlat索引的聚簇中心个数，默认为1000
 - --hnsw_M: HNSWFlat索引的M参数
 - --hnsw_efConstruction: HNSWFlat索引的efConstruction参数
 
@@ -18,7 +18,7 @@ torchrun --master_addr=localhost --master_port=32555 \
 - --eval_input_path: 评估数据的输入路径
 - --continue_train: 是否增量训练
 - --fine_tune_checkpoint: 增量训练的checkpoint路径，如experiments/multi_tower_din_taobao_local/model.ckpt-0，如果不设置，增量训练使用model_dir下最近的检查点
-- --edit_config_json: 命令行以json的方式动态修改配置文件，如{"model_dir":"experiments/","feature_configs\[0\].raw_feature.boundaries":\[4,5,6,7\]}
+- --edit_config_json: 命令行以json的方式动态修改配置文件，如{"model_dir":"experiments/","feature_configs[0].raw_feature.boundaries":[4,5,6,7]}
 
 ### 环境变量
 
 
@@ -1,2 +1 @@
-torch-tensorrt @ http://tzrec.oss-cn-beijing.aliyuncs.com/third_party/trt/torch_tensorrt-2.5.0a0-cp311-cp311-linux_x86_64.whl ; python_version=="3.11"
-torch-tensorrt @ http://tzrec.oss-cn-beijing.aliyuncs.com/third_party/trt/torch_tensorrt-2.5.0a0-cp310-cp310-linux_x86_64.whl ; python_version=="3.10"
+torch-tensorrt==2.6.0
@@ -2,16 +2,17 @@ alibabacloud_credentials
 anytree
 common_io @ https://tzrec.oss-cn-beijing.aliyuncs.com/third_party/common_io-0.4.1%2Btunnel-py2.py3-none-any.whl
 faiss-cpu
-fbgemm-gpu==1.0.0
+fbgemm-gpu==1.1.0
 graphlearn @ https://tzrec.oss-cn-beijing.aliyuncs.com/third_party/graphlearn-1.3.3-cp311-cp311-linux_x86_64.whl ; python_version=="3.11"
 graphlearn @ https://tzrec.oss-cn-beijing.aliyuncs.com/third_party/graphlearn-1.3.3-cp310-cp310-linux_x86_64.whl ; python_version=="3.10"
 grpcio-tools<1.63.0
+numpy<2
 pandas
 pyfg @ https://tzrec.oss-cn-beijing.aliyuncs.com/third_party/pyfg-0.4.4-cp311-cp311-linux_x86_64.whl ; python_version=="3.11"
 pyfg @ https://tzrec.oss-cn-beijing.aliyuncs.com/third_party/pyfg-0.4.4-cp310-cp310-linux_x86_64.whl ; python_version=="3.10"
 pyodps>=0.12.0
 scikit-learn
 tensorboard
-torch==2.5.0
+torch==2.6.0
 torchmetrics==1.0.3
-torchrec==1.0.0
+torchrec==1.1.0
@@ -1,3 +1,3 @@
 parameterized
 pre-commit
-pyre-check==0.9.21
+pyre-check==0.9.23
@@ -1,24 +1,24 @@
 #!/usr/bin/env bash
 
 REGISTRY=mybigpai-public-registry.cn-beijing.cr.aliyuncs.com/easyrec
-DOCKER_TAG=0.6
+DOCKER_TAG=0.7
 
 cp requirements.txt docker/
 rm -rf docker/requirements
 cp -r requirements/ docker/requirements
 cd docker
 
-for DEVICE in cu121 cpu
+for DEVICE in cu124 cpu
 do
     case ${DEVICE} in
-        "cu121") BASE_IMAGE=nvidia/cuda:12.1.1-devel-ubuntu22.04 ;;
+        "cu124") BASE_IMAGE=nvidia/cuda:12.4.1-devel-ubuntu22.04 ;;
         * )      BASE_IMAGE=ubuntu:22.04 ;;
     esac
     docker build --network host -t ${REGISTRY}/tzrec-devel:${DOCKER_TAG}-${DEVICE} --build-arg DEVICE=${DEVICE} --build-arg BASE_IMAGE=${BASE_IMAGE} .
     docker push ${REGISTRY}/tzrec-devel:${DOCKER_TAG}-${DEVICE}
 done
 
-docker images -q ${REGISTRY}/tzrec-devel:${DOCKER_TAG}-cu121 | xargs -I {} docker tag {} ${REGISTRY}/tzrec-devel:${DOCKER_TAG}
-docker images -q ${REGISTRY}/tzrec-devel:${DOCKER_TAG}-cu121 | xargs -I {} docker tag {} ${REGISTRY}/tzrec-devel:latest
+docker images -q ${REGISTRY}/tzrec-devel:${DOCKER_TAG}-cu124 | xargs -I {} docker tag {} ${REGISTRY}/tzrec-devel:${DOCKER_TAG}
+docker images -q ${REGISTRY}/tzrec-devel:${DOCKER_TAG}-cu124 | xargs -I {} docker tag {} ${REGISTRY}/tzrec-devel:latest
 docker push ${REGISTRY}/tzrec-devel:${DOCKER_TAG}
 docker push ${REGISTRY}/tzrec-devel:latest
@@ -3,8 +3,4 @@
 pip install -r requirements.txt
 bash scripts/gen_proto.sh
 
-# just workaround for torch-tensorrt (dynamic shape) https://github.com/pytorch/TensorRT/pull/3289/files
-cp tzrec/acc/_aten_lowering_pass.py /opt/conda/lib/python3.11/site-packages/torch_tensorrt/dynamo/lowering/passes/_aten_lowering_pass.py
-cp tzrec/acc/_decompositions.py /opt/conda/lib/python3.11/site-packages/torch_tensorrt/dynamo/lowering/_decompositions.py
-
 MKL_THREADING_LAYER=GNU TORCH_DEVICE_BACKEND_AUTOLOAD=0 PYTHONPATH=. python tzrec/tests/run.py
@@ -29,6 +29,14 @@
     "Undefined attribute [16]: Module `pyarrow` has no attribute",
     "Undefined attribute [16]: Module `pyarrow.compute` has no attribute",
     "Undefined attribute [16]: Module `pyarrow.csv` has no attribute",
+    # type-safety of torch.nn.Module instances
+    # https://github.com/pytorch/pytorch/issues/81462
+    # Call error [29]: `typing.Union[nn.modules.module.Module, torch._tensor.Tensor]` is
+    # not a function.
+    "Union[nn.modules.module.Module, torch._tensor.Tensor]",
+    "Union[torch._tensor.Tensor, torch.nn.modules.module.Module]",
+    "Union[torch._tensor.Tensor, nn.modules.module.Module]",
+    "Union[Module, Tensor]",
 ]
 
 if __name__ == "__main__":
Original file line number	Diff line number	Diff line change
`@@ -51,7 +51,7 @@ model_config {`
`51`	`51`	`}`
`52`	`52`	`` ``` ``
`53`	`53`
`54`		`-- feature_groups:  可配置多个feature_group，group name可以变`
	`54`	`+- feature_groups: 可配置多个feature_group，group name可以变`
`55`	`55`	`- multi_tower: multi_tower相关的参数`
`56`	`56`	`  - towers: 每个deep feature_group对应了一个tower。`
`57`	`57`	`    - input: 跟feature_group的group_name对应`
Original file line number	Diff line number	Diff line change
`@@ -1,2 +1 @@`
`1`		`-torch-tensorrt @ http://tzrec.oss-cn-beijing.aliyuncs.com/third_party/trt/torch_tensorrt-2.5.0a0-cp311-cp311-linux_x86_64.whl ; python_version=="3.11"`
`2`		`-torch-tensorrt @ http://tzrec.oss-cn-beijing.aliyuncs.com/third_party/trt/torch_tensorrt-2.5.0a0-cp310-cp310-linux_x86_64.whl ; python_version=="3.10"`
	`1`	`+torch-tensorrt==2.6.0`