diff --git a/.git_archival.txt b/.git_archival.txt new file mode 100644 index 0000000000..8fb235d704 --- /dev/null +++ b/.git_archival.txt @@ -0,0 +1,4 @@ +node: $Format:%H$ +node-date: $Format:%cI$ +describe-name: $Format:%(describe:tags=true,match=*[0-9]*)$ +ref-names: $Format:%D$ diff --git a/.gitattributes b/.gitattributes index e77d446ba6..776405a339 100644 --- a/.gitattributes +++ b/.gitattributes @@ -1,2 +1,4 @@ # do not show up detailed difference on GitHub source/3rdparty/* linguist-generated=true +source/3rdparty/README.md linguist-generated=false +.git_archival.txt export-subst diff --git a/.github/workflows/build_cc.yml b/.github/workflows/build_cc.yml index f029517d80..d851282cbc 100644 --- a/.github/workflows/build_cc.yml +++ b/.github/workflows/build_cc.yml @@ -24,9 +24,9 @@ jobs: - uses: actions/setup-python@v5 with: python-version: '3.11' - cache: 'pip' - uses: lukka/get-cmake@latest - - run: python -m pip install tensorflow + - run: python -m pip install uv + - run: source/install/uv_with_retry.sh pip install --system tensorflow - run: | wget https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2204/x86_64/cuda-keyring_1.0-1_all.deb \ && sudo dpkg -i cuda-keyring_1.0-1_all.deb \ diff --git a/.github/workflows/build_wheel.yml b/.github/workflows/build_wheel.yml index dd6b40c0b9..e203737424 100644 --- a/.github/workflows/build_wheel.yml +++ b/.github/workflows/build_wheel.yml @@ -65,23 +65,19 @@ jobs: with: # https://github.com/pypa/setuptools_scm/issues/480 fetch-depth: 0 + - name: Install uv + run: curl -LsSf https://astral.sh/uv/install.sh | sh + if: runner.os != 'Linux' - uses: docker/setup-qemu-action@v3 name: Setup QEMU if: matrix.platform_id == 'manylinux_aarch64' && matrix.os == 'ubuntu-latest' # detect version in advance. 
See #3168 - - uses: actions/setup-python@v5 - name: Install Python - with: - python-version: '3.11' - cache: 'pip' - if: matrix.dp_pkg_name == 'deepmd-kit-cu11' - run: | - python -m pip install setuptools_scm - python -c "from setuptools_scm import get_version;print('SETUPTOOLS_SCM_PRETEND_VERSION='+get_version())" >> $GITHUB_ENV + echo "SETUPTOOLS_SCM_PRETEND_VERSION=$(pipx run uv tool run --from setuptools_scm python -m setuptools_scm)" >> $GITHUB_ENV rm -rf .git if: matrix.dp_pkg_name == 'deepmd-kit-cu11' - name: Build wheels - uses: pypa/cibuildwheel@v2.17 + uses: pypa/cibuildwheel@v2.19 env: CIBW_BUILD_VERBOSITY: 1 CIBW_ARCHS: all @@ -89,6 +85,7 @@ jobs: DP_VARIANT: ${{ matrix.dp_variant }} CUDA_VERSION: ${{ matrix.cuda_version }} DP_PKG_NAME: ${{ matrix.dp_pkg_name }} + CIBW_BUILD_FRONTEND: 'build[uv]' - uses: actions/upload-artifact@v4 with: name: cibw-cp${{ matrix.python }}-${{ matrix.platform_id }}-cu${{ matrix.cuda_version }}-${{ strategy.job-index }} @@ -100,14 +97,8 @@ jobs: - uses: actions/checkout@v4 with: fetch-depth: 0 - - uses: actions/setup-python@v5 - name: Install Python - with: - python-version: '3.11' - cache: 'pip' - - run: python -m pip install build - name: Build sdist - run: python -m build --sdist + run: pipx run uv tool run --with build[uv] --from build python -m build --installer uv --sdist - uses: actions/upload-artifact@v4 with: @@ -161,7 +152,7 @@ jobs: images: ghcr.io/deepmodeling/deepmd-kit - name: Build and push Docker image - uses: docker/build-push-action@v5 + uses: docker/build-push-action@v6 with: context: source/install/docker push: ${{ github.repository_owner == 'deepmodeling' && github.event_name == 'push' && github.actor != 'dependabot[bot]' }} diff --git a/.github/workflows/package_c.yml b/.github/workflows/package_c.yml index 82567609e4..e932dd0eba 100644 --- a/.github/workflows/package_c.yml +++ b/.github/workflows/package_c.yml @@ -19,6 +19,8 @@ jobs: filename: libdeepmd_c_cu11.tar.gz steps: - uses: actions/checkout@v4 + with: + fetch-depth: 0 - name: Package C library run: ./source/install/docker_package_c.sh env: diff --git a/.github/workflows/test_cc.yml b/.github/workflows/test_cc.yml index 4a2ba7968a..8525c03648 100644 --- a/.github/workflows/test_cc.yml +++ b/.github/workflows/test_cc.yml @@ -20,7 +20,8 @@ jobs: with: mpi: mpich - uses: lukka/get-cmake@latest - - run: python -m pip install tensorflow + - run: python -m pip install uv + - run: source/install/uv_with_retry.sh pip install --system tensorflow # https://github.com/actions/runner-images/issues/9491 - name: Fix kernel mmap rnd bits run: sudo sysctl vm.mmap_rnd_bits=28 @@ -34,11 +35,9 @@ jobs: CMAKE_GENERATOR: Ninja CXXFLAGS: ${{ matrix.check_memleak && '-fsanitize=leak' || '' }} # test lammps - # ASE issue: https://gitlab.com/ase/ase/-/merge_requests/2843 - # TODO: remove ase version when ase has new release - run: | - python -m pip install -U pip - python -m pip install -e .[cpu,test,lmp] mpi4py "ase @ https://gitlab.com/ase/ase/-/archive/8c5aa5fd6448c5cfb517a014dccf2b214a9dfa8f/ase-8c5aa5fd6448c5cfb517a014dccf2b214a9dfa8f.tar.gz" + export TENSORFLOW_ROOT=$(python -c 'import importlib,pathlib;print(pathlib.Path(importlib.util.find_spec("tensorflow").origin).parent)') + source/install/uv_with_retry.sh pip install --system -e .[cpu,test,lmp] mpi4py env: DP_BUILD_TESTING: 1 if: ${{ !matrix.check_memleak }} diff --git a/.github/workflows/test_cuda.yml b/.github/workflows/test_cuda.yml index 6435789933..660d022de9 100644 --- a/.github/workflows/test_cuda.yml +++ 
b/.github/workflows/test_cuda.yml @@ -33,11 +33,9 @@ jobs: && sudo apt-get update \ && sudo apt-get -y install cuda-12-2 libcudnn8=8.9.5.*-1+cuda12.2 if: false # skip as we use nvidia image - - name: Set PyPI mirror for Aliyun cloud machine - run: python -m pip config --user set global.index-url https://mirrors.aliyun.com/pypi/simple/ - - run: python -m pip install -U "pip>=21.3.1,!=23.0.0" - - run: python -m pip install "tensorflow>=2.15.0rc0" - - run: python -m pip install -v -e .[gpu,test,lmp,cu12] "ase @ https://gitlab.com/ase/ase/-/archive/8c5aa5fd6448c5cfb517a014dccf2b214a9dfa8f/ase-8c5aa5fd6448c5cfb517a014dccf2b214a9dfa8f.tar.gz" + - run: python -m pip install -U uv + - run: source/install/uv_with_retry.sh pip install --system "tensorflow>=2.15.0rc0" + - run: source/install/uv_with_retry.sh pip install --system -v -e .[gpu,test,lmp,cu12] env: DP_BUILD_TESTING: 1 DP_VARIANT: cuda diff --git a/.github/workflows/test_python.yml b/.github/workflows/test_python.yml index 28df7b5625..956c91e491 100644 --- a/.github/workflows/test_python.yml +++ b/.github/workflows/test_python.yml @@ -21,18 +21,20 @@ jobs: - uses: actions/setup-python@v5 with: python-version: ${{ matrix.python }} - cache: 'pip' - uses: mpi4py/setup-mpi@v1 if: ${{ matrix.tf == '' }} with: mpi: openmpi - # https://github.com/pypa/pip/issues/11770 - - run: python -m pip install -U "pip>=21.3.1,!=23.0.0" - - run: pip install -e .[cpu,test] + - run: curl -LsSf https://astral.sh/uv/install.sh | sh + - run: source/install/uv_with_retry.sh pip install --system -e .[cpu,test] env: + # Note that uv has some issues with finding an + # existing TensorFlow package. Currently, TensorFlow + # is taken from the build dependencies; if that + # changes, set `TENSORFLOW_ROOT` explicitly. TENSORFLOW_VERSION: ${{ matrix.tf }} DP_BUILD_TESTING: 1 - - run: pip install horovod mpi4py + - run: source/install/uv_with_retry.sh pip install --system --no-build-isolation horovod mpi4py if: ${{ matrix.tf == '' }} env: HOROVOD_WITH_TENSORFLOW: 1 diff --git a/.gitignore b/.gitignore index 82d3e4a7da..572f9bf229 100644 --- a/.gitignore +++ b/.gitignore @@ -43,3 +43,4 @@ build_cc_tests build_c_tests build_c/ libdeepmd_c/ +.uv/ diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml index 7e0b0a4a76..9b3f099acb 100644 --- a/.pre-commit-config.yaml +++ b/.pre-commit-config.yaml @@ -2,7 +2,7 @@ # See https://pre-commit.com/hooks.html for more hooks repos: - repo: https://github.com/pre-commit/pre-commit-hooks - rev: v4.5.0 + rev: v4.6.0 hooks: - id: trailing-whitespace exclude: "^.+\\.pbtxt$" @@ -29,7 +29,7 @@ repos: exclude: ^source/3rdparty - repo: https://github.com/astral-sh/ruff-pre-commit # Ruff version.
- rev: v0.3.5 + rev: v0.4.10 hooks: - id: ruff args: ["--fix"] @@ -52,7 +52,7 @@ repos: - id: blacken-docs # C++ - repo: https://github.com/pre-commit/mirrors-clang-format - rev: v18.1.2 + rev: v18.1.7 hooks: - id: clang-format exclude: ^source/3rdparty|source/lib/src/gpu/cudart/.+\.inc @@ -75,6 +75,25 @@ repos: hooks: - id: cmake-format #- id: cmake-lint + - repo: https://github.com/njzjz/mirrors-bibtex-tidy + rev: v1.13.0 + hooks: + - id: bibtex-tidy + args: + - --curly + - --numeric + - --align=13 + - --blank-lines # disable sort: the order of keys and fields has explicit meanings #- --sort=key + - --duplicates=key,doi,citation,abstract + - --merge=combine #- --sort-fields #- --strip-comments + - --trailing-commas + - --encode-urls + - --remove-empty-fields + - --wrap=80 # license header - repo: https://github.com/Lucas-C/pre-commit-hooks rev: v1.5.5 diff --git a/.readthedocs.yml b/.readthedocs.yml index 6f3ff6be3f..e8b81a4109 100644 --- a/.readthedocs.yml +++ b/.readthedocs.yml @@ -2,7 +2,10 @@ version: 2 build: os: ubuntu-20.04 tools: - python: mambaforge-4.10 -conda: - environment: doc/environment.yml + python: "3.11" + jobs: + post_create_environment: + - pip install uv + post_install: + - VIRTUAL_ENV=$READTHEDOCS_VIRTUALENV_PATH uv pip install -r doc/requirements.txt formats: all diff --git a/CITATIONS.bib b/CITATIONS.bib index ac682b28f7..a05e7ef9ee 100644 --- a/CITATIONS.bib +++ b/CITATIONS.bib @@ -1,272 +1,342 @@ -The proposed feature of each article is described in the "annote" field. -Please cite a article if any feature is used - -@article{Wang_ComputPhysCommun_2018_v228_p178, - annote = {general purpose}, - author = {Wang, Han and Zhang, Linfeng and Han, Jiequn and E, Weinan}, - doi = {10.1016/j.cpc.2018.03.016}, - year = 2018, - month = {jul}, - publisher = {Elsevier {BV}}, - volume = 228, - journal = {Comput. Phys. Comm.}, - title = {{DeePMD-kit: A deep learning package for many-body potential - energy representation and molecular dynamics}}, - pages = {178--184}, -} - -@Article{Zeng_JChemPhys_2023_v159_p054801, - annote = {general purpose}, - title = {{DeePMD-kit v2: A software package for deep potential models}}, - author = {Jinzhe Zeng and Duo Zhang and Denghui Lu and Pinghui Mo and Zeyu Li - and Yixiao Chen and Mari{\'a}n Rynik and Li'ang Huang and Ziyao Li and - Shaochen Shi and Yingze Wang and Haotian Ye and Ping Tuo and Jiabin - Yang and Ye Ding and Yifan Li and Davide Tisi and Qiyu Zeng and Han - Bao and Yu Xia and Jiameng Huang and Koki Muraoka and Yibo Wang and - Junhan Chang and Fengbo Yuan and Sigbj{\o}rn L{\o}land Bore and Chun - Cai and Yinnian Lin and Bo Wang and Jiayan Xu and Jia-Xin Zhu and - Chenxing Luo and Yuzhi Zhang and Rhys E A Goodall and Wenshuo Liang - and Anurag Kumar Singh and Sikai Yao and Jingchao Zhang and Renata - Wentzcovitch and Jiequn Han and Jie Liu and Weile Jia and Darrin M - York and Weinan E and Roberto Car and Linfeng Zhang and Han Wang}, - journal = {J. Chem. Phys.}, - volume = 159, - issue = 5, - year = 2023, - pages = 054801, - doi = {10.1063/5.0155600}, -} - - -@article{Lu_CompPhysCommun_2021_v259_p107624, - annote = {GPU support}, - title={{86 PFLOPS Deep Potential Molecular Dynamics simulation of 100 million - atoms with ab initio accuracy}}, - author={Lu, Denghui and Wang, Han and Chen, Mohan and Lin, Lin and Car, Roberto - and E, Weinan and Jia, Weile and Zhang, Linfeng}, - journal={Comput. Phys. 
Comm.}, - volume={259}, - pages={107624}, - year={2021}, - publisher={Elsevier}, - doi={10.1016/j.cpc.2020.107624}, -} - -@article{Zhang_PhysRevLett_2018_v120_p143001, - annote = {local frame (loc_frame)}, - author = {Linfeng Zhang and Jiequn Han and Han Wang and - Roberto Car and Weinan E}, - journal = {Phys. Rev. Lett.}, - number = {14}, - pages = {143001}, - publisher = {APS}, - title = {{Deep potential molecular dynamics: a scalable model - with the accuracy of quantum mechanics}}, - volume = {120}, - year = {2018}, - doi = {10.1103/PhysRevLett.120.143001} -} - -@incollection{Zhang_BookChap_NIPS_2018_v31_p4436, - annote = {DeepPot-SE (se_e2_a, se_e2_r, se_e3, se_atten)}, - title = {{End-to-end Symmetry Preserving Inter-atomic Potential Energy Model - for Finite and Extended Systems}}, - author = {Zhang, Linfeng and Han, Jiequn and Wang, Han and Saidi, Wissam and - Car, Roberto and E, Weinan}, - booktitle = {Advances in Neural Information Processing Systems 31}, - editor = {S. Bengio and H. Wallach and H. Larochelle and K. Grauman and N. - Cesa-Bianchi and R. Garnett}, - pages = {4436--4446}, - year = {2018}, - publisher = {Curran Associates, Inc.}, - url = {https://dl.acm.org/doi/10.5555/3327345.3327356} -} - -@Article{Wang_NuclFusion_2022_v62_p126013, - annote = {three-body embedding DeepPot-SE (se_e3)}, - author = {Xiaoyang Wang and Yinan Wang and Linfeng Zhang and Fuzhi Dai and Han - Wang}, - title = {{A tungsten deep neural-network potential for simulating mechanical - property degradation under fusion service environment}}, - journal = {Nucl. Fusion}, - year = 2022, - volume = 62, - issue = 12, - pages = 126013, - doi = {10.1088/1741-4326/ac888b}, -} - -@misc{Zhang_2022_DPA1, - annote = {attention-based descriptor}, - author = {Zhang, Duo and Bi, Hangrui and Dai, Fu-Zhi and Jiang, Wanrun and Zhang, Linfeng and Wang, Han}, - title = {{DPA-1: Pretraining of Attention-based Deep Potential Model for Molecular Simulation}}, - publisher = {arXiv}, - year = {2022}, - doi = {10.48550/arXiv.2208.08236}, -} - -@article{Zhang_PhysPlasmas_2020_v27_p122704, - annote = {frame-specific parameters (e.g. electronic temperature)}, - author = {Zhang, Yuzhi and Gao, Chang and Liu, Qianrui and Zhang, Linfeng and Wang, Han and Chen, Mohan}, - title = {{Warm dense matter simulation via electron temperature dependent deep potential molecular dynamics}}, - journal = {Phys. Plasmas}, - volume = {27}, - number = {12}, - pages = {122704}, - year = {2020}, - month = {12}, - doi = {10.1063/5.0023265}, -} - -@misc{Zeng_2023_TTMDPMD, - annote = {atom-specific parameter (e.g. electron temperature) }, - author = {Zeng, Qiyu and Chen, Bo and Zhang, Shen and Kang, Dongdong and Wang, Han and Yu, Xiaoxiang and Dai, Jiayu}, - title = {{Full-scale ab initio simulations of laser-driven atomistic dynamics}}, - publisher = {arXiv}, - year = {2023}, - doi = {10.48550/arXiv.2308.13863}, -} - -@article{Zhang_PhysRevB_2020_v102_p41121, - annote = {fit dipole}, - title={{Deep neural network for the dielectric response of insulators}}, - author={Zhang, Linfeng and Chen, Mohan and Wu, Xifan and Wang, Han and E, Weinan and Car, Roberto}, - journal={Phys. Rev. 
B}, - volume={102}, - number={4}, - pages={041121}, - year={2020}, - publisher={APS}, - doi={10.1103/PhysRevB.102.041121} -} - -@article{Sommers_PhysChemChemPhys_2020_v22_p10592, - annote = {fit polarizability}, - title={{Raman spectrum and polarizability of liquid water from deep neural networks}}, - author={Sommers, Grace M and Andrade, Marcos F Calegari and Zhang, Linfeng and Wang, Han and Car, Roberto}, - journal={Phys. Chem. Chem. Phys.}, - volume={22}, - number={19}, - pages={10592--10602}, - year={2020}, - publisher={Royal Society of Chemistry}, - doi={10.1039/D0CP01893G} -} - -@Article{Zeng_JChemTheoryComput_2023_v19_p1261, - annote = {fit relative energies}, - author = {Jinzhe Zeng and Yujun Tao and Timothy J Giese and Darrin M York}, - title = {{QD{\pi}: A Quantum Deep Potential Interaction Model for - Drug Discovery}}, - journal = {J. Chem. Theory Comput.}, - year = 2023, - volume = 19, - issue = 4, - pages = {1261--1275}, - doi = {10.1021/acs.jctc.2c01172}, -} - -@Article{Zeng_PhysRevB_2022_v105_p174109, - annote = {fit density of states}, - author = {Qiyu Zeng and Bo Chen and Xiaoxiang Yu and Shen Zhang and Dongdong - Kang and Han Wang and Jiayu Dai}, - title = {{Towards large-scale and spatiotemporally resolved diagnosis of - electronic density of states by deep learning}}, - journal = {Phys. Rev. B}, - year = 2022, - volume = 105, - issue = 17, - pages = 174109, - doi = {10.1103/PhysRevB.105.174109}, -} - -@Article{Zhang_JChemPhys_2022_v156_p124107, - annote = {DPLR, se_e2_r, hybrid descriptor}, - author = {Linfeng Zhang and Han Wang and Maria Carolina Muniz and Athanassios Z - Panagiotopoulos and Roberto Car and Weinan E}, - title = {{A deep potential model with long-range electrostatic interactions}}, - journal = {J. Chem. Phys.}, - year = 2022, - volume = 156, - issue = 12, - pages = 124107, - doi = {10.1063/5.0083669}, -} - -@article{Zeng_JChemTheoryComput_2021_v17_p6993, - annote= {DPRc}, - title={{Development of Range-Corrected Deep Learning Potentials for Fast, Accurate Quantum Mechanical/molecular Mechanical Simulations of Chemical Reactions in Solution}}, - author={Zeng, Jinzhe and Giese, Timothy J and Ekesan, {\c{S}}{\"o}len and York, Darrin M}, - journal={J. Chem. Theory Comput.}, - year=2021, - volume=17, - issue=11, - pages={6993-7009}, - doi = {10.1021/acs.jctc.1c00201}, -} - -@article{Wang_ApplPhysLett_2019_v114_p244101, - annote = {Interpolation with a pair-wise potential}, - title={{Deep learning inter-atomic potential model for accurate irradiation damage simulations}}, - author={Wang, Hao and Guo, Xun and Zhang, Linfeng and Wang, Han and Xue, Jianming}, - journal={Appl. Phys. Lett.}, - volume={114}, - number={24}, - pages={244101}, - year={2019}, - publisher={AIP Publishing LLC}, - doi={10.1063/1.5098061}, -} - -@article{Zhang_PhysRevMater_2019_v3_p23804, - annote = {model deviation}, - title = {{Active learning of uniformly accurate interatomic potentials for materials simulation}}, - author = {Linfeng Zhang and De-Ye Lin and Han Wang and Roberto Car and Weinan E}, - journal = {Phys. Rev. Mater.}, - volume = 3, - issue = 2, - pages = 23804, - year = 2019, - publisher = {American Physical Society}, - doi = {10.1103/PhysRevMaterials.3.023804}, -} - -@article{Lu_JChemTheoryComput_2022_v18_p5555, - annote = {DP Compress}, - author = {Denghui Lu and Wanrun Jiang and Yixiao Chen and Linfeng Zhang and - Weile Jia and Han Wang and Mohan Chen}, - title = {{DP Compress: A Model Compression Scheme for Generating Efficient Deep - Potential Models}}, - journal = {J. 
Chem. Theory Comput.}, - year = 2022, - volume=18, - issue=9, - pages={5555--5567}, - doi = {10.1021/acs.jctc.2c00102}, -} - -@article{Mo_npjComputMater_2022_v8_p107, - annote = {NVNMD}, - author = {Pinghui Mo and Chang Li and Dan Zhao and Yujia Zhang and Mengchao Shi - and Junhua Li and Jie Liu}, - title = {{Accurate and efficient molecular dynamics based on machine learning - and non von Neumann architecture}}, - journal = {npj Comput. Mater.}, - year = 2022, - volume = 8, - issue = 1, - pages = 107, - doi = {10.1038/s41524-022-00773-z}, -} - -@article{Zeng_EnergyFuels_2021_v35_p762, - annote = {relative or atomic model deviation}, - author = {Jinzhe Zeng and Linfeng Zhang and Han Wang and Tong Zhu}, - title = {{Exploring the Chemical Space of Linear Alkane Pyrolysis via Deep Potential GENerator}}, - journal = {Energy \& Fuels}, - volume = 35, - number = 1, - pages = {762--769}, - year = 2021, - doi = {10.1021/acs.energyfuels.0c03211}, -} +The proposed feature of each article is described in the "annote" field. +Please cite an article if any feature is used +@article{Wang_ComputPhysCommun_2018_v228_p178, + annote = {general purpose}, + author = {Wang, Han and Zhang, Linfeng and Han, Jiequn and E, Weinan}, + doi = {10.1016/j.cpc.2018.03.016}, + year = 2018, + month = {jul}, + publisher = {Elsevier {BV}}, + volume = 228, + journal = {Comput. Phys. Comm.}, + title = { + {DeePMD-kit: A deep learning package for many-body potential energy + representation and molecular dynamics} + }, + pages = {178--184}, +} + +@article{Zeng_JChemPhys_2023_v159_p054801, + annote = {general purpose}, + title = {{DeePMD-kit v2: A software package for deep potential models}}, + author = { + Jinzhe Zeng and Duo Zhang and Denghui Lu and Pinghui Mo and Zeyu Li and + Yixiao Chen and Mari{\'a}n Rynik and Li'ang Huang and Ziyao Li and Shaochen + Shi and Yingze Wang and Haotian Ye and Ping Tuo and Jiabin Yang and Ye Ding + and Yifan Li and Davide Tisi and Qiyu Zeng and Han Bao and Yu Xia and + Jiameng Huang and Koki Muraoka and Yibo Wang and Junhan Chang and Fengbo + Yuan and Sigbj{\o}rn L{\o}land Bore and Chun Cai and Yinnian Lin and Bo + Wang and Jiayan Xu and Jia-Xin Zhu and Chenxing Luo and Yuzhi Zhang and + Rhys E A Goodall and Wenshuo Liang and Anurag Kumar Singh and Sikai Yao and + Jingchao Zhang and Renata Wentzcovitch and Jiequn Han and Jie Liu and Weile + Jia and Darrin M York and Weinan E and Roberto Car and Linfeng Zhang and + Han Wang + }, + journal = {J. Chem. Phys.}, + volume = 159, + issue = 5, + year = 2023, + pages = 054801, + doi = {10.1063/5.0155600}, +} + +@article{Lu_CompPhysCommun_2021_v259_p107624, + annote = {GPU support}, + title = { + {86 PFLOPS Deep Potential Molecular Dynamics simulation of 100 million + atoms with ab initio accuracy} + }, + author = { + Lu, Denghui and Wang, Han and Chen, Mohan and Lin, Lin and Car, Roberto and + E, Weinan and Jia, Weile and Zhang, Linfeng + }, + journal = {Comput. Phys. Comm.}, + volume = 259, + pages = 107624, + year = 2021, + publisher = {Elsevier}, + doi = {10.1016/j.cpc.2020.107624}, +} + +@article{Zhang_PhysRevLett_2018_v120_p143001, + annote = {local frame (loc\_frame)}, + author = {Linfeng Zhang and Jiequn Han and Han Wang and Roberto Car and Weinan E}, + journal = {Phys. Rev. 
Lett.}, + number = 14, + pages = 143001, + publisher = {APS}, + title = { + {Deep potential molecular dynamics: a scalable model with the accuracy of + quantum mechanics} + }, + volume = 120, + year = 2018, + doi = {10.1103/PhysRevLett.120.143001}, +} + +@incollection{Zhang_BookChap_NIPS_2018_v31_p4436, + annote = {DeepPot-SE (se\_e2\_a, se\_e2\_r, se\_e3, se\_atten)}, + title = { + {End-to-end Symmetry Preserving Inter-atomic Potential Energy Model for + Finite and Extended Systems} + }, + author = { + Zhang, Linfeng and Han, Jiequn and Wang, Han and Saidi, Wissam and Car, + Roberto and E, Weinan + }, + booktitle = {Advances in Neural Information Processing Systems 31}, + editor = { + S. Bengio and H. Wallach and H. Larochelle and K. Grauman and N. + Cesa-Bianchi and R. Garnett + }, + pages = {4436--4446}, + year = 2018, + publisher = {Curran Associates, Inc.}, + url = {https://dl.acm.org/doi/10.5555/3327345.3327356}, +} + +@article{Wang_NuclFusion_2022_v62_p126013, + annote = {three-body embedding DeepPot-SE (se\_e3)}, + author = {Xiaoyang Wang and Yinan Wang and Linfeng Zhang and Fuzhi Dai and Han Wang}, + title = { + {A tungsten deep neural-network potential for simulating mechanical + property degradation under fusion service environment} + }, + journal = {Nucl. Fusion}, + year = 2022, + volume = 62, + issue = 12, + pages = 126013, + doi = {10.1088/1741-4326/ac888b}, +} + +@article{Zhang_NpjComputMater_2024_v10_p94, + annote = {DPA-1, attention-based descriptor}, + author = { + Duo Zhang and Hangrui Bi and Fu-Zhi Dai and Wanrun Jiang and Xinzijian Liu + and Linfeng Zhang and Han Wang + }, + title = { + {Pretraining of attention-based deep learning potential model for molecular + simulation} + }, + journal = {npj Comput. Mater.}, + year = 2024, + volume = 10, + issue = 1, + pages = 94, + doi = {10.1038/s41524-024-01278-7}, +} + +@article{Zhang_PhysPlasmas_2020_v27_p122704, + annote = {frame-specific parameters (e.g. electronic temperature)}, + author = { + Zhang, Yuzhi and Gao, Chang and Liu, Qianrui and Zhang, Linfeng and Wang, + Han and Chen, Mohan + }, + title = { + {Warm dense matter simulation via electron temperature dependent deep + potential molecular dynamics} + }, + journal = {Phys. Plasmas}, + volume = 27, + number = 12, + pages = 122704, + year = 2020, + month = 12, + doi = {10.1063/5.0023265}, +} + +@misc{Zeng_2023_TTMDPMD, + annote = {atom-specific parameter (e.g. electron temperature)}, + author = { + Zeng, Qiyu and Chen, Bo and Zhang, Shen and Kang, Dongdong and Wang, Han + and Yu, Xiaoxiang and Dai, Jiayu + }, + title = {{Full-scale ab initio simulations of laser-driven atomistic dynamics}}, + publisher = {arXiv}, + year = 2023, + doi = {10.48550/arXiv.2308.13863}, +} + +@article{Zhang_PhysRevB_2020_v102_p41121, + annote = {fit dipole}, + title = {{Deep neural network for the dielectric response of insulators}}, + author = { + Zhang, Linfeng and Chen, Mohan and Wu, Xifan and Wang, Han and E, Weinan + and Car, Roberto + }, + journal = {Phys. Rev. B}, + volume = 102, + number = 4, + pages = {041121}, + year = 2020, + publisher = {APS}, + doi = {10.1103/PhysRevB.102.041121}, +} + +@article{Sommers_PhysChemChemPhys_2020_v22_p10592, + annote = {fit polarizability}, + title = { + {Raman spectrum and polarizability of liquid water from deep neural + networks} + }, + author = { + Sommers, Grace M and Andrade, Marcos F Calegari and Zhang, Linfeng and + Wang, Han and Car, Roberto + }, + journal = {Phys. Chem. Chem. 
Phys.}, + volume = 22, + number = 19, + pages = {10592--10602}, + year = 2020, + publisher = {Royal Society of Chemistry}, + doi = {10.1039/D0CP01893G}, +} + +@article{Zeng_JChemTheoryComput_2023_v19_p1261, + annote = {fit relative energies}, + author = {Jinzhe Zeng and Yujun Tao and Timothy J Giese and Darrin M York}, + title = {{QD{\pi}: A Quantum Deep Potential Interaction Model for Drug Discovery}}, + journal = {J. Chem. Theory Comput.}, + year = 2023, + volume = 19, + issue = 4, + pages = {1261--1275}, + doi = {10.1021/acs.jctc.2c01172}, +} + +@article{Zeng_PhysRevB_2022_v105_p174109, + annote = {fit density of states}, + author = { + Qiyu Zeng and Bo Chen and Xiaoxiang Yu and Shen Zhang and Dongdong Kang and + Han Wang and Jiayu Dai + }, + title = { + {Towards large-scale and spatiotemporally resolved diagnosis of electronic + density of states by deep learning} + }, + journal = {Phys. Rev. B}, + year = 2022, + volume = 105, + issue = 17, + pages = 174109, + doi = {10.1103/PhysRevB.105.174109}, +} + +@article{Zhang_JChemPhys_2022_v156_p124107, + annote = {DPLR, se\_e2\_r, hybrid descriptor}, + author = { + Linfeng Zhang and Han Wang and Maria Carolina Muniz and Athanassios Z + Panagiotopoulos and Roberto Car and Weinan E + }, + title = {{A deep potential model with long-range electrostatic interactions}}, + journal = {J. Chem. Phys.}, + year = 2022, + volume = 156, + issue = 12, + pages = 124107, + doi = {10.1063/5.0083669}, +} + +@article{Zeng_JChemTheoryComput_2021_v17_p6993, + annote = {DPRc}, + title = { + {Development of Range-Corrected Deep Learning Potentials for Fast, Accurate + Quantum Mechanical/molecular Mechanical Simulations of Chemical Reactions + in Solution} + }, + author = { + Zeng, Jinzhe and Giese, Timothy J and Ekesan, {\c{S}}{\"o}len and York, + Darrin M + }, + journal = {J. Chem. Theory Comput.}, + year = 2021, + volume = 17, + issue = 11, + pages = {6993--7009}, + doi = {10.1021/acs.jctc.1c00201}, +} + +@article{Wang_ApplPhysLett_2019_v114_p244101, + annote = {Interpolation with a pair-wise potential}, + title = { + {Deep learning inter-atomic potential model for accurate irradiation damage + simulations} + }, + author = {Wang, Hao and Guo, Xun and Zhang, Linfeng and Wang, Han and Xue, Jianming}, + journal = {Appl. Phys. Lett.}, + volume = 114, + number = 24, + pages = 244101, + year = 2019, + publisher = {AIP Publishing LLC}, + doi = {10.1063/1.5098061}, +} + +@article{Zhang_PhysRevMater_2019_v3_p23804, + annote = {model deviation}, + title = { + {Active learning of uniformly accurate interatomic potentials for materials + simulation} + }, + author = {Linfeng Zhang and De-Ye Lin and Han Wang and Roberto Car and Weinan E}, + journal = {Phys. Rev. Mater.}, + volume = 3, + issue = 2, + pages = 23804, + year = 2019, + publisher = {American Physical Society}, + doi = {10.1103/PhysRevMaterials.3.023804}, +} + +@article{Lu_JChemTheoryComput_2022_v18_p5555, + annote = {DP Compress}, + author = { + Denghui Lu and Wanrun Jiang and Yixiao Chen and Linfeng Zhang and Weile Jia + and Han Wang and Mohan Chen + }, + title = { + {DP Compress: A Model Compression Scheme for Generating Efficient Deep + Potential Models} + }, + journal = {J. Chem. 
Theory Comput.}, + year = 2022, + volume = 18, + issue = 9, + pages = {5555--5567}, + doi = {10.1021/acs.jctc.2c00102}, +} + +@article{Mo_npjComputMater_2022_v8_p107, + annote = {NVNMD}, + author = { + Pinghui Mo and Chang Li and Dan Zhao and Yujia Zhang and Mengchao Shi and + Junhua Li and Jie Liu + }, + title = { + {Accurate and efficient molecular dynamics based on machine learning and + non von Neumann architecture} + }, + journal = {npj Comput. Mater.}, + year = 2022, + volume = 8, + issue = 1, + pages = 107, + doi = {10.1038/s41524-022-00773-z}, +} + +@article{Zeng_EnergyFuels_2021_v35_p762, + annote = {relative or atomic model deviation}, + author = {Jinzhe Zeng and Linfeng Zhang and Han Wang and Tong Zhu}, + title = { + {Exploring the Chemical Space of Linear Alkane Pyrolysis via Deep Potential + GENerator} + }, + journal = {Energy \& Fuels}, + volume = 35, + number = 1, + pages = {762--769}, + year = 2021, + doi = {10.1021/acs.energyfuels.0c03211}, +} diff --git a/backend/find_tensorflow.py b/backend/find_tensorflow.py index a4edfa313d..522ac9044f 100644 --- a/backend/find_tensorflow.py +++ b/backend/find_tensorflow.py @@ -149,12 +149,19 @@ def get_tf_requirement(tf_version: str = "") -> dict: "tensorflow-cpu; platform_machine!='aarch64' and (platform_machine!='arm64' or platform_system != 'Darwin')", "tensorflow; platform_machine=='aarch64' or (platform_machine=='arm64' and platform_system == 'Darwin')", # https://github.com/tensorflow/tensorflow/issues/61830 - "tensorflow-cpu<2.15; platform_system=='Windows'", + "tensorflow-cpu!=2.15.*; platform_system=='Windows'", + # TODO: build(wheel): unpin h5py on aarch64 + # Revert after https://github.com/h5py/h5py/issues/2408 is fixed; + # or set UV_PREFER_BINARY when https://github.com/astral-sh/uv/issues/1794 is resolved. + # 3.6.0 is the first version to have aarch64 wheels. + "h5py>=3.6.0,<3.11.0; platform_system=='Linux' and platform_machine=='aarch64'", *extra_requires, ], "gpu": [ "tensorflow", "tensorflow-metal; platform_machine=='arm64' and platform_system == 'Darwin'", + # See above. 
+ "h5py>=3.6.0,<3.11.0; platform_system=='Linux' and platform_machine=='aarch64'", *extra_requires, ], **extra_select, diff --git a/backend/read_env.py b/backend/read_env.py index 079211d4d7..06f6f0c7e2 100644 --- a/backend/read_env.py +++ b/backend/read_env.py @@ -60,7 +60,7 @@ def get_argument_from_env() -> Tuple[str, list, list, dict, str]: if hipcc_flags is not None: os.environ["HIPFLAGS"] = os.environ.get("HIPFLAGS", "") + " " + hipcc_flags else: - raise RuntimeError("Unsupported DP_VARIANT option: %s" % dp_variant) + raise RuntimeError(f"Unsupported DP_VARIANT option: {dp_variant}") if os.environ.get("DP_BUILD_TESTING", "0") == "1": cmake_args.append("-DBUILD_TESTING:BOOL=TRUE") diff --git a/data/raw/copy_raw.py b/data/raw/copy_raw.py index 69ccdf5c63..2a4078df4d 100755 --- a/data/raw/copy_raw.py +++ b/data/raw/copy_raw.py @@ -85,7 +85,7 @@ def _main(): ) args = parser.parse_args() - print("# copy the system by %s copies" % args.ncopies) # noqa: T201 + print(f"# copy the system by {args.ncopies} copies") # noqa: T201 assert np.all( np.array(args.ncopies, dtype=int) >= np.array([1, 1, 1], dtype=int) ), "number of copies should be larger than or equal to 1" diff --git a/deepmd/cluster/local.py b/deepmd/cluster/local.py index 3c12c9dc85..694f6b8b56 100644 --- a/deepmd/cluster/local.py +++ b/deepmd/cluster/local.py @@ -43,7 +43,7 @@ def get_gpus(): stdout, stderr = p.communicate() if p.returncode != 0: decoded = stderr.decode("UTF-8") - raise RuntimeError("Failed to detect availbe GPUs due to:\n%s" % decoded) + raise RuntimeError(f"Failed to detect availbe GPUs due to:\n{decoded}") decoded = stdout.decode("UTF-8").strip() num_gpus = int(decoded) return list(range(num_gpus)) if num_gpus > 0 else None diff --git a/deepmd/descriptor/descriptor.py b/deepmd/descriptor/descriptor.py index bd731004cb..3e3115b9dd 100644 --- a/deepmd/descriptor/descriptor.py +++ b/deepmd/descriptor/descriptor.py @@ -8,6 +8,7 @@ Dict, List, Optional, + Set, Tuple, ) @@ -282,7 +283,7 @@ def enable_compression( This method is called by others when the descriptor supported compression. """ raise NotImplementedError( - "Descriptor %s doesn't support compression!" % type(self).__name__ + f"Descriptor {type(self).__name__} doesn't support compression!" ) def enable_mixed_precision(self, mixed_prec: Optional[dict] = None) -> None: @@ -298,8 +299,7 @@ def enable_mixed_precision(self, mixed_prec: Optional[dict] = None) -> None: This method is called by others when the descriptor supported compression. """ raise NotImplementedError( - "Descriptor %s doesn't support mixed precision training!" - % type(self).__name__ + f"Descriptor {type(self).__name__} doesn't support mixed precision training!" ) @abstractmethod @@ -350,8 +350,7 @@ def init_variables( This method is called by others when the descriptor supported initialization from the given variables. """ raise NotImplementedError( - "Descriptor %s doesn't support initialization from the given variables!" - % type(self).__name__ + f"Descriptor {type(self).__name__} doesn't support initialization from the given variables!" ) def get_tensor_names(self, suffix: str = "") -> Tuple[str]: @@ -368,7 +367,7 @@ def get_tensor_names(self, suffix: str = "") -> Tuple[str]: Names of tensors """ raise NotImplementedError( - "Descriptor %s doesn't support this property!" % type(self).__name__ + f"Descriptor {type(self).__name__} doesn't support this property!" ) def pass_tensors_from_frz_model( @@ -388,12 +387,12 @@ def pass_tensors_from_frz_model( :meth:`get_tensor_names`. 
""" raise NotImplementedError( - "Descriptor %s doesn't support this method!" % type(self).__name__ + f"Descriptor {type(self).__name__} doesn't support this method!" ) def build_type_exclude_mask( self, - exclude_types: List[Tuple[int, int]], + exclude_types: Set[Tuple[int, int]], ntypes: int, sel: List[int], ndescrpt: int, diff --git a/deepmd/descriptor/loc_frame.py b/deepmd/descriptor/loc_frame.py index ccb66c864d..410cd038ac 100644 --- a/deepmd/descriptor/loc_frame.py +++ b/deepmd/descriptor/loc_frame.py @@ -427,12 +427,8 @@ def init_variables( suffix : str, optional The suffix of the scope """ - self.davg = get_tensor_by_name_from_graph( - graph, "descrpt_attr%s/t_avg" % suffix - ) - self.dstd = get_tensor_by_name_from_graph( - graph, "descrpt_attr%s/t_std" % suffix - ) + self.davg = get_tensor_by_name_from_graph(graph, f"descrpt_attr{suffix}/t_avg") + self.dstd = get_tensor_by_name_from_graph(graph, f"descrpt_attr{suffix}/t_std") @classmethod def update_sel(cls, global_jdata: dict, local_jdata: dict): diff --git a/deepmd/descriptor/se.py b/deepmd/descriptor/se.py index 598f6f9ff8..064e1c3bf2 100644 --- a/deepmd/descriptor/se.py +++ b/deepmd/descriptor/se.py @@ -130,12 +130,8 @@ def init_variables( self.embedding_net_variables = get_embedding_net_variables_from_graph_def( graph_def, suffix=suffix ) - self.davg = get_tensor_by_name_from_graph( - graph, "descrpt_attr%s/t_avg" % suffix - ) - self.dstd = get_tensor_by_name_from_graph( - graph, "descrpt_attr%s/t_std" % suffix - ) + self.davg = get_tensor_by_name_from_graph(graph, f"descrpt_attr{suffix}/t_avg") + self.dstd = get_tensor_by_name_from_graph(graph, f"descrpt_attr{suffix}/t_std") @property def precision(self) -> tf.DType: diff --git a/deepmd/descriptor/se_a.py b/deepmd/descriptor/se_a.py index 3a924f796a..f3e62d3672 100644 --- a/deepmd/descriptor/se_a.py +++ b/deepmd/descriptor/se_a.py @@ -274,6 +274,18 @@ def __init__( sel_a=self.sel_a, sel_r=self.sel_r, ) + if len(self.exclude_types): + # exclude types applied to data stat + mask = self.build_type_exclude_mask( + self.exclude_types, + self.ntypes, + self.sel_a, + self.ndescrpt, + # for data stat, nloc == nall + self.place_holders["type"], + tf.size(self.place_holders["type"]), + ) + self.stat_descrpt *= tf.reshape(mask, tf.shape(self.stat_descrpt)) self.sub_sess = tf.Session(graph=sub_graph, config=default_tf_session_config) self.original_sel = None self.multi_task = multi_task @@ -528,12 +540,8 @@ def enable_compression( min_nbor_dist, table_extrapolate, table_stride_1, table_stride_2 ) - self.davg = get_tensor_by_name_from_graph( - graph, "descrpt_attr%s/t_avg" % suffix - ) - self.dstd = get_tensor_by_name_from_graph( - graph, "descrpt_attr%s/t_std" % suffix - ) + self.davg = get_tensor_by_name_from_graph(graph, f"descrpt_attr{suffix}/t_avg") + self.dstd = get_tensor_by_name_from_graph(graph, f"descrpt_attr{suffix}/t_std") def enable_mixed_precision(self, mixed_prec: Optional[dict] = None) -> None: """Reveive the mixed precision setting. @@ -1279,14 +1287,14 @@ def init_variables( super().init_variables(graph=graph, graph_def=graph_def, suffix=suffix) try: self.original_sel = get_tensor_by_name_from_graph( - graph, "descrpt_attr%s/original_sel" % suffix + graph, f"descrpt_attr{suffix}/original_sel" ) except GraphWithoutTensorError: # original_sel is not restored in old graphs, assume sel never changed before pass # check sel == original sel? 
try: - sel = get_tensor_by_name_from_graph(graph, "descrpt_attr%s/sel" % suffix) + sel = get_tensor_by_name_from_graph(graph, f"descrpt_attr{suffix}/sel") except GraphWithoutTensorError: # sel is not restored in old graphs pass diff --git a/deepmd/descriptor/se_a_mask.py b/deepmd/descriptor/se_a_mask.py index d573755ea5..c5770721f6 100644 --- a/deepmd/descriptor/se_a_mask.py +++ b/deepmd/descriptor/se_a_mask.py @@ -307,8 +307,9 @@ def build( aparam[:, :] is the real/virtual sign for each atom. """ aparam = input_dict["aparam"] - with tf.variable_scope("fitting_attr" + suffix, reuse=reuse): - t_aparam_nall = tf.constant(True, name="aparam_nall", dtype=tf.bool) + t_aparam_nall = tf.constant( + True, name=f"fitting_attr{suffix}/aparam_nall", dtype=tf.bool + ) self.mask = tf.cast(aparam, tf.int32) self.mask = tf.reshape(self.mask, [-1, natoms[1]]) diff --git a/deepmd/descriptor/se_atten.py b/deepmd/descriptor/se_atten.py index 8c1a179923..5615863254 100644 --- a/deepmd/descriptor/se_atten.py +++ b/deepmd/descriptor/se_atten.py @@ -4,6 +4,7 @@ from typing import ( List, Optional, + Set, Tuple, ) @@ -117,7 +118,7 @@ class DescrptSeAtten(DescrptSeA): stripped_type_embedding Whether to strip the type embedding into a separated embedding network. Default value will be True in `se_atten_v2` descriptor. - smooth_type_embdding + smooth_type_embedding When using stripped type embedding, whether to dot smooth factor on the network output of type embedding to keep the network smooth, instead of setting `set_davg_zero` to be True. Default value will be True in `se_atten_v2` descriptor. @@ -151,10 +152,12 @@ def __init__( attn_mask: bool = False, multi_task: bool = False, stripped_type_embedding: bool = False, - smooth_type_embdding: bool = False, + smooth_type_embedding: bool = False, **kwargs, ) -> None: - if not set_davg_zero and not (stripped_type_embedding and smooth_type_embdding): + if not set_davg_zero and not ( + stripped_type_embedding and smooth_type_embedding + ): warnings.warn( "Set 'set_davg_zero' False in descriptor 'se_atten' " "may cause unexpected incontinuity during model inference!" 
@@ -187,7 +190,7 @@ def __init__( if ntypes == 0: raise ValueError("`model/type_map` is not set or empty!") self.stripped_type_embedding = stripped_type_embedding - self.smooth = smooth_type_embdding + self.smooth = smooth_type_embedding self.ntypes = ntypes self.att_n = attn self.attn_layer = attn_layer @@ -250,6 +253,19 @@ def __init__( sel_a=self.sel_all_a, sel_r=self.sel_all_r, ) + if len(self.exclude_types): + # exclude types applied to data stat + mask = self.build_type_exclude_mask_mixed( + self.exclude_types, + self.ntypes, + self.sel_a, + self.ndescrpt, + # for data stat, nloc == nall + self.place_holders["type"], + tf.size(self.place_holders["type"]), + self.nei_type_vec_t, # extra input for atten + ) + self.stat_descrpt *= tf.reshape(mask, tf.shape(self.stat_descrpt)) self.sub_sess = tf.Session(graph=sub_graph, config=default_tf_session_config) def compute_input_stats( @@ -431,12 +447,8 @@ def enable_compression( ) self.two_embd = make_data(self, self.final_type_embedding) - self.davg = get_tensor_by_name_from_graph( - graph, "descrpt_attr%s/t_avg" % suffix - ) - self.dstd = get_tensor_by_name_from_graph( - graph, "descrpt_attr%s/t_std" % suffix - ) + self.davg = get_tensor_by_name_from_graph(graph, f"descrpt_attr{suffix}/t_avg") + self.dstd = get_tensor_by_name_from_graph(graph, f"descrpt_attr{suffix}/t_std") def build( self, @@ -640,7 +652,7 @@ def _pass_filter( inputs_i = tf.reshape(inputs_i, [-1, self.ndescrpt]) type_i = -1 if len(self.exclude_types): - mask = self.build_type_exclude_mask( + mask = self.build_type_exclude_mask_mixed( self.exclude_types, self.ntypes, self.sel_a, @@ -658,6 +670,14 @@ def _pass_filter( tf.reshape(self.avg_looked_up, [-1, 1]), [1, self.ndescrpt] ), ) + self.recovered_switch *= tf.reshape( + tf.slice( + tf.reshape(tf.cast(mask, self.filter_precision), [-1, 4]), + [0, 0], + [-1, 1], + ), + [-1, natoms[0], self.sel_all_a[0]], + ) else: inputs_i *= mask if nvnmd_cfg.enable and nvnmd_cfg.quantize_descriptor: @@ -1335,9 +1355,9 @@ def init_variables( ) ) - def build_type_exclude_mask( + def build_type_exclude_mask_mixed( self, - exclude_types: List[Tuple[int, int]], + exclude_types: Set[Tuple[int, int]], ntypes: int, sel: List[int], ndescrpt: int, diff --git a/deepmd/descriptor/se_atten_v2.py b/deepmd/descriptor/se_atten_v2.py index 784e02d84d..01c4d93ad8 100644 --- a/deepmd/descriptor/se_atten_v2.py +++ b/deepmd/descriptor/se_atten_v2.py @@ -110,6 +110,6 @@ def __init__( attn_mask=attn_mask, multi_task=multi_task, stripped_type_embedding=True, - smooth_type_embdding=True, + smooth_type_embedding=True, **kwargs, ) diff --git a/deepmd/descriptor/se_r.py b/deepmd/descriptor/se_r.py index 062fd3c8a6..d5f8e59d18 100644 --- a/deepmd/descriptor/se_r.py +++ b/deepmd/descriptor/se_r.py @@ -185,6 +185,18 @@ def __init__( rcut_smth=self.rcut_smth, sel=self.sel_r, ) + if len(self.exclude_types): + # exclude types applied to data stat + mask = self.build_type_exclude_mask( + self.exclude_types, + self.ntypes, + self.sel_r, + self.ndescrpt, + # for data stat, nloc == nall + self.place_holders["type"], + tf.size(self.place_holders["type"]), + ) + self.stat_descrpt *= tf.reshape(mask, tf.shape(self.stat_descrpt)) self.sub_sess = tf.Session( graph=sub_graph, config=default_tf_session_config ) @@ -353,12 +365,8 @@ def enable_compression( min_nbor_dist, table_extrapolate, table_stride_1, table_stride_2 ) - self.davg = get_tensor_by_name_from_graph( - graph, "descrpt_attr%s/t_avg" % suffix - ) - self.dstd = get_tensor_by_name_from_graph( - graph, "descrpt_attr%s/t_std" 
% suffix - ) + self.davg = get_tensor_by_name_from_graph(graph, f"descrpt_attr{suffix}/t_avg") + self.dstd = get_tensor_by_name_from_graph(graph, f"descrpt_attr{suffix}/t_std") def build( self, diff --git a/deepmd/descriptor/se_t.py b/deepmd/descriptor/se_t.py index 86e5ca6a1e..906ca144c4 100644 --- a/deepmd/descriptor/se_t.py +++ b/deepmd/descriptor/se_t.py @@ -368,12 +368,8 @@ def enable_compression( min_nbor_dist, table_extrapolate, table_stride_1 * 10, table_stride_2 * 10 ) - self.davg = get_tensor_by_name_from_graph( - graph, "descrpt_attr%s/t_avg" % suffix - ) - self.dstd = get_tensor_by_name_from_graph( - graph, "descrpt_attr%s/t_std" % suffix - ) + self.davg = get_tensor_by_name_from_graph(graph, f"descrpt_attr{suffix}/t_avg") + self.dstd = get_tensor_by_name_from_graph(graph, f"descrpt_attr{suffix}/t_std") def build( self, diff --git a/deepmd/entrypoints/compress.py b/deepmd/entrypoints/compress.py index 61d6dfcb44..85f5ed4e74 100644 --- a/deepmd/entrypoints/compress.py +++ b/deepmd/entrypoints/compress.py @@ -101,11 +101,10 @@ def compress( except GraphWithoutTensorError as e: if training_script is None: raise RuntimeError( - "The input frozen model: %s has no training script or min_nbor_dist information, " + f"The input frozen model: {input} has no training script or min_nbor_dist information, " "which is not supported by the model compression interface. " "Please consider using the --training-script command within the model compression interface to provide the training script of the input frozen model. " "Note that the input training script must contain the correct path to the training data." - % input ) from e elif not os.path.exists(training_script): raise RuntimeError( @@ -160,10 +159,10 @@ def compress( ) except GraphTooLargeError as e: raise RuntimeError( - "The uniform step size of the tabulation's first table is %f, " + f"The uniform step size of the tabulation's first table is {step:f}, " "which is too small. This leads to a very large graph size, " "exceeding protobuf's limitation (2 GB). You should try to " - "increase the step size." % step + "increase the step size." ) from e # reset the graph, otherwise the size limitation will be only 2 GB / 2 = 1 GB @@ -176,10 +175,10 @@ def compress( freeze(checkpoint_folder=checkpoint_folder, output=output, node_names=None) except GraphTooLargeError as e: raise RuntimeError( - "The uniform step size of the tabulation's first table is %f, " + f"The uniform step size of the tabulation's first table is {step:f}, " "which is too small. This leads to a very large graph size, " "exceeding protobuf's limitation (2 GB). You should try to " - "increase the step size." % step + "increase the step size." ) from e diff --git a/deepmd/entrypoints/freeze.py b/deepmd/entrypoints/freeze.py index 543e89b4ab..ddb9d3cf68 100755 --- a/deepmd/entrypoints/freeze.py +++ b/deepmd/entrypoints/freeze.py @@ -357,13 +357,21 @@ def freeze_graph( output_node = _make_node_names( freeze_type, modifier, out_suffix=out_suffix, node_names=node_names ) + # see #3334 + optional_node = [ + "train_attr/min_nbor_dist", + "fitting_attr/aparam_nall", + "spin_attr/ntypes_spin", + ] different_set = set(output_node) - set(input_node) if different_set: - log.warning( - "The following nodes are not in the graph: %s. " - "Skip freezeing these nodes. You may be freezing " - "a checkpoint generated by an old version." % different_set - ) + different_set -= set(optional_node) + if different_set: + log.warning( + f"The following nodes are not in the graph: {different_set}. 
" + "Skip freezeing these nodes. You may be freezing " + "a checkpoint generated by an old version." + ) # use intersection as output list output_node = list(set(output_node) & set(input_node)) log.info(f"The following nodes will be frozen: {output_node}") diff --git a/deepmd/entrypoints/neighbor_stat.py b/deepmd/entrypoints/neighbor_stat.py index 28cab00ad2..1c082322b5 100644 --- a/deepmd/entrypoints/neighbor_stat.py +++ b/deepmd/entrypoints/neighbor_stat.py @@ -59,6 +59,6 @@ def neighbor_stat( data.get_batch() nei = NeighborStat(data.get_ntypes(), rcut, one_type=one_type) min_nbor_dist, max_nbor_size = nei.get_stat(data) - log.info("min_nbor_dist: %f" % min_nbor_dist) - log.info("max_nbor_size: %s" % str(max_nbor_size)) + log.info(f"min_nbor_dist: {min_nbor_dist:f}") + log.info(f"max_nbor_size: {max_nbor_size!s}") return min_nbor_dist, max_nbor_size diff --git a/deepmd/entrypoints/test.py b/deepmd/entrypoints/test.py index 7bd4883925..1a8e507639 100644 --- a/deepmd/entrypoints/test.py +++ b/deepmd/entrypoints/test.py @@ -410,14 +410,14 @@ def test_ener( save_txt_file( detail_path.with_suffix(".e.out"), pe, - header="%s: data_e pred_e" % system, + header=f"{system}: data_e pred_e", append=append_detail, ) pe_atom = pe / natoms save_txt_file( detail_path.with_suffix(".e_peratom.out"), pe_atom, - header="%s: data_e pred_e" % system, + header=f"{system}: data_e pred_e", append=append_detail, ) if dp.get_ntypes_spin() == 0: @@ -431,7 +431,7 @@ def test_ener( save_txt_file( detail_path.with_suffix(".f.out"), pf, - header="%s: data_fx data_fy data_fz pred_fx pred_fy pred_fz" % system, + header=f"{system}: data_fx data_fy data_fz pred_fx pred_fy pred_fz", append=append_detail, ) else: @@ -446,14 +446,13 @@ def test_ener( save_txt_file( detail_path.with_suffix(".fr.out"), pf_real, - header="%s: data_fx data_fy data_fz pred_fx pred_fy pred_fz" % system, + header=f"{system}: data_fx data_fy data_fz pred_fx pred_fy pred_fz", append=append_detail, ) save_txt_file( detail_path.with_suffix(".fm.out"), pf_mag, - header="%s: data_fmx data_fmy data_fmz pred_fmx pred_fmy pred_fmz" - % system, + header=f"{system}: data_fmx data_fmy data_fmz pred_fmx pred_fmy pred_fmz", append=append_detail, ) pv = np.concatenate( diff --git a/deepmd/fit/dos.py b/deepmd/fit/dos.py index bbf7d39a09..57059b1387 100644 --- a/deepmd/fit/dos.py +++ b/deepmd/fit/dos.py @@ -587,21 +587,21 @@ def init_variables( self.fitting_net_variables.update(shared_variables) if self.numb_fparam > 0: self.fparam_avg = get_tensor_by_name_from_graph( - graph, "fitting_attr%s/t_fparam_avg" % suffix + graph, f"fitting_attr{suffix}/t_fparam_avg" ) self.fparam_inv_std = get_tensor_by_name_from_graph( - graph, "fitting_attr%s/t_fparam_istd" % suffix + graph, f"fitting_attr{suffix}/t_fparam_istd" ) if self.numb_aparam > 0: self.aparam_avg = get_tensor_by_name_from_graph( - graph, "fitting_attr%s/t_aparam_avg" % suffix + graph, f"fitting_attr{suffix}/t_aparam_avg" ) self.aparam_inv_std = get_tensor_by_name_from_graph( - graph, "fitting_attr%s/t_aparam_istd" % suffix + graph, f"fitting_attr{suffix}/t_aparam_istd" ) try: self.bias_dos = get_tensor_by_name_from_graph( - graph, "fitting_attr%s/t_bias_dos" % suffix + graph, f"fitting_attr{suffix}/t_bias_dos" ) except GraphWithoutTensorError: # for compatibility, old models has no t_bias_dos diff --git a/deepmd/fit/ener.py b/deepmd/fit/ener.py index 4610384d7e..e417076fce 100644 --- a/deepmd/fit/ener.py +++ b/deepmd/fit/ener.py @@ -754,21 +754,21 @@ def init_variables( 
self.fitting_net_variables.update(shared_variables) if self.numb_fparam > 0: self.fparam_avg = get_tensor_by_name_from_graph( - graph, "fitting_attr%s/t_fparam_avg" % suffix + graph, f"fitting_attr{suffix}/t_fparam_avg" ) self.fparam_inv_std = get_tensor_by_name_from_graph( - graph, "fitting_attr%s/t_fparam_istd" % suffix + graph, f"fitting_attr{suffix}/t_fparam_istd" ) if self.numb_aparam > 0: self.aparam_avg = get_tensor_by_name_from_graph( - graph, "fitting_attr%s/t_aparam_avg" % suffix + graph, f"fitting_attr{suffix}/t_aparam_avg" ) self.aparam_inv_std = get_tensor_by_name_from_graph( - graph, "fitting_attr%s/t_aparam_istd" % suffix + graph, f"fitting_attr{suffix}/t_aparam_istd" ) try: self.bias_atom_e = get_tensor_by_name_from_graph( - graph, "fitting_attr%s/t_bias_atom_e" % suffix + graph, f"fitting_attr{suffix}/t_bias_atom_e" ) except GraphWithoutTensorError: # for compatibility, old models has no t_bias_atom_e diff --git a/deepmd/fit/fitting.py b/deepmd/fit/fitting.py index a467ec1201..61af88a82b 100644 --- a/deepmd/fit/fitting.py +++ b/deepmd/fit/fitting.py @@ -82,8 +82,7 @@ def init_variables( This method is called by others when the fitting supported initialization from the given variables. """ raise NotImplementedError( - "Fitting %s doesn't support initialization from the given variables!" - % type(self).__name__ + f"Fitting {type(self).__name__} doesn't support initialization from the given variables!" ) @abstractmethod diff --git a/deepmd/infer/deep_pot.py b/deepmd/infer/deep_pot.py index 81cfdde7a8..ea72d1330b 100644 --- a/deepmd/infer/deep_pot.py +++ b/deepmd/infer/deep_pot.py @@ -124,7 +124,7 @@ def __init__( # check if the graph has these operations: # if yes add them - if ("%s/t_efield" % load_prefix) in operations: + if (f"{load_prefix}/t_efield") in operations: self.tensors.update({"t_efield": "t_efield:0"}) self.has_efield = True else: @@ -132,7 +132,7 @@ def __init__( self.t_efield = None self.has_efield = False - if ("%s/t_fparam" % load_prefix) in operations: + if (f"{load_prefix}/t_fparam") in operations: self.tensors.update({"t_fparam": "t_fparam:0"}) self.has_fparam = True else: @@ -140,7 +140,7 @@ def __init__( self.t_fparam = None self.has_fparam = False - if ("%s/t_aparam" % load_prefix) in operations: + if (f"{load_prefix}/t_aparam") in operations: self.tensors.update({"t_aparam": "t_aparam:0"}) self.has_aparam = True else: @@ -148,7 +148,7 @@ def __init__( self.t_aparam = None self.has_aparam = False - if ("%s/spin_attr/ntypes_spin" % load_prefix) in operations: + if (f"{load_prefix}/spin_attr/ntypes_spin") in operations: self.tensors.update({"t_ntypes_spin": "spin_attr/ntypes_spin:0"}) self.has_spin = True else: diff --git a/deepmd/model/dos.py b/deepmd/model/dos.py index 22e291a0f0..76329b5798 100644 --- a/deepmd/model/dos.py +++ b/deepmd/model/dos.py @@ -228,6 +228,6 @@ def init_variables( self.fitting.init_variables(graph, graph_def, suffix=suffix) tf.constant("compressed_model", name="model_type", dtype=tf.string) else: - raise RuntimeError("Unknown model type %s" % model_type) + raise RuntimeError(f"Unknown model type {model_type}") if self.typeebd is not None: self.typeebd.init_variables(graph, graph_def, suffix=suffix) diff --git a/deepmd/model/ener.py b/deepmd/model/ener.py index 0d8d66b305..7f665fe2c3 100644 --- a/deepmd/model/ener.py +++ b/deepmd/model/ener.py @@ -375,7 +375,7 @@ def init_variables( self.fitting.init_variables(graph, graph_def, suffix=suffix) tf.constant("compressed_model", name="model_type", dtype=tf.string) else: - raise 
RuntimeError("Unknown model type %s" % model_type) + raise RuntimeError(f"Unknown model type {model_type}") if ( self.typeebd is not None and self.typeebd.type_embedding_net_variables is None diff --git a/deepmd/model/model.py b/deepmd/model/model.py index 6117b4942d..3f2fde415f 100644 --- a/deepmd/model/model.py +++ b/deepmd/model/model.py @@ -301,11 +301,11 @@ def build_descrpt( else: tf.constant( self.rcut, - name="descrpt_attr%s/rcut" % suffix, + name=f"descrpt_attr{suffix}/rcut", dtype=GLOBAL_TF_FLOAT_PRECISION, ) tf.constant( - self.ntypes, name="descrpt_attr%s/ntypes" % suffix, dtype=tf.int32 + self.ntypes, name=f"descrpt_attr{suffix}/ntypes", dtype=tf.int32 ) if "global_feed_dict" in input_dict: feed_dict = input_dict["global_feed_dict"] @@ -320,7 +320,7 @@ def build_descrpt( ) return_elements = [ *self.descrpt.get_tensor_names(suffix=suffix), - "o_descriptor%s:0" % suffix, + f"o_descriptor{suffix}:0", ] if frz_model is not None: imported_tensors = self._import_graph_def_from_frz_model( diff --git a/deepmd/model/tensor.py b/deepmd/model/tensor.py index 6a21e085f3..9564e9b903 100644 --- a/deepmd/model/tensor.py +++ b/deepmd/model/tensor.py @@ -234,7 +234,7 @@ def init_variables( self.fitting.init_variables(graph, graph_def, suffix=suffix) tf.constant("compressed_model", name="model_type", dtype=tf.string) else: - raise RuntimeError("Unknown model type %s" % model_type) + raise RuntimeError(f"Unknown model type {model_type}") class WFCModel(TensorModel): diff --git a/deepmd/nvnmd/entrypoints/train.py b/deepmd/nvnmd/entrypoints/train.py index 6e14b6f865..439ebaed0a 100644 --- a/deepmd/nvnmd/entrypoints/train.py +++ b/deepmd/nvnmd/entrypoints/train.py @@ -126,7 +126,7 @@ def train_nvnmd( ): # test input if not os.path.exists(INPUT): - log.warning("The input script %s does not exist" % (INPUT)) + log.warning(f"The input script {INPUT} does not exist") # STEP1 PATH_CNN = "nvnmd_cnn" CONFIG_CNN = os.path.join(PATH_CNN, "config.npy") diff --git a/deepmd/nvnmd/entrypoints/wrap.py b/deepmd/nvnmd/entrypoints/wrap.py index 1ba2ed7384..868afbed93 100644 --- a/deepmd/nvnmd/entrypoints/wrap.py +++ b/deepmd/nvnmd/entrypoints/wrap.py @@ -137,7 +137,7 @@ def wrap(self): # DEVELOP_DEBUG if jdata_sys["debug"]: log.info("%s: %d x % d bit" % (k, h, w * 4)) - FioTxt().save("nvnmd/wrap/h%s.txt" % (k), d) + FioTxt().save(f"nvnmd/wrap/h{k}.txt", d) datas[ii] = d # update h & w of nvnmd_cfg nvnmd_cfg.size["NH_DATA"] = nhs diff --git a/deepmd/nvnmd/utils/fio.py b/deepmd/nvnmd/utils/fio.py index 82567e3917..3efd7520dd 100644 --- a/deepmd/nvnmd/utils/fio.py +++ b/deepmd/nvnmd/utils/fio.py @@ -180,7 +180,7 @@ def save(self, file_name: str, data: List[str]): buff.extend(list(bytearray.fromhex(si))[::-1]) # with open(file_name, "wb") as fp: - fp.write(struct.pack("%sB" % len(buff), *buff)) + fp.write(struct.pack(f"{len(buff)}B", *buff)) class FioTxt: diff --git a/deepmd/train/trainer.py b/deepmd/train/trainer.py index 719250e7fb..d059aa84cc 100644 --- a/deepmd/train/trainer.py +++ b/deepmd/train/trainer.py @@ -239,7 +239,7 @@ def build(self, data=None, stop_batch=0, origin_type_map=None, suffix=""): ) else: log.info( - "fitting net %s training without frame parameter" % fitting_key + f"fitting net {fitting_key} training without frame parameter" ) if not self.is_compress: @@ -437,8 +437,7 @@ def _build_optimizer(self, fitting_key=None): _TF_VERSION = Version(TF_VERSION) if _TF_VERSION < Version("1.14.0"): raise RuntimeError( - "TensorFlow version %s is not compatible with the mixed precision setting. 
Please consider upgrading your TF version!" - % TF_VERSION + f"TensorFlow version {TF_VERSION} is not compatible with the mixed precision setting. Please consider upgrading your TF version!" ) elif _TF_VERSION < Version("2.4.0"): optimizer = tf.train.experimental.enable_mixed_precision_graph_rewrite( @@ -502,14 +501,14 @@ def _init_session(self): fp = open(self.disp_file, "w") fp.close() elif self.run_opt.init_mode == "init_from_model": - log.info("initialize from model %s" % self.run_opt.init_model) + log.info(f"initialize from model {self.run_opt.init_model}") run_sess(self.sess, init_op) self.saver.restore(self.sess, self.run_opt.init_model) run_sess(self.sess, self.global_step.assign(0)) fp = open(self.disp_file, "w") fp.close() elif self.run_opt.init_mode == "restart": - log.info("restart from model %s" % self.run_opt.restart) + log.info(f"restart from model {self.run_opt.restart}") run_sess(self.sess, init_op) self.saver.restore(self.sess, self.run_opt.restart) elif self.run_opt.init_mode == "init_from_frz_model": @@ -844,7 +843,7 @@ def save_checkpoint(self, cur_batch: int): os.symlink(os.path.relpath(ori_ff, os.path.dirname(new_ff)), new_ff) else: shutil.copyfile(ori_ff, new_ff) - log.info("saved checkpoint %s" % self.save_ckpt) + log.info(f"saved checkpoint {self.save_ckpt}") def get_feed_dict(self, batch, is_training): feed_dict = {} @@ -970,7 +969,7 @@ def print_on_training( prop_fmt = " %11.2e" for k in train_results.keys(): print_str += prop_fmt % (train_results[k]) - print_str += " %8.1e\n" % cur_lr + print_str += f" {cur_lr:8.1e}\n" else: for fitting_key in train_results: if valid_results[fitting_key] is not None: @@ -985,7 +984,7 @@ def print_on_training( prop_fmt = " %11.2e" for k in train_results[fitting_key].keys(): print_str += prop_fmt % (train_results[fitting_key][k]) - print_str += " %8.1e\n" % cur_lr_dict[fitting_key] + print_str += f" {cur_lr_dict[fitting_key]:8.1e}\n" fp.write(print_str) fp.flush() @@ -1063,9 +1062,8 @@ def _init_from_frz_model(self): except GraphWithoutTensorError as e: # throw runtime error if the frozen_model has no model type information... raise RuntimeError( - "The input frozen model: %s has no 'model_type' information, " + f"The input frozen model: {self.run_opt.init_frz_model} has no 'model_type' information, " "which is not supported by the 'dp train init-frz-model' interface. " - % self.run_opt.init_frz_model ) from e else: self.model_type = bytes.decode(t_model_type) @@ -1117,9 +1115,8 @@ def _init_from_pretrained_model( except GraphWithoutTensorError as e: # throw runtime error if the frozen_model has no model type information... raise RuntimeError( - "The input frozen pretrained model: %s has no 'model_type' information, " + f"The input frozen pretrained model: {self.run_opt.finetune} has no 'model_type' information, " "which is not supported by the 'dp train finetune' interface. " - % self.run_opt.finetune ) from e else: self.model_type = bytes.decode(t_model_type) diff --git a/deepmd/utils/convert.py b/deepmd/utils/convert.py index 13e07f0885..ff90b596d2 100644 --- a/deepmd/utils/convert.py +++ b/deepmd/utils/convert.py @@ -77,8 +77,7 @@ def convert_to_21(input_model: str, output_model: str, version: Optional[str] = convert_pb_to_pbtxt(input_model, "frozen_model.pbtxt") if version is None: raise ValueError( - "The version of the DP graph %s cannot be detected. Please do the conversion manually." - % (input_model) + f"The version of the DP graph {input_model} cannot be detected. Please do the conversion manually." 
) if version in SpecifierSet("<1.0"): convert_dp012_to_dp10("frozen_model.pbtxt") diff --git a/deepmd/utils/finetune.py b/deepmd/utils/finetune.py index 922d131b7e..84b0da962f 100644 --- a/deepmd/utils/finetune.py +++ b/deepmd/utils/finetune.py @@ -33,10 +33,9 @@ def replace_model_params_with_pretrained_model( t_jdata = get_tensor_by_name(pretrained_model, "train_attr/training_script") except GraphWithoutTensorError as e: raise RuntimeError( - "The input frozen pretrained model: %s has no training script, " + f"The input frozen pretrained model: {input} has no training script, " "which is not supported to perform finetuning. " "Please use the model pretrained with v2.1.5 or higher version of DeePMD-kit." - % input ) from e pretrained_jdata = json.loads(t_jdata) diff --git a/deepmd/utils/multi_init.py b/deepmd/utils/multi_init.py index d29a42cf0f..83de69e3a0 100644 --- a/deepmd/utils/multi_init.py +++ b/deepmd/utils/multi_init.py @@ -33,10 +33,9 @@ def replace_model_params_with_frz_multi_model( t_jdata = get_tensor_by_name(pretrained_model, "train_attr/training_script") except GraphWithoutTensorError as e: raise RuntimeError( - "The input frozen pretrained model: %s has no training script, " + f"The input frozen pretrained model: {input} has no training script, " "which is not supported to perform multi-task training. " "Please use the model pretrained with v2.1.5 or higher version of DeePMD-kit." - % input ) from e pretrained_jdata = json.loads(t_jdata) diff --git a/deepmd/utils/neighbor_stat.py b/deepmd/utils/neighbor_stat.py index 982ead3549..51c8c99658 100644 --- a/deepmd/utils/neighbor_stat.py +++ b/deepmd/utils/neighbor_stat.py @@ -210,16 +210,15 @@ def get_stat(self, data: DeepmdDataSystem) -> Tuple[float, np.ndarray]: for mn, dt, jj in self.iterator(data): if np.isinf(dt): log.warning( - "Atoms with no neighbors found in %s. Please make sure it's what you expected." - % jj + f"Atoms with no neighbors found in {jj}. Please make sure it's what you expected." ) if dt < min_nbor_dist: if math.isclose(dt, 0.0, rel_tol=1e-6): # it's unexpected that the distance between two atoms is zero # zero distance will cause nan (#874) raise RuntimeError( - "Some atoms are overlapping in %s. Please check your" - " training data to remove duplicated atoms." % jj + f"Some atoms are overlapping in {jj}. Please check your" + " training data to remove duplicated atoms." ) min_nbor_dist = dt max_nbor_size = np.maximum(mn, max_nbor_size) diff --git a/deepmd_utils/entrypoints/doc.py b/deepmd_utils/entrypoints/doc.py index 2c2c5e8451..457796c026 100644 --- a/deepmd_utils/entrypoints/doc.py +++ b/deepmd_utils/entrypoints/doc.py @@ -16,5 +16,5 @@ def doc_train_input(*, out_type: str = "rst", **kwargs): elif out_type == "json": doc_str = gen_json() else: - raise RuntimeError("Unsupported out type %s" % out_type) + raise RuntimeError(f"Unsupported out type {out_type}") print(doc_str) # noqa: T201 diff --git a/deepmd_utils/env.py b/deepmd_utils/env.py index b1d4958ed8..75a3ecf288 100644 --- a/deepmd_utils/env.py +++ b/deepmd_utils/env.py @@ -22,7 +22,7 @@ global_float_prec = "float" else: raise RuntimeError( - "Unsupported float precision option: %s. Supported: high," + f"Unsupported float precision option: {dp_float_prec}. Supported: high," "low. Please set precision with environmental variable " - "DP_INTERFACE_PREC." % dp_float_prec + "DP_INTERFACE_PREC." 
) diff --git a/deepmd_utils/main.py b/deepmd_utils/main.py index ae4852acc9..82dacdbac2 100644 --- a/deepmd_utils/main.py +++ b/deepmd_utils/main.py @@ -544,7 +544,7 @@ def main_parser() -> argparse.ArgumentParser: # --version parser.add_argument( - "--version", action="version", version="DeePMD-kit v%s" % __version__ + "--version", action="version", version=f"DeePMD-kit v{__version__}" ) # * train nvnmd script ****************************************************************** diff --git a/deepmd_utils/utils/argcheck.py b/deepmd_utils/utils/argcheck.py index d32d22e359..29886dd54f 100644 --- a/deepmd_utils/utils/argcheck.py +++ b/deepmd_utils/utils/argcheck.py @@ -365,7 +365,7 @@ def descrpt_se_atten_common_args(): doc_seed = "Random seed for parameter initialization" doc_exclude_types = "The excluded pairs of types which have no interaction with each other. For example, `[[0, 1]]` means no interaction between type 0 and type 1." doc_attn = "The length of hidden vectors in attention layers" - doc_attn_layer = "The number of attention layers. Note that model compression of `se_atten` is only enabled when attn_layer==0 and stripped_type_embedding is True" + doc_attn_layer = "The number of attention layers." doc_attn_dotr = "Whether to do dot product with the normalized relative coordinates" doc_attn_mask = "Whether to do mask on the diagonal in the attention matrix" @@ -417,7 +417,7 @@ @descrpt_args_plugin.register("se_atten") def descrpt_se_atten_args(): doc_stripped_type_embedding = "Whether to strip the type embedding into a separated embedding network. Setting it to `False` will fall back to the previous version of `se_atten` which is non-compressible." - doc_smooth_type_embdding = "When using stripped type embedding, whether to dot smooth factor on the network output of type embedding to keep the network smooth, instead of setting `set_davg_zero` to be True." + doc_smooth_type_embedding = "When using stripped type embedding, whether to multiply the network output of the type embedding by a smoothing factor to keep the network smooth, instead of setting `set_davg_zero` to `True`." doc_set_davg_zero = "Set the normalization average to zero. This option should be set when `se_atten` descriptor or `atom_ener` in the energy fitting is used" return [ @@ -430,11 +430,12 @@ def descrpt_se_atten_args(): doc=doc_stripped_type_embedding, ), Argument( - "smooth_type_embdding", + "smooth_type_embedding", bool, optional=True, default=False, - doc=doc_smooth_type_embdding, + alias=["smooth_type_embdding"], + doc=doc_smooth_type_embedding, ), Argument( "set_davg_zero", bool, optional=True, default=True, doc=doc_set_davg_zero diff --git a/deepmd_utils/utils/batch_size.py b/deepmd_utils/utils/batch_size.py index 1b93a51242..8a60cc69fb 100644 --- a/deepmd_utils/utils/batch_size.py +++ b/deepmd_utils/utils/batch_size.py @@ -62,6 +62,11 @@ def __init__(self, initial_batch_size: int = 1024, factor: float = 2.0) -> None: self.maximum_working_batch_size = initial_batch_size if self.is_gpu_available(): self.minimal_not_working_batch_size = 2**31 + log.info( + "If you encounter the error 'an illegal memory access was encountered', this may be due to a TensorFlow issue. " + "To avoid this, set the environment variable DP_INFER_BATCH_SIZE to a smaller value than the last adjusted batch size. " + "The environment variable DP_INFER_BATCH_SIZE controls the inference batch size (nframes * natoms). 
" + ) else: self.minimal_not_working_batch_size = ( self.maximum_working_batch_size + 1 diff --git a/deepmd_utils/utils/data.py b/deepmd_utils/utils/data.py index 534216dfaf..6494d25675 100644 --- a/deepmd_utils/utils/data.py +++ b/deepmd_utils/utils/data.py @@ -359,7 +359,7 @@ def get_natoms_vec(self, ntypes: int): def avg(self, key): """Return the average value of an item.""" if key not in self.data_dict.keys(): - raise RuntimeError("key %s has not been added" % key) + raise RuntimeError(f"key {key} has not been added") info = self.data_dict[key] ndof = info["ndof"] eners = [] @@ -568,7 +568,7 @@ def _load_data( data = np.repeat(data, repeat).reshape([nframes, -1]) return np.float32(1.0), data elif must: - raise RuntimeError("%s not found!" % path) + raise RuntimeError(f"{path} not found!") else: data = np.full([nframes, ndof], default, dtype=dtype) if repeat != 1: diff --git a/deepmd_utils/utils/data_system.py b/deepmd_utils/utils/data_system.py index f83f587590..a2abca85db 100644 --- a/deepmd_utils/utils/data_system.py +++ b/deepmd_utils/utils/data_system.py @@ -559,7 +559,7 @@ def print_summary(self, name): ) log.info("found %d system(s):" % self.nsystems) log.info( - ("%s " % self._format_name_length("system", sys_width)) + ("{} ".format(self._format_name_length("system", sys_width))) + ("%6s %6s %6s %9s %3s" % ("natoms", "bch_sz", "n_bch", "prob", "pbc")) ) for ii in range(self.nsystems): diff --git a/deepmd_utils/utils/path.py b/deepmd_utils/utils/path.py index a8e4bc329f..751ee3731e 100644 --- a/deepmd_utils/utils/path.py +++ b/deepmd_utils/utils/path.py @@ -39,7 +39,7 @@ def __new__(cls, path: str): # assume h5 if it is not dir # TODO: check if it is a real h5? or just check suffix? return super().__new__(DPH5Path) - raise FileNotFoundError("%s not found" % path) + raise FileNotFoundError(f"{path} not found") return super().__new__(cls) @abstractmethod diff --git a/doc/conf.py b/doc/conf.py index fae850a132..09dc43fa68 100644 --- a/doc/conf.py +++ b/doc/conf.py @@ -174,7 +174,7 @@ def setup(app): import typing for typing_type in typing.__all__: - numpydoc_xref_aliases[typing_type] = "typing.%s" % typing_type + numpydoc_xref_aliases[typing_type] = f"typing.{typing_type}" rst_epilog = f""" .. |ACTIVATION_FN| replace:: {list_to_doc(ACTIVATION_FN_DICT.keys())} diff --git a/doc/credits.rst b/doc/credits.rst index 3fbe1d56d8..d60279614b 100644 --- a/doc/credits.rst +++ b/doc/credits.rst @@ -47,7 +47,7 @@ Cite DeePMD-kit and methods .. bibliography:: :filter: False - Zhang_2022_DPA1 + Zhang_NpjComputMater_2024_v10_p94 - If frame-specific parameters (`fparam`, e.g. electronic temperature) is used, diff --git a/doc/freeze/compress.md b/doc/freeze/compress.md index 54b9baf7ca..87d4699d2b 100644 --- a/doc/freeze/compress.md +++ b/doc/freeze/compress.md @@ -148,6 +148,8 @@ The model compression interface requires the version of DeePMD-kit used in the o Descriptors with `se_e2_a`, `se_e3`, `se_e2_r` and `se_atten_v2` types are supported by the model compression feature. `Hybrid` mixed with the above descriptors is also supported. +Notice: Model compression for the `se_atten_v2` descriptor is exclusively designed for models with the training parameter {ref}`attn_layer ` set to 0. + **Available activation functions for descriptor:** - tanh diff --git a/doc/getting-started/quick_start.ipynb b/doc/getting-started/quick_start.ipynb index 67674c4654..67462c91d4 100644 --- a/doc/getting-started/quick_start.ipynb +++ b/doc/getting-started/quick_start.ipynb @@ -396,7 +396,7 @@ } ], "source": [ - "! 
cat DeePMD-kit_Tutorial/00.data/training_data/type.raw" ] }, { diff --git a/doc/model/train-se-atten.md b/doc/model/train-se-atten.md index 5a47170958..fef910b0a7 100644 --- a/doc/model/train-se-atten.md +++ b/doc/model/train-se-atten.md @@ -17,7 +17,11 @@ Attention-based descriptor $\mathcal{D}^i \in \mathbb{R}^{M \times M_{<}}$, whic ``` where $\hat{\mathcal{G}}^i$ represents the embedding matrix $\mathcal{G}^i$ after additional self-attention mechanism and $\mathcal{R}^i$ is defined by the full case in the [`se_e2_a`](./train-se-e2-a.md). -Note that we obtain $\mathcal{G}^i$ using the type embedding method by default in this descriptor. +Note that we obtain $\mathcal{G}^i$ using the type embedding method by default in this descriptor. By default, we concatenate $s(r_{ij})$ with the type embeddings of the central and neighboring atoms, $\mathcal{A}^i$ and $\mathcal{A}^j$, as the input of the embedding network $\mathcal{N}_{e,2}$: + +```math + (\mathcal{G}^i)_j = \mathcal{N}_{e,2}(\{s(r_{ij}), \mathcal{A}^i, \mathcal{A}^j\}) \quad \mathrm{or}\quad(\mathcal{G}^i)_j = \mathcal{N}_{e,2}(\{s(r_{ij}), \mathcal{A}^j\}) +``` To perform the self-attention mechanism, the queries $\mathcal{Q}^{i,l} \in \mathbb{R}^{N_c\times d_k}$, keys $\mathcal{K}^{i,l} \in \mathbb{R}^{N_c\times d_k}$, and values $\mathcal{V}^{i,l} \in \mathbb{R}^{N_c\times d_v}$ are first obtained: @@ -114,12 +118,20 @@ We highly recommend using the version 2.0 of the attention-based descriptor `"se ```json "stripped_type_embedding": true, - "smooth_type_embdding": true, + "smooth_type_embedding": true, "set_davg_zero": false ``` +Use the descriptor `"se_atten_v2"`; you do not need to set `stripped_type_embedding` or `smooth_type_embedding`, since both options default to `true` for this descriptor. When `stripped_type_embedding` is set to `true`, the embedding matrix $\mathcal{G}^i$ is constructed as: + +```math + (\mathcal{G}^i)_j = \mathcal{N}_{e,2}(s(r_{ij})) + \mathcal{N}_{e,2}(s(r_{ij})) \odot (\mathcal{N}_{e,2}(\{\mathcal{A}^i, \mathcal{A}^j\}) \odot s(r_{ij})) \quad \mathrm{or} \quad (\mathcal{G}^i)_j = \mathcal{N}_{e,2}(s(r_{ij})) + \mathcal{N}_{e,2}(s(r_{ij})) \odot (\mathcal{N}_{e,2}(\{\mathcal{A}^j\}) \odot s(r_{ij})) +``` + Practical evidence demonstrates that `"se_atten_v2"` offers better and more stable performance compared to `"se_atten"`. +Notice: Model compression for the `se_atten_v2` descriptor is exclusively designed for models with the training parameter {ref}`attn_layer ` set to 0. + ### Fitting `"ener"` DPA-1 only supports `"ener"` fitting type, and you can refer [here](train-energy.md) for detailed information.
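Taken together, the documentation changes above describe one configuration pattern. Below is a minimal sketch of a compressible `"se_atten_v2"` descriptor section; the field values are illustrative (`sel`, `rcut`, and `attn_layer` mirror the test settings later in this patch), and this is not a complete training input:

```python
# Minimal sketch of a compressible "se_atten_v2" descriptor section.
# stripped_type_embedding and smooth_type_embedding default to true for this
# descriptor, so they are omitted; per the notice above, attn_layer must be 0
# for model compression to be available.
descriptor = {
    "type": "se_atten_v2",
    "rcut": 6.0,              # cutoff radius, as in the tests in this patch
    "rcut_smth": 0.5,         # where smoothing starts; illustrative value
    "sel": 120,               # max neighbors, as in the compression tests
    "neuron": [25, 50, 100],  # embedding network sizes; illustrative
    "attn_layer": 0,          # required for model compression
    "set_davg_zero": False,
}
```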
diff --git a/doc/requirements.txt b/doc/requirements.txt index 1d39662bb4..b011900147 100644 --- a/doc/requirements.txt +++ b/doc/requirements.txt @@ -1 +1,4 @@ -.[docs,cpu] +.[docs,cpu,torch] +exhale @ https://github.com/svenevs/exhale/archive/2759a394268307b88f5440487ae0920ee4ebf81e.zip +# https://github.com/mcmtroffaes/sphinxcontrib-bibtex/issues/309 +docutils!=0.18.*,!=0.19.* diff --git a/pyproject.toml b/pyproject.toml index 1b4d459a7d..7a5f892b6f 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -44,6 +44,7 @@ dependencies = [ 'typing_extensions; python_version < "3.8"', 'importlib_metadata>=1.4; python_version < "3.8"', 'h5py', + "h5py>=3.6.0,<3.11.0; platform_system=='Linux' and platform_machine=='aarch64'", 'wcmatch', 'packaging', ] @@ -66,7 +67,11 @@ repository = "https://github.com/deepmodeling/deepmd-kit" [tool.deepmd_build_backend.optional-dependencies] test = [ "dpdata>=0.2.7", - "ase", + # ASE issue: https://gitlab.com/ase/ase/-/merge_requests/2843 + # fixed in 3.23.0 + # ase>=3.23.0 requires python>=3.8; luckily, we don't test i-PI with python<3.8 + 'ase>=3.23.0;python_version>="3.8"', + 'ase;python_version<"3.8"', "pytest", "pytest-cov", "pytest-sugar", @@ -92,7 +97,7 @@ lmp = [ "lammps~=2023.8.2.3.0", ] ipi = [ - "i-PI", + "ipi", ] gui = [ "dpgui", @@ -222,6 +227,12 @@ before-all = [ """rpm --import https://repo.almalinux.org/almalinux/RPM-GPG-KEY-AlmaLinux""", """{ if [ "$(uname -m)" = "x86_64" ] ; then yum config-manager --add-repo http://developer.download.nvidia.com/compute/cuda/repos/rhel8/x86_64/cuda-rhel8.repo && yum install -y cuda-nvcc-${CUDA_VERSION/./-} cuda-cudart-devel-${CUDA_VERSION/./-}; fi }""", "yum install -y mpich-devel", + # uv is not available in the old manylinux image + """{ if [ "$(uname -m)" = "x86_64" ] ; then pipx install uv; fi }""", +] +before-build = [ + # old build doesn't support uv + """{ if [ "$(uname -m)" = "x86_64" ] ; then uv pip install --system -U build; fi }""", ] [tool.cibuildwheel.windows] @@ -287,6 +298,7 @@ force_grid_wrap = 1 [tool.ruff.lint] select = [ "E", # errors + "W", # warning "F", # pyflakes "D", # pydocstyle "UP", # pyupgrade diff --git a/source/CMakeLists.txt b/source/CMakeLists.txt index f7bef0b2d9..cbc73735fe 100644 --- a/source/CMakeLists.txt +++ b/source/CMakeLists.txt @@ -145,6 +145,8 @@ endif(USE_TF_PYTHON_LIBS) # find tensorflow, I need tf abi info if(NOT DEEPMD_C_ROOT) find_package(tensorflow REQUIRED) + list(APPEND BACKEND_LIBRARY_PATH ${TensorFlow_LIBRARY_PATH}) + list(APPEND BACKEND_INCLUDE_DIRS ${TENSORFLOW_INCLUDE_DIRS}) endif() # find threads @@ -233,7 +235,9 @@ if(DEEPMD_C_ROOT) # use variable for TF path to set deepmd_c path set(TENSORFLOW_ROOT "${DEEPMD_C_ROOT}") set(TensorFlow_LIBRARY_PATH "${DEEPMD_C_ROOT}/lib") + set(BACKEND_LIBRARY_PATH "${DEEPMD_C_ROOT}/lib") set(TENSORFLOW_INCLUDE_DIRS "${DEEPMD_C_ROOT}/include") + set(BACKEND_INCLUDE_DIRS "${DEEPMD_C_ROOT}/include") endif() if(NOT DEEPMD_C_ROOT) diff --git a/source/api_c/CMakeLists.txt b/source/api_c/CMakeLists.txt index f6e741105a..f0b36a62d7 100644 --- a/source/api_c/CMakeLists.txt +++ b/source/api_c/CMakeLists.txt @@ -12,8 +12,8 @@ target_include_directories( ${libname} PUBLIC $ $) -set_target_properties( - ${libname} PROPERTIES INSTALL_RPATH "$ORIGIN;${TensorFlow_LIBRARY_PATH}") +set_target_properties(${libname} PROPERTIES INSTALL_RPATH + "$ORIGIN;${BACKEND_LIBRARY_PATH}") if(CMAKE_TESTING_ENABLED) target_link_libraries(${libname} PRIVATE coverage_config) endif() diff --git a/source/api_c/include/deepmd.hpp 
b/source/api_c/include/deepmd.hpp index f348a3dbe9..059612f7af 100644 --- a/source/api_c/include/deepmd.hpp +++ b/source/api_c/include/deepmd.hpp @@ -25,9 +25,9 @@ namespace hpp { **/ struct deepmd_exception : public std::runtime_error { public: - deepmd_exception() : runtime_error("DeePMD-kit C API Error!"){}; + deepmd_exception() : runtime_error("DeePMD-kit C API Error!") {}; deepmd_exception(const std::string &msg) - : runtime_error(std::string("DeePMD-kit C API Error: ") + msg){}; + : runtime_error(std::string("DeePMD-kit C API Error: ") + msg) {}; }; } // namespace hpp } // namespace deepmd @@ -620,7 +620,7 @@ class DeepPot { /** * @brief DP constructor without initialization. **/ - DeepPot() : dp(nullptr){}; + DeepPot() : dp(nullptr) {}; ~DeepPot() { DP_DeleteDeepPot(dp); }; /** * @brief DP constructor with initialization. @@ -1160,7 +1160,7 @@ class DeepPotModelDevi { /** * @brief DP model deviation constructor without initialization. **/ - DeepPotModelDevi() : dp(nullptr){}; + DeepPotModelDevi() : dp(nullptr) {}; ~DeepPotModelDevi() { DP_DeleteDeepPotModelDevi(dp); }; /** * @brief DP model deviation constructor with initialization. @@ -1785,7 +1785,7 @@ class DeepTensor { /** * @brief Deep Tensor constructor without initialization. **/ - DeepTensor() : dt(nullptr){}; + DeepTensor() : dt(nullptr) {}; ~DeepTensor() { DP_DeleteDeepTensor(dt); }; /** * @brief DeepTensor constructor with initialization. @@ -2161,7 +2161,7 @@ class DipoleChargeModifier { /** * @brief DipoleChargeModifier constructor without initialization. **/ - DipoleChargeModifier() : dcm(nullptr){}; + DipoleChargeModifier() : dcm(nullptr) {}; ~DipoleChargeModifier() { DP_DeleteDipoleChargeModifier(dcm); }; /** * @brief DipoleChargeModifier constructor with initialization. diff --git a/source/api_c/tests/CMakeLists.txt b/source/api_c/tests/CMakeLists.txt index d4233a83e8..1b035b1a6c 100644 --- a/source/api_c/tests/CMakeLists.txt +++ b/source/api_c/tests/CMakeLists.txt @@ -4,7 +4,7 @@ project(deepmd_api_c_test) file(GLOB TEST_SRC test_*.cc) set_target_properties( - ${LIB_DEEPMD_C} PROPERTIES INSTALL_RPATH "$ORIGIN;${TensorFlow_LIBRARY_PATH}") + ${LIB_DEEPMD_C} PROPERTIES INSTALL_RPATH "$ORIGIN;${BACKEND_LIBRARY_PATH}") add_executable(runUnitTests_c ${TEST_SRC}) target_link_libraries(runUnitTests_c PRIVATE GTest::gtest_main ${LIB_DEEPMD_C} diff --git a/source/api_c/tests/test_deeppot_a_hpp.cc b/source/api_c/tests/test_deeppot_a_hpp.cc index 814122d538..388b53fdfd 100644 --- a/source/api_c/tests/test_deeppot_a_hpp.cc +++ b/source/api_c/tests/test_deeppot_a_hpp.cc @@ -140,7 +140,7 @@ TYPED_TEST(TestInferDeepPotAHPP, cpu_build_nlist_numfv) { public: MyModel(deepmd::hpp::DeepPot& dp_, const std::vector& atype_) - : mydp(dp_), atype(atype_){}; + : mydp(dp_), atype(atype_) {}; virtual void compute(double& ener, std::vector& force, std::vector& virial, diff --git a/source/api_cc/CMakeLists.txt b/source/api_cc/CMakeLists.txt index 2f296e3dfd..15d3844b36 100644 --- a/source/api_cc/CMakeLists.txt +++ b/source/api_cc/CMakeLists.txt @@ -25,8 +25,10 @@ if(Protobuf_LIBRARY) endif() set_target_properties( - ${libname} PROPERTIES INSTALL_RPATH "$ORIGIN;${TensorFlow_LIBRARY_PATH}" - BUILD_RPATH "$ORIGIN/../op") + ${libname} + PROPERTIES INSTALL_RPATH "$ORIGIN;${BACKEND_LIBRARY_PATH}" + INSTALL_RPATH_USE_LINK_PATH TRUE + BUILD_RPATH "$ORIGIN/../op") target_compile_definitions(${libname} PRIVATE TF_PRIVATE) if(CMAKE_TESTING_ENABLED) target_link_libraries(${libname} PRIVATE coverage_config) diff --git a/source/api_cc/include/DataModifier.h 
b/source/api_cc/include/DataModifier.h index 0f46b5e0f8..9933f034a6 100644 --- a/source/api_cc/include/DataModifier.h +++ b/source/api_cc/include/DataModifier.h @@ -14,7 +14,7 @@ class DipoleChargeModifierBase { /** * @brief Dipole charge modifier without initialization. **/ - DipoleChargeModifierBase(){}; + DipoleChargeModifierBase() {}; /** * @brief Dipole charge modifier without initialization. * @param[in] model The name of the frozen model file. @@ -24,7 +24,7 @@ class DipoleChargeModifierBase { DipoleChargeModifierBase(const std::string& model, const int& gpu_rank = 0, const std::string& name_scope = ""); - virtual ~DipoleChargeModifierBase(){}; + virtual ~DipoleChargeModifierBase() {}; /** * @brief Initialize the dipole charge modifier. * @param[in] model The name of the frozen model file. diff --git a/source/api_cc/include/DeepPot.h b/source/api_cc/include/DeepPot.h index fa35d4b13a..3da5c34184 100644 --- a/source/api_cc/include/DeepPot.h +++ b/source/api_cc/include/DeepPot.h @@ -15,8 +15,8 @@ class DeepPotBase { /** * @brief DP constructor without initialization. **/ - DeepPotBase(){}; - virtual ~DeepPotBase(){}; + DeepPotBase() {}; + virtual ~DeepPotBase() {}; /** * @brief DP constructor with initialization. * @param[in] model The name of the frozen model file. diff --git a/source/api_cc/include/DeepTensor.h b/source/api_cc/include/DeepTensor.h index 5592942d87..f355413d80 100644 --- a/source/api_cc/include/DeepTensor.h +++ b/source/api_cc/include/DeepTensor.h @@ -15,8 +15,8 @@ class DeepTensorBase { /** * @brief Deep Tensor constructor without initialization. **/ - DeepTensorBase(){}; - virtual ~DeepTensorBase(){}; + DeepTensorBase() {}; + virtual ~DeepTensorBase() {}; /** * @brief Deep Tensor constructor with initialization.. * @param[in] model The name of the frozen model file. 
diff --git a/source/api_cc/include/common.h b/source/api_cc/include/common.h index 7982c4f89d..ede34b68c9 100644 --- a/source/api_cc/include/common.h +++ b/source/api_cc/include/common.h @@ -170,9 +170,9 @@ void load_op_library(); **/ struct tf_exception : public deepmd::deepmd_exception { public: - tf_exception() : deepmd::deepmd_exception("TensorFlow Error!"){}; + tf_exception() : deepmd::deepmd_exception("TensorFlow Error!") {}; tf_exception(const std::string& msg) - : deepmd::deepmd_exception(std::string("TensorFlow Error: ") + msg){}; + : deepmd::deepmd_exception(std::string("TensorFlow Error: ") + msg) {}; }; /** diff --git a/source/api_cc/src/DataModifier.cc b/source/api_cc/src/DataModifier.cc index d44d552bb2..e9aee65de2 100644 --- a/source/api_cc/src/DataModifier.cc +++ b/source/api_cc/src/DataModifier.cc @@ -15,7 +15,7 @@ DipoleChargeModifier::DipoleChargeModifier(const std::string& model, init(model, gpu_rank, name_scope_); } -DipoleChargeModifier::~DipoleChargeModifier(){}; +DipoleChargeModifier::~DipoleChargeModifier() {}; void DipoleChargeModifier::init(const std::string& model, const int& gpu_rank, diff --git a/source/api_cc/tests/test_deeppot_a.cc b/source/api_cc/tests/test_deeppot_a.cc index 067b2ff524..ae1384e8a3 100644 --- a/source/api_cc/tests/test_deeppot_a.cc +++ b/source/api_cc/tests/test_deeppot_a.cc @@ -143,7 +143,7 @@ TYPED_TEST(TestInferDeepPotA, cpu_build_nlist_numfv) { public: MyModel(deepmd::DeepPot& dp_, const std::vector& atype_) - : mydp(dp_), atype(atype_){}; + : mydp(dp_), atype(atype_) {}; virtual void compute(double& ener, std::vector& force, std::vector& virial, diff --git a/source/api_cc/tests/test_deeppot_r.cc b/source/api_cc/tests/test_deeppot_r.cc index 8eec36522e..86fa4b091f 100644 --- a/source/api_cc/tests/test_deeppot_r.cc +++ b/source/api_cc/tests/test_deeppot_r.cc @@ -143,7 +143,7 @@ TYPED_TEST(TestInferDeepPotR, cpu_build_nlist_numfv) { public: MyModel(deepmd::DeepPot& dp_, const std::vector& atype_) - : mydp(dp_), atype(atype_){}; + : mydp(dp_), atype(atype_) {}; virtual void compute(double& ener, std::vector& force, std::vector& virial, diff --git a/source/gmx/CMakeLists.txt b/source/gmx/CMakeLists.txt index d445479d39..8fde1e6ab8 100644 --- a/source/gmx/CMakeLists.txt +++ b/source/gmx/CMakeLists.txt @@ -26,7 +26,7 @@ target_include_directories(${libgmxname} PRIVATE ${CMAKE_CURRENT_SOURCE_DIR}/../3rdparty/) set_target_properties( - ${libgmxname} PROPERTIES INSTALL_RPATH "$ORIGIN;${TensorFlow_LIBRARY_PATH}") + ${libgmxname} PROPERTIES INSTALL_RPATH "$ORIGIN;${BACKEND_LIBRARY_PATH}") install( FILES dp_gmx_patch diff --git a/source/install/build_tf.py b/source/install/build_tf.py index 15847d2c21..13f773ce2c 100755 --- a/source/install/build_tf.py +++ b/source/install/build_tf.py @@ -192,7 +192,7 @@ def path(self) -> Path: @property def gzip_path(self) -> Path: if self.gzip is None: - raise RuntimeError("gzip is None for %s" % self.path) + raise RuntimeError(f"gzip is None for {self.path}") return PACKAGE_DIR / self.gzip @property @@ -257,10 +257,9 @@ def __call__(self): dd() else: dlog.info( - "Skip installing %s, which has been already installed" - % dd.__class__.__name__ + f"Skip installing {dd.__class__.__name__}, which has already been installed" ) - dlog.info("Start installing %s..." 
% self.__class__.__name__) + dlog.info(f"Start installing {self.__class__.__name__}...") with tempfile.TemporaryDirectory() as tmpdirname: self._prefix = Path(tmpdirname) self.build() @@ -621,7 +620,7 @@ def dependencies(self) -> Dict[str, Build]: def build(self): tf_res = self.resources["tensorflow"] - src = tf_res.gzip_path / ("tensorflow-%s" % self.version) + src = tf_res.gzip_path / (f"tensorflow-{self.version}") with set_directory(src): # configure -- need bazelisk in PATH call( diff --git a/source/install/docker/Dockerfile b/source/install/docker/Dockerfile index 26b7be9f19..237480bfb8 100644 --- a/source/install/docker/Dockerfile +++ b/source/install/docker/Dockerfile @@ -1,12 +1,14 @@ FROM python:3.11 AS compile-image ARG VARIANT="" ARG CUDA_VERSION="12" -RUN python -m venv /opt/deepmd-kit +RUN python -m pip install uv +RUN python -m uv venv /opt/deepmd-kit # Make sure we use the virtualenv ENV PATH="/opt/deepmd-kit/bin:$PATH" +ENV VIRTUAL_ENV="/opt/deepmd-kit" # Install package COPY dist /dist -RUN pip install "$(ls /dist/deepmd_kit${VARIANT}-*manylinux*_x86_64.whl)[gpu,cu${CUDA_VERSION},lmp,ipi]" \ +RUN uv pip install "$(ls /dist/deepmd_kit${VARIANT}-*manylinux*_x86_64.whl)[gpu,cu${CUDA_VERSION},lmp,ipi]" \ && dp -h \ && lmp -h \ && dp_ipi \ diff --git a/source/install/docker_package_c.sh b/source/install/docker_package_c.sh index 544c175a0a..3846daf93b 100755 --- a/source/install/docker_package_c.sh +++ b/source/install/docker_package_c.sh @@ -5,6 +5,7 @@ SCRIPT_PATH=$(dirname $(realpath -s $0)) docker run --rm -v ${SCRIPT_PATH}/../..:/root/deepmd-kit -w /root/deepmd-kit \ tensorflow/build:${TENSORFLOW_BUILD_VERSION:-2.15}-python3.11 \ /bin/sh -c "pip install \"tensorflow${TENSORFLOW_VERSION}\" cmake \ + && git config --global --add safe.directory /root/deepmd-kit \ && cd /root/deepmd-kit/source/install \ && CC=/dt9/usr/bin/gcc \ CXX=/dt9/usr/bin/g++ \ diff --git a/source/install/uv_with_retry.sh b/source/install/uv_with_retry.sh new file mode 100755 index 0000000000..2d9a524f6b --- /dev/null +++ b/source/install/uv_with_retry.sh @@ -0,0 +1,32 @@ +#!/bin/bash +# This script is used to retry the uv command if the error "error decoding response body" is encountered. +# See also: +# https://github.com/astral-sh/uv/issues/2586 +# https://github.com/astral-sh/uv/issues/3456 +# https://github.com/astral-sh/uv/issues/3514 +# https://github.com/astral-sh/uv/issues/4402 +tmpstderr=$(mktemp) +max_retry=3 +while true; do + uv "$@" 2> >(tee -a "${tmpstderr}" >&2) + exit_code=$? + # exit if ok + if [ $exit_code -eq 0 ]; then + rm -f "${tmpstderr}" + exit 0 + fi + # check if "error decoding response body" is in the stderr + if grep -q "error decoding response body" "${tmpstderr}"; then + echo "Retrying uv in 1 s..." + max_retry=$((max_retry - 1)) + if [ $max_retry -eq 0 ]; then + echo "Max retry reached, exiting..." 
+ rm -f "${tmpstderr}" + exit 1 + fi + sleep 1 + else + rm -f "${tmpstderr}" + exit $exit_code + fi +done diff --git a/source/ipi/CMakeLists.txt b/source/ipi/CMakeLists.txt index 158f98aea5..2b23a63c76 100644 --- a/source/ipi/CMakeLists.txt +++ b/source/ipi/CMakeLists.txt @@ -44,13 +44,13 @@ if(APPLE) ${ipiname} PROPERTIES LINK_FLAGS "${extra_link_flags}" INSTALL_RPATH - "@loader_path/../${LIB_DIR}:${TensorFlow_LIBRARY_PATH}") + "@loader_path/../${LIB_DIR};${BACKEND_LIBRARY_PATH}") else() set_target_properties( ${ipiname} PROPERTIES LINK_FLAGS "-Wl,-rpath,'$ORIGIN'/../${LIB_DIR} ${extra_link_flags}" - INSTALL_RPATH "$ORIGIN/../${LIB_DIR}:${TensorFlow_LIBRARY_PATH}") + INSTALL_RPATH "$ORIGIN/../${LIB_DIR};${BACKEND_LIBRARY_PATH}") endif() if(CMAKE_TESTING_ENABLED) diff --git a/source/lib/include/errors.h b/source/lib/include/errors.h index 6687d2afa2..d0de379537 100644 --- a/source/lib/include/errors.h +++ b/source/lib/include/errors.h @@ -10,15 +10,15 @@ namespace deepmd { **/ struct deepmd_exception : public std::runtime_error { public: - deepmd_exception() : runtime_error("DeePMD-kit Error!"){}; + deepmd_exception() : runtime_error("DeePMD-kit Error!") {}; deepmd_exception(const std::string& msg) - : runtime_error(std::string("DeePMD-kit Error: ") + msg){}; + : runtime_error(std::string("DeePMD-kit Error: ") + msg) {}; }; struct deepmd_exception_oom : public deepmd_exception { public: - deepmd_exception_oom() : deepmd_exception("DeePMD-kit OOM!"){}; + deepmd_exception_oom() : deepmd_exception("DeePMD-kit OOM!") {}; deepmd_exception_oom(const std::string& msg) - : deepmd_exception(std::string("DeePMD-kit OOM: ") + msg){}; + : deepmd_exception(std::string("DeePMD-kit OOM: ") + msg) {}; }; }; // namespace deepmd diff --git a/source/lib/include/neighbor_list.h b/source/lib/include/neighbor_list.h index eb510eb25b..39c2064b56 100644 --- a/source/lib/include/neighbor_list.h +++ b/source/lib/include/neighbor_list.h @@ -26,13 +26,13 @@ struct InputNlist { int* numneigh; /// Array stores the core region atom's neighbor index int** firstneigh; - InputNlist() : inum(0), ilist(NULL), numneigh(NULL), firstneigh(NULL){}; + InputNlist() : inum(0), ilist(NULL), numneigh(NULL), firstneigh(NULL) {}; InputNlist(int inum_, int* ilist_, int* numneigh_, int** firstneigh_) : inum(inum_), ilist(ilist_), numneigh(numneigh_), - firstneigh(firstneigh_){}; - ~InputNlist(){}; + firstneigh(firstneigh_) {}; + ~InputNlist() {}; }; /** diff --git a/source/lmp/env.sh.in b/source/lmp/env.sh.in index 8c3a7aedc1..55b90be886 100644 --- a/source/lmp/env.sh.in +++ b/source/lmp/env.sh.in @@ -1,6 +1,6 @@ DEEPMD_ROOT=@CMAKE_INSTALL_PREFIX@ -TENSORFLOW_INCLUDE_DIRS="@TensorFlow_INCLUDE_DIRS@" -TENSORFLOW_LIBRARY_PATH="@TensorFlow_LIBRARY_PATH@" +TENSORFLOW_INCLUDE_DIRS="@BACKEND_INCLUDE_DIRS@" +TENSORFLOW_LIBRARY_PATH="@BACKEND_LIBRARY_PATH@" TF_INCLUDE_DIRS=`echo $TENSORFLOW_INCLUDE_DIRS | sed "s/;/ -I/g"` TF_LIBRARY_PATH=`echo $TENSORFLOW_LIBRARY_PATH | sed "s/;/ -L/g"` diff --git a/source/lmp/env_c.sh.in b/source/lmp/env_c.sh.in index 67f6a63a1c..af010497ba 100644 --- a/source/lmp/env_c.sh.in +++ b/source/lmp/env_c.sh.in @@ -1,6 +1,6 @@ DEEPMD_ROOT=@CMAKE_INSTALL_PREFIX@ -TENSORFLOW_INCLUDE_DIRS="@TensorFlow_INCLUDE_DIRS@" -TENSORFLOW_LIBRARY_PATH="@TensorFlow_LIBRARY_PATH@" +TENSORFLOW_INCLUDE_DIRS="@BACKEND_INCLUDE_DIRS@" +TENSORFLOW_LIBRARY_PATH="@BACKEND_LIBRARY_PATH@" TF_INCLUDE_DIRS=`echo $TENSORFLOW_INCLUDE_DIRS | sed "s/;/ -I/g"` TF_LIBRARY_PATH=`echo $TENSORFLOW_LIBRARY_PATH | sed "s/;/ -L/g"` diff --git 
a/source/lmp/env_py.sh.in b/source/lmp/env_py.sh.in index e6fc217c26..be48191f33 100644 --- a/source/lmp/env_py.sh.in +++ b/source/lmp/env_py.sh.in @@ -1,6 +1,6 @@ DEEPMD_ROOT=@CMAKE_INSTALL_PREFIX@ -TENSORFLOW_INCLUDE_DIRS="@TensorFlow_INCLUDE_DIRS@" -TENSORFLOW_LIBRARY_PATH="@TensorFlow_LIBRARY_PATH@" +TENSORFLOW_INCLUDE_DIRS="@BACKEND_INCLUDE_DIRS@" +TENSORFLOW_LIBRARY_PATH="@BACKEND_LIBRARY_PATH@" PYTHON_LIBRARY_PATH="@Python_LIBRARY_DIRS@" TF_INCLUDE_DIRS=`echo $TENSORFLOW_INCLUDE_DIRS | sed "s/;/ -I/g"` diff --git a/source/lmp/env_py_c.sh.in b/source/lmp/env_py_c.sh.in index b8affd7ff5..34874cc24c 100644 --- a/source/lmp/env_py_c.sh.in +++ b/source/lmp/env_py_c.sh.in @@ -1,6 +1,6 @@ DEEPMD_ROOT=@CMAKE_INSTALL_PREFIX@ -TENSORFLOW_INCLUDE_DIRS="@TensorFlow_INCLUDE_DIRS@" -TENSORFLOW_LIBRARY_PATH="@TensorFlow_LIBRARY_PATH@" +TENSORFLOW_INCLUDE_DIRS="@BACKEND_INCLUDE_DIRS@" +TENSORFLOW_LIBRARY_PATH="@BACKEND_LIBRARY_PATH@" PYTHON_LIBRARY_PATH="@Python_LIBRARY_DIRS@" TF_INCLUDE_DIRS=`echo $TENSORFLOW_INCLUDE_DIRS | sed "s/;/ -I/g"` diff --git a/source/lmp/pair_deepmd.cpp b/source/lmp/pair_deepmd.cpp index 90aa453143..1a64fdb869 100644 --- a/source/lmp/pair_deepmd.cpp +++ b/source/lmp/pair_deepmd.cpp @@ -218,7 +218,9 @@ void PairDeepMD::make_fparam_from_compute(vector &fparam) { int icompute = modify->find_compute(compute_fparam_id); Compute *compute = modify->compute[icompute]; - assert(compute); + if (!compute) { + error->all(FLERR, "compute id is not found: " + compute_fparam_id); + } fparam.resize(dim_fparam); if (dim_fparam == 1) { @@ -245,7 +247,9 @@ void PairDeepMD::make_aparam_from_compute(vector &aparam) { int icompute = modify->find_compute(compute_aparam_id); Compute *compute = modify->compute[icompute]; - assert(compute); + if (!compute) { + error->all(FLERR, "compute id is not found: " + compute_aparam_id); + } int nlocal = atom->nlocal; aparam.resize(static_cast(dim_aparam) * nlocal); @@ -276,7 +280,9 @@ void PairDeepMD::make_ttm_fparam(vector &fparam) { ttm_fix = dynamic_cast(modify->fix[ii]); } } - assert(ttm_fix); + if (!ttm_fix) { + error->all(FLERR, "fix ttm id is not found: " + ttm_fix_id); + } fparam.resize(dim_fparam); @@ -315,7 +321,9 @@ void PairDeepMD::make_ttm_aparam(vector &daparam) { ttm_fix = dynamic_cast(modify->fix[ii]); } } - assert(ttm_fix); + if (!ttm_fix) { + error->all(FLERR, "fix ttm id is not found: " + ttm_fix_id); + } // modify double **x = atom->x; int *mask = atom->mask; diff --git a/source/lmp/plugin/CMakeLists.txt b/source/lmp/plugin/CMakeLists.txt index 4fdae7ac5b..f912059261 100644 --- a/source/lmp/plugin/CMakeLists.txt +++ b/source/lmp/plugin/CMakeLists.txt @@ -99,7 +99,7 @@ if(DEFINED LAMMPS_SOURCE_ROOT OR DEFINED LAMMPS_VERSION) "-Wl,-undefined,dynamic_lookup") else() set_target_properties( - ${libname} PROPERTIES INSTALL_RPATH "$ORIGIN;${TensorFlow_LIBRARY_PATH}" + ${libname} PROPERTIES INSTALL_RPATH "$ORIGIN;${BACKEND_LIBRARY_PATH}" LINK_FLAGS "-rdynamic") endif() target_compile_definitions( diff --git a/source/lmp/pppm_dplr.h b/source/lmp/pppm_dplr.h index e87fc6a241..1484a16e72 100644 --- a/source/lmp/pppm_dplr.h +++ b/source/lmp/pppm_dplr.h @@ -25,7 +25,7 @@ class PPPMDPLR : public PPPM { #else PPPMDPLR(class LAMMPS *); #endif - ~PPPMDPLR() override{}; + ~PPPMDPLR() override {}; void init() override; const std::vector &get_fele() const { return fele; }; diff --git a/source/md/include/Integrator.h b/source/md/include/Integrator.h index 73e84e7097..945109fb20 100644 --- a/source/md/include/Integrator.h +++ b/source/md/include/Integrator.h 
@@ -9,7 +9,7 @@ template class Integrator { public: - Integrator() : massConst(UnitManager::IntegratorMassConstant){}; + Integrator() : massConst(UnitManager::IntegratorMassConstant) {}; public: void stepVeloc(std::vector& vv, diff --git a/source/md/include/Tabulated.h b/source/md/include/Tabulated.h index 5ab6e02bc3..4c618db213 100644 --- a/source/md/include/Tabulated.h +++ b/source/md/include/Tabulated.h @@ -13,7 +13,7 @@ typedef float VALUETYPE; class Tabulated { public: - Tabulated(){}; + Tabulated() {}; Tabulated(const VALUETYPE rc, const VALUETYPE hh, const std::vector& tab); diff --git a/source/md/include/Trajectory.h b/source/md/include/Trajectory.h index 862b393ea4..52964f3b37 100644 --- a/source/md/include/Trajectory.h +++ b/source/md/include/Trajectory.h @@ -11,7 +11,7 @@ class XtcSaver { public: - XtcSaver() : inited(false), prec(1000){}; + XtcSaver() : inited(false), prec(1000) {}; ~XtcSaver(); XtcSaver(const char *filename, const int &natoms); bool reinit(const char *filename, const int &natoms); @@ -33,7 +33,7 @@ class XtcSaver { class TrrSaver { public: - TrrSaver() : inited(false), lambda(0){}; + TrrSaver() : inited(false), lambda(0) {}; ~TrrSaver(); TrrSaver(const char *filename, const int &natoms); bool reinit(const char *filename, const int &natoms); diff --git a/source/md/include/UnitManager.h b/source/md/include/UnitManager.h index 70393c406e..9bd1e75b9a 100644 --- a/source/md/include/UnitManager.h +++ b/source/md/include/UnitManager.h @@ -5,7 +5,7 @@ class UnitManager { protected: - UnitManager(){}; + UnitManager() {}; public: static double Degree2Radian; diff --git a/source/nodejs/yarn.lock b/source/nodejs/yarn.lock index fb0c093f11..be1be837d6 100644 --- a/source/nodejs/yarn.lock +++ b/source/nodejs/yarn.lock @@ -619,9 +619,9 @@ strip-ansi@^6.0.1: ansi-regex "^5.0.1" tar@^6.1.11, tar@^6.1.2: - version "6.1.14" - resolved "https://registry.yarnpkg.com/tar/-/tar-6.1.14.tgz#e87926bec1cfe7c9e783a77a79f3e81c1cfa3b66" - integrity sha512-piERznXu0U7/pW7cdSn7hjqySIVTYT6F76icmFk7ptU7dDYlXTm5r9A6K04R2vU3olYgoKeo1Cg3eeu5nhftAw== + version "6.2.1" + resolved "https://registry.yarnpkg.com/tar/-/tar-6.2.1.tgz#717549c541bc3c2af15751bea94b1dd068d4b03a" + integrity sha512-DZ4yORTwrbTj/7MZYq2w+/ZFdI6OZ/f9SFHR+71gIVUZhOQPHzVCLpvRnPgyaMpfWxxk/4ONva3GQSyNIKRv6A== dependencies: chownr "^2.0.0" fs-minipass "^2.0.0" diff --git a/source/op/CMakeLists.txt b/source/op/CMakeLists.txt index 7a92e259e0..6fc6422c6e 100644 --- a/source/op/CMakeLists.txt +++ b/source/op/CMakeLists.txt @@ -62,11 +62,10 @@ endif() if(APPLE) set_target_properties( ${LIB_DEEPMD_OP} PROPERTIES INSTALL_RPATH - "@loader_path;${TensorFlow_LIBRARY_PATH}") + "@loader_path;${BACKEND_LIBRARY_PATH}") else() set_target_properties( - ${LIB_DEEPMD_OP} PROPERTIES INSTALL_RPATH - "$ORIGIN;${TensorFlow_LIBRARY_PATH}") + ${LIB_DEEPMD_OP} PROPERTIES INSTALL_RPATH "$ORIGIN;${BACKEND_LIBRARY_PATH}") endif() if(CMAKE_TESTING_ENABLED) target_link_libraries(${LIB_DEEPMD_OP} PRIVATE coverage_config) diff --git a/source/op/add_flt_nvnmd.cc b/source/op/add_flt_nvnmd.cc index 079e05d785..db3554665a 100644 --- a/source/op/add_flt_nvnmd.cc +++ b/source/op/add_flt_nvnmd.cc @@ -52,7 +52,7 @@ template class AddFltNvnmdOp : public OpKernel { public: /// Constructor. 
- explicit AddFltNvnmdOp(OpKernelConstruction* context) : OpKernel(context){}; + explicit AddFltNvnmdOp(OpKernelConstruction* context) : OpKernel(context) {}; /// Compute the descriptor /// param: context diff --git a/source/op/copy_flt_nvnmd.cc b/source/op/copy_flt_nvnmd.cc index d9a1984115..3ca9b17c31 100644 --- a/source/op/copy_flt_nvnmd.cc +++ b/source/op/copy_flt_nvnmd.cc @@ -50,7 +50,7 @@ template class CopyFltNvnmdOp : public OpKernel { public: /// Constructor. - explicit CopyFltNvnmdOp(OpKernelConstruction* context) : OpKernel(context){}; + explicit CopyFltNvnmdOp(OpKernelConstruction* context) : OpKernel(context) {}; /// Compute the descriptor /// param: context diff --git a/source/op/dotmul_flt_nvnmd.cc b/source/op/dotmul_flt_nvnmd.cc index d7c2c8d3c3..1aca3e8bf8 100644 --- a/source/op/dotmul_flt_nvnmd.cc +++ b/source/op/dotmul_flt_nvnmd.cc @@ -61,7 +61,7 @@ class DotmulFltNvnmdOp : public OpKernel { public: /// Constructor. explicit DotmulFltNvnmdOp(OpKernelConstruction *context) - : OpKernel(context){}; + : OpKernel(context) {}; /// Compute the descriptor /// param: context diff --git a/source/op/flt_nvnmd.cc b/source/op/flt_nvnmd.cc index 634c76b662..4794caeedc 100644 --- a/source/op/flt_nvnmd.cc +++ b/source/op/flt_nvnmd.cc @@ -48,7 +48,7 @@ template class FltNvnmdOp : public OpKernel { public: /// Constructor. - explicit FltNvnmdOp(OpKernelConstruction* context) : OpKernel(context){}; + explicit FltNvnmdOp(OpKernelConstruction* context) : OpKernel(context) {}; /// Compute the descriptor /// param: context diff --git a/source/op/mul_flt_nvnmd.cc b/source/op/mul_flt_nvnmd.cc index d18cf20508..bbbeec073d 100644 --- a/source/op/mul_flt_nvnmd.cc +++ b/source/op/mul_flt_nvnmd.cc @@ -52,7 +52,7 @@ template class MulFltNvnmdOp : public OpKernel { public: /// Constructor. - explicit MulFltNvnmdOp(OpKernelConstruction* context) : OpKernel(context){}; + explicit MulFltNvnmdOp(OpKernelConstruction* context) : OpKernel(context) {}; /// Compute the descriptor /// param: context diff --git a/source/tests/common.py b/source/tests/common.py index 5a7477d7e7..d9b300f640 100644 --- a/source/tests/common.py +++ b/source/tests/common.py @@ -663,8 +663,7 @@ def __init__(self, sys_path, set_prefix, seed=None, shuffle_test=True): ] if any(has_fparam) and (not all(has_fparam)): raise RuntimeError( - "system %s: if any set has frame parameter, then all sets should have frame parameter" - % sys_path + f"system {sys_path}: if any set has frame parameter, then all sets should have frame parameter" ) if all(has_fparam): self.has_fparam = 0 @@ -676,8 +675,7 @@ def __init__(self, sys_path, set_prefix, seed=None, shuffle_test=True): ] if any(has_aparam) and (not all(has_aparam)): raise RuntimeError( - "system %s: if any set has frame parameter, then all sets should have frame parameter" - % sys_path + f"system {sys_path}: if any set has frame parameter, then all sets should have frame parameter" ) if all(has_aparam): self.has_aparam = 0 @@ -767,7 +765,7 @@ def load_data(self, set_name, data_name, shape, is_necessary=True): return data return 1, data elif is_necessary: - raise OSError("%s not found!" 
% path) + raise OSError(f"{path} not found!") else: data = np.zeros(shape) return 0, data @@ -1021,7 +1019,7 @@ def print_summary(self): sys_width = 42 tmp_msg += "---Summary of DataSystem-----------------------------------------\n" tmp_msg += "find %d system(s):\n" % self.nsystems - tmp_msg += "%s " % self.format_name_length("system", sys_width) + tmp_msg += "{} ".format(self.format_name_length("system", sys_width)) tmp_msg += "{} {} {}\n".format("natoms", "bch_sz", "n_bch") for ii in range(self.nsystems): tmp_msg += "%s %6d %6d %5d\n" % ( diff --git a/source/tests/test_model_compression_se_atten.py b/source/tests/test_model_compression_se_atten.py index 0752635a98..9c245d8900 100644 --- a/source/tests/test_model_compression_se_atten.py +++ b/source/tests/test_model_compression_se_atten.py @@ -28,36 +28,36 @@ def _file_delete(file): os.remove(file) -# 4 tests: -# - type embedding FP64, se_atten FP64 -# - type embedding FP64, se_atten FP32 -# - type embedding FP32, se_atten FP64 -# - type embedding FP32, se_atten FP32 tests = [ { "se_atten precision": "float64", "type embedding precision": "float64", - "smooth_type_embdding": True, + "smooth_type_embedding": True, + "precision_digit": 10, }, { "se_atten precision": "float64", "type embedding precision": "float64", - "smooth_type_embdding": False, + "smooth_type_embedding": False, + "precision_digit": 10, }, { "se_atten precision": "float64", "type embedding precision": "float32", - "smooth_type_embdding": True, + "smooth_type_embedding": True, + "precision_digit": 2, }, { "se_atten precision": "float32", "type embedding precision": "float64", - "smooth_type_embdding": True, + "smooth_type_embedding": True, + "precision_digit": 2, }, { "se_atten precision": "float32", "type embedding precision": "float32", - "smooth_type_embdding": True, + "smooth_type_embedding": True, + "precision_digit": 2, }, ] @@ -82,8 +82,8 @@ def _init_models(): jdata["model"]["descriptor"]["stripped_type_embedding"] = True jdata["model"]["descriptor"]["sel"] = 120 jdata["model"]["descriptor"]["attn_layer"] = 0 - jdata["model"]["descriptor"]["smooth_type_embdding"] = tests[i][ - "smooth_type_embdding" + jdata["model"]["descriptor"]["smooth_type_embedding"] = tests[i][ + "smooth_type_embedding" ] jdata["model"]["type_embedding"] = {} jdata["model"]["type_embedding"]["precision"] = tests[i][ @@ -158,10 +158,6 @@ def _init_models_exclude_types(): INPUTS_ET, FROZEN_MODELS_ET, COMPRESSED_MODELS_ET = _init_models_exclude_types() -def _get_default_places(nth_test): - return 10 if nth_test == 0 else 3 - - @unittest.skipIf( parse_version(tf.__version__) < parse_version("2"), f"The current tf version {tf.__version__} is too low to run the new testing model.", @@ -200,7 +196,7 @@ def test_attrs(self): for i in range(len(tests)): dp_original = self.dp_originals[i] dp_compressed = self.dp_compresseds[i] - default_places = _get_default_places(i) + default_places = tests[i]["precision_digit"] self.assertEqual(dp_original.get_ntypes(), 2) self.assertAlmostEqual(dp_original.get_rcut(), 6.0, places=default_places) @@ -218,7 +214,7 @@ def test_1frame(self): for i in range(len(tests)): dp_original = self.dp_originals[i] dp_compressed = self.dp_compresseds[i] - default_places = _get_default_places(i) + default_places = tests[i]["precision_digit"] ee0, ff0, vv0 = dp_original.eval( self.coords, self.box, self.atype, atomic=False @@ -244,7 +240,7 @@ def test_1frame_atm(self): for i in range(len(tests)): dp_original = self.dp_originals[i] dp_compressed = self.dp_compresseds[i] - 
default_places = _get_default_places(i) + default_places = tests[i]["precision_digit"] ee0, ff0, vv0, ae0, av0 = dp_original.eval( self.coords, self.box, self.atype, atomic=True @@ -276,7 +272,7 @@ def test_2frame_atm(self): for i in range(len(tests)): dp_original = self.dp_originals[i] dp_compressed = self.dp_compresseds[i] - default_places = _get_default_places(i) + default_places = tests[i]["precision_digit"] coords2 = np.concatenate((self.coords, self.coords)) box2 = np.concatenate((self.box, self.box)) @@ -346,7 +342,7 @@ def test_1frame(self): for i in range(len(tests)): dp_original = self.dp_originals[i] dp_compressed = self.dp_compresseds[i] - default_places = _get_default_places(i) + default_places = tests[i]["precision_digit"] ee0, ff0, vv0 = dp_original.eval( self.coords, self.box, self.atype, atomic=False @@ -372,7 +368,7 @@ def test_1frame_atm(self): for i in range(len(tests)): dp_original = self.dp_originals[i] dp_compressed = self.dp_compresseds[i] - default_places = _get_default_places(i) + default_places = tests[i]["precision_digit"] ee0, ff0, vv0, ae0, av0 = dp_original.eval( self.coords, self.box, self.atype, atomic=True @@ -404,7 +400,7 @@ def test_2frame_atm(self): for i in range(len(tests)): dp_original = self.dp_originals[i] dp_compressed = self.dp_compresseds[i] - default_places = _get_default_places(i) + default_places = tests[i]["precision_digit"] coords2 = np.concatenate((self.coords, self.coords)) ee0, ff0, vv0, ae0, av0 = dp_original.eval( @@ -473,7 +469,7 @@ def test_1frame(self): for i in range(len(tests)): dp_original = self.dp_originals[i] dp_compressed = self.dp_compresseds[i] - default_places = _get_default_places(i) + default_places = tests[i]["precision_digit"] ee0, ff0, vv0 = dp_original.eval( self.coords, self.box, self.atype, atomic=False @@ -505,7 +501,7 @@ def test_1frame_atm(self): for i in range(len(tests)): dp_original = self.dp_originals[i] dp_compressed = self.dp_compresseds[i] - default_places = _get_default_places(i) + default_places = tests[i]["precision_digit"] ee0, ff0, vv0, ae0, av0 = dp_original.eval( self.coords, self.box, self.atype, atomic=True @@ -535,7 +531,7 @@ def test_1frame_atm(self): def test_ase(self): for i in range(len(tests)): - default_places = _get_default_places(i) + default_places = tests[i]["precision_digit"] from ase import ( Atoms, ) @@ -628,7 +624,7 @@ def test_attrs(self): for i in range(len(tests)): dp_original = self.dp_originals[i] dp_compressed = self.dp_compresseds[i] - default_places = _get_default_places(i) + default_places = tests[i]["precision_digit"] self.assertEqual(dp_original.get_ntypes(), 2) self.assertAlmostEqual(dp_original.get_rcut(), 6.0, places=default_places) @@ -646,7 +642,7 @@ def test_1frame(self): for i in range(len(tests)): dp_original = self.dp_originals[i] dp_compressed = self.dp_compresseds[i] - default_places = _get_default_places(i) + default_places = tests[i]["precision_digit"] ee0, ff0, vv0 = dp_original.eval( self.coords, self.box, self.atype, atomic=False @@ -672,7 +668,7 @@ def test_1frame_atm(self): for i in range(len(tests)): dp_original = self.dp_originals[i] dp_compressed = self.dp_compresseds[i] - default_places = _get_default_places(i) + default_places = tests[i]["precision_digit"] ee0, ff0, vv0, ae0, av0 = dp_original.eval( self.coords, self.box, self.atype, atomic=True @@ -704,7 +700,7 @@ def test_2frame_atm(self): for i in range(len(tests)): dp_original = self.dp_originals[i] dp_compressed = self.dp_compresseds[i] - default_places = _get_default_places(i) + 
default_places = tests[i]["precision_digit"] coords2 = np.concatenate((self.coords, self.coords)) box2 = np.concatenate((self.box, self.box)) diff --git a/source/tests/test_model_se_atten.py b/source/tests/test_model_se_atten.py index 5417201a9f..cb9ff6f5ad 100644 --- a/source/tests/test_model_se_atten.py +++ b/source/tests/test_model_se_atten.py @@ -751,7 +751,7 @@ def test_smoothness_of_stripped_type_embedding_smooth_model(self): jdata["model"]["descriptor"].pop("type", None) jdata["model"]["descriptor"]["ntypes"] = 2 jdata["model"]["descriptor"]["stripped_type_embedding"] = True - jdata["model"]["descriptor"]["smooth_type_embdding"] = True + jdata["model"]["descriptor"]["smooth_type_embedding"] = True jdata["model"]["descriptor"]["attn_layer"] = 1 jdata["model"]["descriptor"]["rcut"] = 6.0 jdata["model"]["descriptor"]["rcut_smth"] = 4.0 @@ -874,3 +874,131 @@ def test_smoothness_of_stripped_type_embedding_smooth_model(self): np.testing.assert_allclose(de[0], de[1], rtol=0, atol=deltae) np.testing.assert_allclose(df[0], df[1], rtol=0, atol=deltad) np.testing.assert_allclose(dv[0], dv[1], rtol=0, atol=deltad) + + def test_smoothness_of_stripped_type_embedding_smooth_model_excluded_types(self): + """test: auto-diff, continuity of e,f,v.""" + jfile = "water_se_atten.json" + jdata = j_loader(jfile) + + systems = j_must_have(jdata, "systems") + set_pfx = j_must_have(jdata, "set_prefix") + batch_size = 1 + test_size = 1 + rcut = j_must_have(jdata["model"]["descriptor"], "rcut") + + data = DataSystem(systems, set_pfx, batch_size, test_size, rcut, run_opt=None) + + test_data = data.get_test() + numb_test = 1 + + jdata["model"]["descriptor"].pop("type", None) + jdata["model"]["descriptor"]["ntypes"] = 2 + jdata["model"]["descriptor"]["stripped_type_embedding"] = True + jdata["model"]["descriptor"]["smooth_type_embedding"] = True + jdata["model"]["descriptor"]["attn_layer"] = 1 + jdata["model"]["descriptor"]["rcut"] = 6.0 + jdata["model"]["descriptor"]["rcut_smth"] = 4.0 + jdata["model"]["descriptor"]["exclude_types"] = [[0, 0], [0, 1]] + jdata["model"]["descriptor"]["set_davg_zero"] = False + descrpt = DescrptSeAtten(**jdata["model"]["descriptor"], uniform_seed=True) + jdata["model"]["fitting_net"]["descrpt"] = descrpt + fitting = EnerFitting(**jdata["model"]["fitting_net"], uniform_seed=True) + typeebd_param = jdata["model"]["type_embedding"] + typeebd = TypeEmbedNet( + ntypes=descrpt.get_ntypes(), + neuron=typeebd_param["neuron"], + activation_function=None, + resnet_dt=typeebd_param["resnet_dt"], + seed=typeebd_param["seed"], + uniform_seed=True, + padding=True, + ) + model = EnerModel(descrpt, fitting, typeebd) + + input_data = { + "coord": [test_data["coord"]], + "box": [test_data["box"]], + "type": [test_data["type"]], + "natoms_vec": [test_data["natoms_vec"]], + "default_mesh": [test_data["default_mesh"]], + } + model._compute_input_stat(input_data) + model.descrpt.bias_atom_e = data.compute_energy_shift() + # make the original implementation failed + model.descrpt.davg[:] += 1e-1 + + t_prop_c = tf.placeholder(tf.float32, [5], name="t_prop_c") + t_energy = tf.placeholder(GLOBAL_ENER_FLOAT_PRECISION, [None], name="t_energy") + t_force = tf.placeholder(GLOBAL_TF_FLOAT_PRECISION, [None], name="t_force") + t_virial = tf.placeholder(GLOBAL_TF_FLOAT_PRECISION, [None], name="t_virial") + t_atom_ener = tf.placeholder( + GLOBAL_TF_FLOAT_PRECISION, [None], name="t_atom_ener" + ) + t_coord = tf.placeholder(GLOBAL_TF_FLOAT_PRECISION, [None], name="i_coord") + t_type = tf.placeholder(tf.int32, [None], 
name="i_type") + t_natoms = tf.placeholder(tf.int32, [model.ntypes + 2], name="i_natoms") + t_box = tf.placeholder(GLOBAL_TF_FLOAT_PRECISION, [None, 9], name="i_box") + t_mesh = tf.placeholder(tf.int32, [None], name="i_mesh") + is_training = tf.placeholder(tf.bool) + inputs_dict = {} + + model_pred = model.build( + t_coord, + t_type, + t_natoms, + t_box, + t_mesh, + inputs_dict, + suffix=self.filename + + "-" + + inspect.stack()[0][3] + + "test_model_se_atten_model_compressible_excluded_types", + reuse=False, + ) + energy = model_pred["energy"] + force = model_pred["force"] + virial = model_pred["virial"] + + feed_dict_test = { + t_prop_c: test_data["prop_c"], + t_energy: test_data["energy"][:numb_test], + t_force: np.reshape(test_data["force"][:numb_test, :], [-1]), + t_virial: np.reshape(test_data["virial"][:numb_test, :], [-1]), + t_atom_ener: np.reshape(test_data["atom_ener"][:numb_test, :], [-1]), + t_coord: np.reshape(test_data["coord"][:numb_test, :], [-1]), + t_box: test_data["box"][:numb_test, :], + t_type: np.reshape(test_data["type"][:numb_test, :], [-1]), + t_natoms: test_data["natoms_vec"], + t_mesh: test_data["default_mesh"], + is_training: False, + } + sess = self.cached_session().__enter__() + sess.run(tf.global_variables_initializer()) + [pe, pf, pv] = sess.run([energy, force, virial], feed_dict=feed_dict_test) + pf, pv = pf.reshape(-1), pv.reshape(-1) + + eps = 1e-4 + delta = 1e-6 + fdf, fdv = finite_difference_fv( + sess, energy, feed_dict_test, t_coord, t_box, delta=eps + ) + np.testing.assert_allclose(pf, fdf, delta) + np.testing.assert_allclose(pv, fdv, delta) + + tested_eps = [1e-3, 1e-4, 1e-5, 1e-6, 1e-7] + for eps in tested_eps: + deltae = 1e-15 + deltad = 1e-15 + de, df, dv = check_smooth_efv( + sess, + energy, + force, + virial, + feed_dict_test, + t_coord, + jdata["model"]["descriptor"]["rcut"], + delta=eps, + ) + np.testing.assert_allclose(de[0], de[1], rtol=0, atol=deltae) + np.testing.assert_allclose(df[0], df[1], rtol=0, atol=deltad) + np.testing.assert_allclose(dv[0], dv[1], rtol=0, atol=deltad)