From 8356629395cd1e183373f31f76cc32675c609287 Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Sun, 22 Feb 2026 16:10:11 +0800
Subject: [PATCH 01/63] feat(pt_expt): add dos, dipole, polar and property
 fittings

---
 .../dpmodel/fitting/polarizability_fitting.py |   4 +-
 deepmd/pt_expt/fitting/__init__.py            |  16 +++
 deepmd/pt_expt/fitting/dipole_fitting.py      |  23 ++++
 deepmd/pt_expt/fitting/dos_fitting.py         |  23 ++++
 .../pt_expt/fitting/polarizability_fitting.py |  23 ++++
 deepmd/pt_expt/fitting/property_fitting.py    |  25 ++++
 .../tests/consistent/fitting/test_dipole.py   |  25 ++++
 source/tests/consistent/fitting/test_dos.py   |  36 +++++
 source/tests/consistent/fitting/test_polar.py |  25 ++++
 .../tests/consistent/fitting/test_property.py |  39 ++++++
 .../pt_expt/fitting/test_dipole_fitting.py    | 128 ++++++++++++++++++
 .../tests/pt_expt/fitting/test_dos_fitting.py | 120 ++++++++++++++++
 ...g_ener_fitting.py => test_ener_fitting.py} |   0
 ...invar_fitting.py => test_invar_fitting.py} |   0
 .../pt_expt/fitting/test_polar_fitting.py     | 125 +++++++++++++++++
 .../pt_expt/fitting/test_property_fitting.py  | 120 ++++++++++++++++
 16 files changed, 731 insertions(+), 1 deletion(-)
 create mode 100644 deepmd/pt_expt/fitting/dipole_fitting.py
 create mode 100644 deepmd/pt_expt/fitting/dos_fitting.py
 create mode 100644 deepmd/pt_expt/fitting/polarizability_fitting.py
 create mode 100644 deepmd/pt_expt/fitting/property_fitting.py
 create mode 100644 source/tests/pt_expt/fitting/test_dipole_fitting.py
 create mode 100644 source/tests/pt_expt/fitting/test_dos_fitting.py
 rename source/tests/pt_expt/fitting/{test_fitting_ener_fitting.py => test_ener_fitting.py} (100%)
 rename source/tests/pt_expt/fitting/{test_fitting_invar_fitting.py => test_invar_fitting.py} (100%)
 create mode 100644 source/tests/pt_expt/fitting/test_polar_fitting.py
 create mode 100644 source/tests/pt_expt/fitting/test_property_fitting.py

diff --git a/deepmd/dpmodel/fitting/polarizability_fitting.py b/deepmd/dpmodel/fitting/polarizability_fitting.py
index f3e6318ba5..dff86f04cb 100644
--- a/deepmd/dpmodel/fitting/polarizability_fitting.py
+++ b/deepmd/dpmodel/fitting/polarizability_fitting.py
@@ -328,7 +328,9 @@ def call(
             )
             # (nframes, nloc, 1)
             bias = bias[..., None] * scale_atype
-            eye = xp.eye(3, dtype=descriptor.dtype)
+            eye = xp.eye(
+                3, dtype=descriptor.dtype, device=array_api_compat.device(descriptor)
+            )
             eye = xp.tile(eye, (nframes, nloc, 1, 1))
             # (nframes, nloc, 3, 3)
             bias = bias[..., None] * eye
diff --git a/deepmd/pt_expt/fitting/__init__.py b/deepmd/pt_expt/fitting/__init__.py
index 4a7c8100de..3b69392cfd 100644
--- a/deepmd/pt_expt/fitting/__init__.py
+++ b/deepmd/pt_expt/fitting/__init__.py
@@ -2,15 +2,31 @@
 from .base_fitting import (
     BaseFitting,
 )
+from .dipole_fitting import (
+    DipoleFitting,
+)
+from .dos_fitting import (
+    DOSFittingNet,
+)
 from .ener_fitting import (
     EnergyFittingNet,
 )
 from .invar_fitting import (
     InvarFitting,
 )
+from .polarizability_fitting import (
+    PolarFitting,
+)
+from .property_fitting import (
+    PropertyFittingNet,
+)
 
 __all__ = [
     "BaseFitting",
+    "DOSFittingNet",
+    "DipoleFitting",
     "EnergyFittingNet",
     "InvarFitting",
+    "PolarFitting",
+    "PropertyFittingNet",
 ]
diff --git a/deepmd/pt_expt/fitting/dipole_fitting.py b/deepmd/pt_expt/fitting/dipole_fitting.py
new file mode 100644
index 0000000000..a16a96fe72
--- /dev/null
+++ b/deepmd/pt_expt/fitting/dipole_fitting.py
@@ -0,0 +1,23 @@
+# SPDX-License-Identifier: LGPL-3.0-or-later
+
+from deepmd.dpmodel.fitting.dipole_fitting import DipoleFitting as DipoleFittingDP
+from deepmd.pt_expt.common import (
+    register_dpmodel_mapping,
+    torch_module,
+)
+
+from .base_fitting import (
+    BaseFitting,
+)
+
+
+@BaseFitting.register("dipole")
+@torch_module
+class DipoleFitting(DipoleFittingDP):
+    pass
+
+
+register_dpmodel_mapping(
+    DipoleFittingDP,
+    lambda v: DipoleFitting.deserialize(v.serialize()),
+)
diff --git a/deepmd/pt_expt/fitting/dos_fitting.py b/deepmd/pt_expt/fitting/dos_fitting.py
new file mode 100644
index 0000000000..8c51fcc0eb
--- /dev/null
+++ b/deepmd/pt_expt/fitting/dos_fitting.py
@@ -0,0 +1,23 @@
+# SPDX-License-Identifier: LGPL-3.0-or-later
+
+from deepmd.dpmodel.fitting.dos_fitting import DOSFittingNet as DOSFittingNetDP
+from deepmd.pt_expt.common import (
+    register_dpmodel_mapping,
+    torch_module,
+)
+
+from .base_fitting import (
+    BaseFitting,
+)
+
+
+@BaseFitting.register("dos")
+@torch_module
+class DOSFittingNet(DOSFittingNetDP):
+    pass
+
+
+register_dpmodel_mapping(
+    DOSFittingNetDP,
+    lambda v: DOSFittingNet.deserialize(v.serialize()),
+)
diff --git a/deepmd/pt_expt/fitting/polarizability_fitting.py b/deepmd/pt_expt/fitting/polarizability_fitting.py
new file mode 100644
index 0000000000..564df7e0d7
--- /dev/null
+++ b/deepmd/pt_expt/fitting/polarizability_fitting.py
@@ -0,0 +1,23 @@
+# SPDX-License-Identifier: LGPL-3.0-or-later
+
+from deepmd.dpmodel.fitting.polarizability_fitting import PolarFitting as PolarFittingDP
+from deepmd.pt_expt.common import (
+    register_dpmodel_mapping,
+    torch_module,
+)
+
+from .base_fitting import (
+    BaseFitting,
+)
+
+
+@BaseFitting.register("polar")
+@torch_module
+class PolarFitting(PolarFittingDP):
+    pass
+
+
+register_dpmodel_mapping(
+    PolarFittingDP,
+    lambda v: PolarFitting.deserialize(v.serialize()),
+)
diff --git a/deepmd/pt_expt/fitting/property_fitting.py b/deepmd/pt_expt/fitting/property_fitting.py
new file mode 100644
index 0000000000..318e30fad6
--- /dev/null
+++ b/deepmd/pt_expt/fitting/property_fitting.py
@@ -0,0 +1,25 @@
+# SPDX-License-Identifier: LGPL-3.0-or-later
+
+from deepmd.dpmodel.fitting.property_fitting import (
+    PropertyFittingNet as PropertyFittingNetDP,
+)
+from deepmd.pt_expt.common import (
+    register_dpmodel_mapping,
+    torch_module,
+)
+
+from .base_fitting import (
+    BaseFitting,
+)
+
+
+@BaseFitting.register("property")
+@torch_module
+class PropertyFittingNet(PropertyFittingNetDP):
+    pass
+
+
+register_dpmodel_mapping(
+    PropertyFittingNetDP,
+    lambda v: PropertyFittingNet.deserialize(v.serialize()),
+)
diff --git a/source/tests/consistent/fitting/test_dipole.py b/source/tests/consistent/fitting/test_dipole.py
index c81499611f..245744a93e 100644
--- a/source/tests/consistent/fitting/test_dipole.py
+++ b/source/tests/consistent/fitting/test_dipole.py
@@ -18,6 +18,7 @@
     INSTALLED_ARRAY_API_STRICT,
     INSTALLED_JAX,
     INSTALLED_PT,
+    INSTALLED_PT_EXPT,
     INSTALLED_TF,
     CommonTest,
     parameterized,
@@ -33,6 +34,13 @@
     from deepmd.pt.utils.env import DEVICE as PT_DEVICE
 else:
     DipoleFittingPT = object
+if INSTALLED_PT_EXPT:
+    from deepmd.pt_expt.fitting.dipole_fitting import (
+        DipoleFitting as DipoleFittingPTExpt,
+    )
+    from deepmd.pt_expt.utils.env import DEVICE as PT_EXPT_DEVICE
+else:
+    DipoleFittingPTExpt = None
 if INSTALLED_TF:
     from deepmd.tf.fit.dipole import DipoleFittingSeA as DipoleFittingTF
 else:
@@ -116,12 +124,17 @@ def skip_pt(self) -> bool:
     tf_class = DipoleFittingTF
     dp_class = DipoleFittingDP
     pt_class = DipoleFittingPT
+    pt_expt_class = DipoleFittingPTExpt
     jax_class = DipoleFittingJAX
     array_api_strict_class = DipoleFittingArrayAPIStrict
     args = fitting_dipole()
     skip_jax = not INSTALLED_JAX
     skip_array_api_strict = not INSTALLED_ARRAY_API_STRICT
 
+    @property
+    def skip_pt_expt(self) -> bool:
+        return CommonTest.skip_pt_expt
+
     def setUp(self) -> None:
         CommonTest.setUp(self)
 
@@ -184,6 +197,18 @@ def eval_pt(self, pt_obj: Any) -> Any:
             .numpy()
         )
 
+    def eval_pt_expt(self, pt_expt_obj: Any) -> Any:
+        return (
+            pt_expt_obj(
+                torch.from_numpy(self.inputs).to(device=PT_EXPT_DEVICE),
+                torch.from_numpy(self.atype.reshape(1, -1)).to(device=PT_EXPT_DEVICE),
+                gr=torch.from_numpy(self.gr).to(device=PT_EXPT_DEVICE),
+            )["dipole"]
+            .detach()
+            .cpu()
+            .numpy()
+        )
+
     def eval_dp(self, dp_obj: Any) -> Any:
         (
             resnet_dt,
diff --git a/source/tests/consistent/fitting/test_dos.py b/source/tests/consistent/fitting/test_dos.py
index a77bc28c17..f758c9d317 100644
--- a/source/tests/consistent/fitting/test_dos.py
+++ b/source/tests/consistent/fitting/test_dos.py
@@ -18,6 +18,7 @@
     INSTALLED_ARRAY_API_STRICT,
     INSTALLED_JAX,
     INSTALLED_PT,
+    INSTALLED_PT_EXPT,
     INSTALLED_TF,
     CommonTest,
     parameterized,
@@ -33,6 +34,11 @@
     from deepmd.pt.utils.env import DEVICE as PT_DEVICE
 else:
     DOSFittingPT = object
+if INSTALLED_PT_EXPT:
+    from deepmd.pt_expt.fitting.dos_fitting import DOSFittingNet as DOSFittingPTExpt
+    from deepmd.pt_expt.utils.env import DEVICE as PT_EXPT_DEVICE
+else:
+    DOSFittingPTExpt = None
 if INSTALLED_TF:
     from deepmd.tf.fit.dos import DOSFitting as DOSFittingTF
 else:
@@ -106,9 +112,14 @@ def skip_jax(self) -> bool:
     def skip_array_api_strict(self) -> bool:
         return not INSTALLED_ARRAY_API_STRICT
 
+    @property
+    def skip_pt_expt(self) -> bool:
+        return CommonTest.skip_pt_expt
+
     tf_class = DOSFittingTF
     dp_class = DOSFittingDP
     pt_class = DOSFittingPT
+    pt_expt_class = DOSFittingPTExpt
     jax_class = DOSFittingJAX
     array_api_strict_class = DOSFittingStrict
     args = fitting_dos()
@@ -187,6 +198,31 @@ def eval_pt(self, pt_obj: Any) -> Any:
             .numpy()
         )
 
+    def eval_pt_expt(self, pt_expt_obj: Any) -> Any:
+        (
+            resnet_dt,
+            precision,
+            mixed_types,
+            numb_fparam,
+            numb_aparam,
+            numb_dos,
+        ) = self.param
+        return (
+            pt_expt_obj(
+                torch.from_numpy(self.inputs).to(device=PT_EXPT_DEVICE),
+                torch.from_numpy(self.atype.reshape(1, -1)).to(device=PT_EXPT_DEVICE),
+                fparam=torch.from_numpy(self.fparam).to(device=PT_EXPT_DEVICE)
+                if numb_fparam
+                else None,
+                aparam=torch.from_numpy(self.aparam).to(device=PT_EXPT_DEVICE)
+                if numb_aparam
+                else None,
+            )["dos"]
+            .detach()
+            .cpu()
+            .numpy()
+        )
+
     def eval_dp(self, dp_obj: Any) -> Any:
         (
             resnet_dt,
diff --git a/source/tests/consistent/fitting/test_polar.py b/source/tests/consistent/fitting/test_polar.py
index a52beea0c7..142cbefdc8 100644
--- a/source/tests/consistent/fitting/test_polar.py
+++ b/source/tests/consistent/fitting/test_polar.py
@@ -18,6 +18,7 @@
     INSTALLED_ARRAY_API_STRICT,
     INSTALLED_JAX,
     INSTALLED_PT,
+    INSTALLED_PT_EXPT,
     INSTALLED_TF,
     CommonTest,
     parameterized,
@@ -33,6 +34,13 @@
     from deepmd.pt.utils.env import DEVICE as PT_DEVICE
 else:
     PolarFittingPT = object
+if INSTALLED_PT_EXPT:
+    from deepmd.pt_expt.fitting.polarizability_fitting import (
+        PolarFitting as PolarFittingPTExpt,
+    )
+    from deepmd.pt_expt.utils.env import DEVICE as PT_EXPT_DEVICE
+else:
+    PolarFittingPTExpt = None
 if INSTALLED_TF:
     from deepmd.tf.fit.polar import PolarFittingSeA as PolarFittingTF
 else:
@@ -90,12 +98,17 @@ def skip_pt(self) -> bool:
     tf_class = PolarFittingTF
     dp_class = PolarFittingDP
     pt_class = PolarFittingPT
+    pt_expt_class = PolarFittingPTExpt
     jax_class = PolarFittingJAX
     array_api_strict_class = PolarFittingArrayAPIStrict
     args = fitting_polar()
     skip_jax = not INSTALLED_JAX
     skip_array_api_strict = not INSTALLED_ARRAY_API_STRICT
 
+    @property
+    def skip_pt_expt(self) -> bool:
+        return CommonTest.skip_pt_expt
+
     def setUp(self) -> None:
         CommonTest.setUp(self)
 
@@ -155,6 +168,18 @@ def eval_pt(self, pt_obj: Any) -> Any:
             .numpy()
         )
 
+    def eval_pt_expt(self, pt_expt_obj: Any) -> Any:
+        return (
+            pt_expt_obj(
+                torch.from_numpy(self.inputs).to(device=PT_EXPT_DEVICE),
+                torch.from_numpy(self.atype.reshape(1, -1)).to(device=PT_EXPT_DEVICE),
+                gr=torch.from_numpy(self.gr).to(device=PT_EXPT_DEVICE),
+            )["polarizability"]
+            .detach()
+            .cpu()
+            .numpy()
+        )
+
     def eval_dp(self, dp_obj: Any) -> Any:
         (
             resnet_dt,
diff --git a/source/tests/consistent/fitting/test_property.py b/source/tests/consistent/fitting/test_property.py
index bccd20bd54..a9da348410 100644
--- a/source/tests/consistent/fitting/test_property.py
+++ b/source/tests/consistent/fitting/test_property.py
@@ -23,6 +23,7 @@
     INSTALLED_ARRAY_API_STRICT,
     INSTALLED_JAX,
     INSTALLED_PT,
+    INSTALLED_PT_EXPT,
     CommonTest,
     parameterized,
 )
@@ -37,6 +38,13 @@
     from deepmd.pt.utils.env import DEVICE as PT_DEVICE
 else:
     PropertyFittingPT = object
+if INSTALLED_PT_EXPT:
+    from deepmd.pt_expt.fitting.property_fitting import (
+        PropertyFittingNet as PropertyFittingPTExpt,
+    )
+    from deepmd.pt_expt.utils.env import DEVICE as PT_EXPT_DEVICE
+else:
+    PropertyFittingPTExpt = None
 if INSTALLED_JAX:
     from deepmd.jax.env import (
         jnp,
@@ -110,9 +118,14 @@ def skip_tf(self) -> bool:
     skip_jax = not INSTALLED_JAX
     skip_array_api_strict = not INSTALLED_ARRAY_API_STRICT
 
+    @property
+    def skip_pt_expt(self) -> bool:
+        return CommonTest.skip_pt_expt
+
     tf_class = PropertyFittingTF
     dp_class = PropertyFittingDP
     pt_class = PropertyFittingPT
+    pt_expt_class = PropertyFittingPTExpt
     jax_class = PropertyFittingJAX
     array_api_strict_class = PropertyFittingStrict
     args = fitting_property()
@@ -194,6 +207,32 @@ def eval_pt(self, pt_obj: Any) -> Any:
             .numpy()
         )
 
+    def eval_pt_expt(self, pt_expt_obj: Any) -> Any:
+        (
+            resnet_dt,
+            precision,
+            mixed_types,
+            numb_fparam,
+            numb_aparam,
+            task_dim,
+            intensive,
+        ) = self.param
+        return (
+            pt_expt_obj(
+                torch.from_numpy(self.inputs).to(device=PT_EXPT_DEVICE),
+                torch.from_numpy(self.atype.reshape(1, -1)).to(device=PT_EXPT_DEVICE),
+                fparam=torch.from_numpy(self.fparam).to(device=PT_EXPT_DEVICE)
+                if numb_fparam
+                else None,
+                aparam=torch.from_numpy(self.aparam).to(device=PT_EXPT_DEVICE)
+                if numb_aparam
+                else None,
+            )[pt_expt_obj.var_name]
+            .detach()
+            .cpu()
+            .numpy()
+        )
+
     def eval_dp(self, dp_obj: Any) -> Any:
         (
             resnet_dt,
diff --git a/source/tests/pt_expt/fitting/test_dipole_fitting.py b/source/tests/pt_expt/fitting/test_dipole_fitting.py
new file mode 100644
index 0000000000..8d25b55075
--- /dev/null
+++ b/source/tests/pt_expt/fitting/test_dipole_fitting.py
@@ -0,0 +1,128 @@
+# SPDX-License-Identifier: LGPL-3.0-or-later
+import unittest
+
+import numpy as np
+import torch
+
+from deepmd.dpmodel.descriptor import (
+    DescrptSeA,
+)
+from deepmd.pt_expt.fitting import (
+    DipoleFitting,
+)
+from deepmd.pt_expt.utils import (
+    env,
+)
+
+from ...pt.model.test_env_mat import (
+    TestCaseSingleFrameWithNlist,
+)
+from ...seed import (
+    GLOBAL_SEED,
+)
+
+
+class TestDipoleFitting(unittest.TestCase, TestCaseSingleFrameWithNlist):
+    def setUp(self) -> None:
+        TestCaseSingleFrameWithNlist.setUp(self)
+        self.device = env.DEVICE
+
+    def test_self_consistency(self) -> None:
+        rng = np.random.default_rng(GLOBAL_SEED)
+        nf, nloc, nnei = self.nlist.shape
+        ds = DescrptSeA(self.rcut, self.rcut_smth, self.sel)
+        dd = ds.call(self.coord_ext, self.atype_ext, self.nlist)
+        atype = self.atype_ext[:, :nloc]
+
+        # dd[0]: descriptor, dd[1]: gr (rotation matrix, nf x nloc x nnei x 3... but
+        # for se_a, gr shape is nf x nloc x m1 x 3)
+        embedding_width = ds.get_dim_emb()
+
+        for nfp, nap in [(0, 0), (3, 0), (0, 4), (3, 4)]:
+            fn0 = DipoleFitting(
+                self.nt,
+                ds.dim_out,
+                embedding_width,
+                numb_fparam=nfp,
+                numb_aparam=nap,
+            ).to(self.device)
+            fn1 = DipoleFitting.deserialize(fn0.serialize()).to(self.device)
+            if nfp > 0:
+                ifp = torch.from_numpy(rng.normal(size=(self.nf, nfp))).to(self.device)
+            else:
+                ifp = None
+            if nap > 0:
+                iap = torch.from_numpy(rng.normal(size=(self.nf, self.nloc, nap))).to(
+                    self.device
+                )
+            else:
+                iap = None
+            ret0 = fn0(
+                torch.from_numpy(dd[0]).to(self.device),
+                torch.from_numpy(atype).to(self.device),
+                gr=torch.from_numpy(dd[1]).to(self.device),
+                fparam=ifp,
+                aparam=iap,
+            )
+            ret1 = fn1(
+                torch.from_numpy(dd[0]).to(self.device),
+                torch.from_numpy(atype).to(self.device),
+                gr=torch.from_numpy(dd[1]).to(self.device),
+                fparam=ifp,
+                aparam=iap,
+            )
+            np.testing.assert_allclose(
+                ret0["dipole"].detach().cpu().numpy(),
+                ret1["dipole"].detach().cpu().numpy(),
+            )
+
+    def test_serialize_has_correct_type(self) -> None:
+        ds = DescrptSeA(self.rcut, self.rcut_smth, self.sel)
+        embedding_width = ds.get_dim_emb()
+        fn = DipoleFitting(
+            self.nt,
+            ds.dim_out,
+            embedding_width,
+        ).to(self.device)
+        serialized = fn.serialize()
+        self.assertEqual(serialized["type"], "dipole")
+        fn2 = DipoleFitting.deserialize(serialized).to(self.device)
+        self.assertIsInstance(fn2, DipoleFitting)
+
+    def test_torch_export_simple(self) -> None:
+        nf, nloc, nnei = self.nlist.shape
+        ds = DescrptSeA(self.rcut, self.rcut_smth, self.sel)
+        dd = ds.call(self.coord_ext, self.atype_ext, self.nlist)
+        embedding_width = ds.get_dim_emb()
+        rng = np.random.default_rng(GLOBAL_SEED)
+
+        fn = DipoleFitting(
+            self.nt,
+            ds.dim_out,
+            embedding_width,
+            numb_fparam=0,
+            numb_aparam=0,
+        ).to(self.device)
+
+        descriptor = torch.from_numpy(dd[0]).to(self.device)
+        atype = torch.from_numpy(self.atype_ext[:, :nloc]).to(self.device)
+        gr = torch.from_numpy(dd[1]).to(self.device)
+
+        ret = fn(descriptor, atype, gr=gr)
+        self.assertIn("dipole", ret)
+
+        exported = torch.export.export(
+            fn,
+            (descriptor, atype),
+            kwargs={"gr": gr},
+            strict=False,
+        )
+        self.assertIsNotNone(exported)
+
+        ret_exported = exported.module()(descriptor, atype, gr=gr)
+        np.testing.assert_allclose(
+            ret["dipole"].detach().cpu().numpy(),
+            ret_exported["dipole"].detach().cpu().numpy(),
+            rtol=1e-10,
+            atol=1e-10,
+        )
diff --git a/source/tests/pt_expt/fitting/test_dos_fitting.py b/source/tests/pt_expt/fitting/test_dos_fitting.py
new file mode 100644
index 0000000000..e16b6f6569
--- /dev/null
+++ b/source/tests/pt_expt/fitting/test_dos_fitting.py
@@ -0,0 +1,120 @@
+# SPDX-License-Identifier: LGPL-3.0-or-later
+import unittest
+
+import numpy as np
+import torch
+
+from deepmd.dpmodel.descriptor import (
+    DescrptSeA,
+)
+from deepmd.pt_expt.fitting import (
+    DOSFittingNet,
+)
+from deepmd.pt_expt.utils import (
+    env,
+)
+
+from ...pt.model.test_env_mat import (
+    TestCaseSingleFrameWithNlist,
+)
+from ...seed import (
+    GLOBAL_SEED,
+)
+
+
+class TestDOSFittingNet(unittest.TestCase, TestCaseSingleFrameWithNlist):
+    def setUp(self) -> None:
+        TestCaseSingleFrameWithNlist.setUp(self)
+        self.device = env.DEVICE
+
+    def test_self_consistency(self) -> None:
+        rng = np.random.default_rng(GLOBAL_SEED)
+        nf, nloc, nnei = self.nlist.shape
+        ds = DescrptSeA(self.rcut, self.rcut_smth, self.sel)
+        dd = ds.call(self.coord_ext, self.atype_ext, self.nlist)
+        atype = self.atype_ext[:, :nloc]
+
+        for nfp, nap in [(0, 0), (3, 0), (0, 4), (3, 4)]:
+            fn0 = DOSFittingNet(
+                self.nt,
+                ds.dim_out,
+                numb_dos=10,
+                numb_fparam=nfp,
+                numb_aparam=nap,
+            ).to(self.device)
+            fn1 = DOSFittingNet.deserialize(fn0.serialize()).to(self.device)
+            if nfp > 0:
+                ifp = torch.from_numpy(rng.normal(size=(self.nf, nfp))).to(self.device)
+            else:
+                ifp = None
+            if nap > 0:
+                iap = torch.from_numpy(rng.normal(size=(self.nf, self.nloc, nap))).to(
+                    self.device
+                )
+            else:
+                iap = None
+            ret0 = fn0(
+                torch.from_numpy(dd[0]).to(self.device),
+                torch.from_numpy(atype).to(self.device),
+                fparam=ifp,
+                aparam=iap,
+            )
+            ret1 = fn1(
+                torch.from_numpy(dd[0]).to(self.device),
+                torch.from_numpy(atype).to(self.device),
+                fparam=ifp,
+                aparam=iap,
+            )
+            np.testing.assert_allclose(
+                ret0["dos"].detach().cpu().numpy(),
+                ret1["dos"].detach().cpu().numpy(),
+            )
+
+    def test_serialize_has_correct_type(self) -> None:
+        ds = DescrptSeA(self.rcut, self.rcut_smth, self.sel)
+        fn = DOSFittingNet(
+            self.nt,
+            ds.dim_out,
+            numb_dos=10,
+        ).to(self.device)
+        serialized = fn.serialize()
+        self.assertEqual(serialized["type"], "dos")
+        fn2 = DOSFittingNet.deserialize(serialized).to(self.device)
+        self.assertIsInstance(fn2, DOSFittingNet)
+
+    def test_torch_export_simple(self) -> None:
+        nf, nloc, nnei = self.nlist.shape
+        ds = DescrptSeA(self.rcut, self.rcut_smth, self.sel)
+        rng = np.random.default_rng(GLOBAL_SEED)
+
+        fn = DOSFittingNet(
+            self.nt,
+            ds.dim_out,
+            numb_dos=10,
+            numb_fparam=0,
+            numb_aparam=0,
+        ).to(self.device)
+
+        descriptor = torch.from_numpy(
+            rng.standard_normal((self.nf, self.nloc, ds.dim_out))
+        ).to(self.device)
+        atype = torch.from_numpy(self.atype_ext[:, :nloc]).to(self.device)
+
+        ret = fn(descriptor, atype)
+        self.assertIn("dos", ret)
+
+        exported = torch.export.export(
+            fn,
+            (descriptor, atype),
+            kwargs={},
+            strict=False,
+        )
+        self.assertIsNotNone(exported)
+
+        ret_exported = exported.module()(descriptor, atype)
+        np.testing.assert_allclose(
+            ret["dos"].detach().cpu().numpy(),
+            ret_exported["dos"].detach().cpu().numpy(),
+            rtol=1e-10,
+            atol=1e-10,
+        )
diff --git a/source/tests/pt_expt/fitting/test_fitting_ener_fitting.py b/source/tests/pt_expt/fitting/test_ener_fitting.py
similarity index 100%
rename from source/tests/pt_expt/fitting/test_fitting_ener_fitting.py
rename to source/tests/pt_expt/fitting/test_ener_fitting.py
diff --git a/source/tests/pt_expt/fitting/test_fitting_invar_fitting.py b/source/tests/pt_expt/fitting/test_invar_fitting.py
similarity index 100%
rename from source/tests/pt_expt/fitting/test_fitting_invar_fitting.py
rename to source/tests/pt_expt/fitting/test_invar_fitting.py
diff --git a/source/tests/pt_expt/fitting/test_polar_fitting.py b/source/tests/pt_expt/fitting/test_polar_fitting.py
new file mode 100644
index 0000000000..24b38b1fe9
--- /dev/null
+++ b/source/tests/pt_expt/fitting/test_polar_fitting.py
@@ -0,0 +1,125 @@
+# SPDX-License-Identifier: LGPL-3.0-or-later
+import unittest
+
+import numpy as np
+import torch
+
+from deepmd.dpmodel.descriptor import (
+    DescrptSeA,
+)
+from deepmd.pt_expt.fitting import (
+    PolarFitting,
+)
+from deepmd.pt_expt.utils import (
+    env,
+)
+
+from ...pt.model.test_env_mat import (
+    TestCaseSingleFrameWithNlist,
+)
+from ...seed import (
+    GLOBAL_SEED,
+)
+
+
+class TestPolarFitting(unittest.TestCase, TestCaseSingleFrameWithNlist):
+    def setUp(self) -> None:
+        TestCaseSingleFrameWithNlist.setUp(self)
+        self.device = env.DEVICE
+
+    def test_self_consistency(self) -> None:
+        rng = np.random.default_rng(GLOBAL_SEED)
+        nf, nloc, nnei = self.nlist.shape
+        ds = DescrptSeA(self.rcut, self.rcut_smth, self.sel)
+        dd = ds.call(self.coord_ext, self.atype_ext, self.nlist)
+        atype = self.atype_ext[:, :nloc]
+
+        embedding_width = ds.get_dim_emb()
+
+        for nfp, nap in [(0, 0), (3, 0), (0, 4), (3, 4)]:
+            fn0 = PolarFitting(
+                self.nt,
+                ds.dim_out,
+                embedding_width,
+                numb_fparam=nfp,
+                numb_aparam=nap,
+            ).to(self.device)
+            fn1 = PolarFitting.deserialize(fn0.serialize()).to(self.device)
+            if nfp > 0:
+                ifp = torch.from_numpy(rng.normal(size=(self.nf, nfp))).to(self.device)
+            else:
+                ifp = None
+            if nap > 0:
+                iap = torch.from_numpy(rng.normal(size=(self.nf, self.nloc, nap))).to(
+                    self.device
+                )
+            else:
+                iap = None
+            ret0 = fn0(
+                torch.from_numpy(dd[0]).to(self.device),
+                torch.from_numpy(atype).to(self.device),
+                gr=torch.from_numpy(dd[1]).to(self.device),
+                fparam=ifp,
+                aparam=iap,
+            )
+            ret1 = fn1(
+                torch.from_numpy(dd[0]).to(self.device),
+                torch.from_numpy(atype).to(self.device),
+                gr=torch.from_numpy(dd[1]).to(self.device),
+                fparam=ifp,
+                aparam=iap,
+            )
+            np.testing.assert_allclose(
+                ret0["polarizability"].detach().cpu().numpy(),
+                ret1["polarizability"].detach().cpu().numpy(),
+            )
+
+    def test_serialize_has_correct_type(self) -> None:
+        ds = DescrptSeA(self.rcut, self.rcut_smth, self.sel)
+        embedding_width = ds.get_dim_emb()
+        fn = PolarFitting(
+            self.nt,
+            ds.dim_out,
+            embedding_width,
+        ).to(self.device)
+        serialized = fn.serialize()
+        self.assertEqual(serialized["type"], "polar")
+        fn2 = PolarFitting.deserialize(serialized).to(self.device)
+        self.assertIsInstance(fn2, PolarFitting)
+
+    def test_torch_export_simple(self) -> None:
+        nf, nloc, nnei = self.nlist.shape
+        ds = DescrptSeA(self.rcut, self.rcut_smth, self.sel)
+        dd = ds.call(self.coord_ext, self.atype_ext, self.nlist)
+        embedding_width = ds.get_dim_emb()
+
+        fn = PolarFitting(
+            self.nt,
+            ds.dim_out,
+            embedding_width,
+            numb_fparam=0,
+            numb_aparam=0,
+        ).to(self.device)
+
+        descriptor = torch.from_numpy(dd[0]).to(self.device)
+        atype = torch.from_numpy(self.atype_ext[:, :nloc]).to(self.device)
+        gr = torch.from_numpy(dd[1]).to(self.device)
+
+        ret = fn(descriptor, atype, gr=gr)
+        self.assertIn("polarizability", ret)
+
+        exported = torch.export.export(
+            fn,
+            (descriptor, atype),
+            kwargs={"gr": gr},
+            strict=False,
+        )
+        self.assertIsNotNone(exported)
+
+        ret_exported = exported.module()(descriptor, atype, gr=gr)
+        np.testing.assert_allclose(
+            ret["polarizability"].detach().cpu().numpy(),
+            ret_exported["polarizability"].detach().cpu().numpy(),
+            rtol=1e-10,
+            atol=1e-10,
+        )
diff --git a/source/tests/pt_expt/fitting/test_property_fitting.py b/source/tests/pt_expt/fitting/test_property_fitting.py
new file mode 100644
index 0000000000..44a499ed9d
--- /dev/null
+++ b/source/tests/pt_expt/fitting/test_property_fitting.py
@@ -0,0 +1,120 @@
+# SPDX-License-Identifier: LGPL-3.0-or-later
+import unittest
+
+import numpy as np
+import torch
+
+from deepmd.dpmodel.descriptor import (
+    DescrptSeA,
+)
+from deepmd.pt_expt.fitting import (
+    PropertyFittingNet,
+)
+from deepmd.pt_expt.utils import (
+    env,
+)
+
+from ...pt.model.test_env_mat import (
+    TestCaseSingleFrameWithNlist,
+)
+from ...seed import (
+    GLOBAL_SEED,
+)
+
+
+class TestPropertyFittingNet(unittest.TestCase, TestCaseSingleFrameWithNlist):
+    def setUp(self) -> None:
+        TestCaseSingleFrameWithNlist.setUp(self)
+        self.device = env.DEVICE
+
+    def test_self_consistency(self) -> None:
+        rng = np.random.default_rng(GLOBAL_SEED)
+        nf, nloc, nnei = self.nlist.shape
+        ds = DescrptSeA(self.rcut, self.rcut_smth, self.sel)
+        dd = ds.call(self.coord_ext, self.atype_ext, self.nlist)
+        atype = self.atype_ext[:, :nloc]
+
+        for nfp, nap in [(0, 0), (3, 0), (0, 4), (3, 4)]:
+            fn0 = PropertyFittingNet(
+                self.nt,
+                ds.dim_out,
+                task_dim=3,
+                numb_fparam=nfp,
+                numb_aparam=nap,
+            ).to(self.device)
+            fn1 = PropertyFittingNet.deserialize(fn0.serialize()).to(self.device)
+            if nfp > 0:
+                ifp = torch.from_numpy(rng.normal(size=(self.nf, nfp))).to(self.device)
+            else:
+                ifp = None
+            if nap > 0:
+                iap = torch.from_numpy(rng.normal(size=(self.nf, self.nloc, nap))).to(
+                    self.device
+                )
+            else:
+                iap = None
+            ret0 = fn0(
+                torch.from_numpy(dd[0]).to(self.device),
+                torch.from_numpy(atype).to(self.device),
+                fparam=ifp,
+                aparam=iap,
+            )
+            ret1 = fn1(
+                torch.from_numpy(dd[0]).to(self.device),
+                torch.from_numpy(atype).to(self.device),
+                fparam=ifp,
+                aparam=iap,
+            )
+            np.testing.assert_allclose(
+                ret0["property"].detach().cpu().numpy(),
+                ret1["property"].detach().cpu().numpy(),
+            )
+
+    def test_serialize_has_correct_type(self) -> None:
+        ds = DescrptSeA(self.rcut, self.rcut_smth, self.sel)
+        fn = PropertyFittingNet(
+            self.nt,
+            ds.dim_out,
+            task_dim=3,
+        ).to(self.device)
+        serialized = fn.serialize()
+        self.assertEqual(serialized["type"], "property")
+        fn2 = PropertyFittingNet.deserialize(serialized).to(self.device)
+        self.assertIsInstance(fn2, PropertyFittingNet)
+
+    def test_torch_export_simple(self) -> None:
+        nf, nloc, nnei = self.nlist.shape
+        ds = DescrptSeA(self.rcut, self.rcut_smth, self.sel)
+        rng = np.random.default_rng(GLOBAL_SEED)
+
+        fn = PropertyFittingNet(
+            self.nt,
+            ds.dim_out,
+            task_dim=3,
+            numb_fparam=0,
+            numb_aparam=0,
+        ).to(self.device)
+
+        descriptor = torch.from_numpy(
+            rng.standard_normal((self.nf, self.nloc, ds.dim_out))
+        ).to(self.device)
+        atype = torch.from_numpy(self.atype_ext[:, :nloc]).to(self.device)
+
+        ret = fn(descriptor, atype)
+        self.assertIn("property", ret)
+
+        exported = torch.export.export(
+            fn,
+            (descriptor, atype),
+            kwargs={},
+            strict=False,
+        )
+        self.assertIsNotNone(exported)
+
+        ret_exported = exported.module()(descriptor, atype)
+        np.testing.assert_allclose(
+            ret["property"].detach().cpu().numpy(),
+            ret_exported["property"].detach().cpu().numpy(),
+            rtol=1e-10,
+            atol=1e-10,
+        )

From 292fa724576af4cfed07a7b2bb1975e8fa2cf3f6 Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Sun, 22 Feb 2026 17:03:28 +0800
Subject: [PATCH 02/63] add make_fx, mv itertools to parameterized

---
 .../pt_expt/fitting/test_dipole_fitting.py    | 139 ++++++++++++------
 .../tests/pt_expt/fitting/test_dos_fitting.py | 131 +++++++++++------
 .../pt_expt/fitting/test_polar_fitting.py     | 136 +++++++++++------
 .../pt_expt/fitting/test_property_fitting.py  | 131 +++++++++++------
 4 files changed, 360 insertions(+), 177 deletions(-)

diff --git a/source/tests/pt_expt/fitting/test_dipole_fitting.py b/source/tests/pt_expt/fitting/test_dipole_fitting.py
index 8d25b55075..f5ac7ba177 100644
--- a/source/tests/pt_expt/fitting/test_dipole_fitting.py
+++ b/source/tests/pt_expt/fitting/test_dipole_fitting.py
@@ -1,8 +1,11 @@
 # SPDX-License-Identifier: LGPL-3.0-or-later
-import unittest
 
 import numpy as np
+import pytest
 import torch
+from torch.fx.experimental.proxy_tensor import (
+    make_fx,
+)
 
 from deepmd.dpmodel.descriptor import (
     DescrptSeA,
@@ -22,59 +25,57 @@
 )
 
 
-class TestDipoleFitting(unittest.TestCase, TestCaseSingleFrameWithNlist):
-    def setUp(self) -> None:
+class TestDipoleFitting(TestCaseSingleFrameWithNlist):
+    def setup_method(self) -> None:
         TestCaseSingleFrameWithNlist.setUp(self)
         self.device = env.DEVICE
 
-    def test_self_consistency(self) -> None:
+    @pytest.mark.parametrize("nfp", [0, 3])  # numb_fparam
+    @pytest.mark.parametrize("nap", [0, 4])  # numb_aparam
+    def test_self_consistency(self, nfp, nap) -> None:
         rng = np.random.default_rng(GLOBAL_SEED)
         nf, nloc, nnei = self.nlist.shape
         ds = DescrptSeA(self.rcut, self.rcut_smth, self.sel)
         dd = ds.call(self.coord_ext, self.atype_ext, self.nlist)
         atype = self.atype_ext[:, :nloc]
-
-        # dd[0]: descriptor, dd[1]: gr (rotation matrix, nf x nloc x nnei x 3... but
-        # for se_a, gr shape is nf x nloc x m1 x 3)
         embedding_width = ds.get_dim_emb()
 
-        for nfp, nap in [(0, 0), (3, 0), (0, 4), (3, 4)]:
-            fn0 = DipoleFitting(
-                self.nt,
-                ds.dim_out,
-                embedding_width,
-                numb_fparam=nfp,
-                numb_aparam=nap,
-            ).to(self.device)
-            fn1 = DipoleFitting.deserialize(fn0.serialize()).to(self.device)
-            if nfp > 0:
-                ifp = torch.from_numpy(rng.normal(size=(self.nf, nfp))).to(self.device)
-            else:
-                ifp = None
-            if nap > 0:
-                iap = torch.from_numpy(rng.normal(size=(self.nf, self.nloc, nap))).to(
-                    self.device
-                )
-            else:
-                iap = None
-            ret0 = fn0(
-                torch.from_numpy(dd[0]).to(self.device),
-                torch.from_numpy(atype).to(self.device),
-                gr=torch.from_numpy(dd[1]).to(self.device),
-                fparam=ifp,
-                aparam=iap,
-            )
-            ret1 = fn1(
-                torch.from_numpy(dd[0]).to(self.device),
-                torch.from_numpy(atype).to(self.device),
-                gr=torch.from_numpy(dd[1]).to(self.device),
-                fparam=ifp,
-                aparam=iap,
-            )
-            np.testing.assert_allclose(
-                ret0["dipole"].detach().cpu().numpy(),
-                ret1["dipole"].detach().cpu().numpy(),
+        fn0 = DipoleFitting(
+            self.nt,
+            ds.dim_out,
+            embedding_width,
+            numb_fparam=nfp,
+            numb_aparam=nap,
+        ).to(self.device)
+        fn1 = DipoleFitting.deserialize(fn0.serialize()).to(self.device)
+        if nfp > 0:
+            ifp = torch.from_numpy(rng.normal(size=(self.nf, nfp))).to(self.device)
+        else:
+            ifp = None
+        if nap > 0:
+            iap = torch.from_numpy(rng.normal(size=(self.nf, self.nloc, nap))).to(
+                self.device
             )
+        else:
+            iap = None
+        ret0 = fn0(
+            torch.from_numpy(dd[0]).to(self.device),
+            torch.from_numpy(atype).to(self.device),
+            gr=torch.from_numpy(dd[1]).to(self.device),
+            fparam=ifp,
+            aparam=iap,
+        )
+        ret1 = fn1(
+            torch.from_numpy(dd[0]).to(self.device),
+            torch.from_numpy(atype).to(self.device),
+            gr=torch.from_numpy(dd[1]).to(self.device),
+            fparam=ifp,
+            aparam=iap,
+        )
+        np.testing.assert_allclose(
+            ret0["dipole"].detach().cpu().numpy(),
+            ret1["dipole"].detach().cpu().numpy(),
+        )
 
     def test_serialize_has_correct_type(self) -> None:
         ds = DescrptSeA(self.rcut, self.rcut_smth, self.sel)
@@ -85,16 +86,15 @@ def test_serialize_has_correct_type(self) -> None:
             embedding_width,
         ).to(self.device)
         serialized = fn.serialize()
-        self.assertEqual(serialized["type"], "dipole")
+        assert serialized["type"] == "dipole"
         fn2 = DipoleFitting.deserialize(serialized).to(self.device)
-        self.assertIsInstance(fn2, DipoleFitting)
+        assert isinstance(fn2, DipoleFitting)
 
     def test_torch_export_simple(self) -> None:
         nf, nloc, nnei = self.nlist.shape
         ds = DescrptSeA(self.rcut, self.rcut_smth, self.sel)
         dd = ds.call(self.coord_ext, self.atype_ext, self.nlist)
         embedding_width = ds.get_dim_emb()
-        rng = np.random.default_rng(GLOBAL_SEED)
 
         fn = DipoleFitting(
             self.nt,
@@ -109,7 +109,7 @@ def test_torch_export_simple(self) -> None:
         gr = torch.from_numpy(dd[1]).to(self.device)
 
         ret = fn(descriptor, atype, gr=gr)
-        self.assertIn("dipole", ret)
+        assert "dipole" in ret
 
         exported = torch.export.export(
             fn,
@@ -117,7 +117,7 @@ def test_torch_export_simple(self) -> None:
             kwargs={"gr": gr},
             strict=False,
         )
-        self.assertIsNotNone(exported)
+        assert exported is not None
 
         ret_exported = exported.module()(descriptor, atype, gr=gr)
         np.testing.assert_allclose(
@@ -126,3 +126,46 @@ def test_torch_export_simple(self) -> None:
             rtol=1e-10,
             atol=1e-10,
         )
+
+    def test_make_fx(self) -> None:
+        nf, nloc, nnei = self.nlist.shape
+        ds = DescrptSeA(self.rcut, self.rcut_smth, self.sel)
+        dd = ds.call(self.coord_ext, self.atype_ext, self.nlist)
+        embedding_width = ds.get_dim_emb()
+
+        fn0 = (
+            DipoleFitting(
+                self.nt,
+                ds.dim_out,
+                embedding_width,
+                precision="float64",
+            )
+            .to(self.device)
+            .eval()
+        )
+
+        descriptor = torch.from_numpy(dd[0]).to(self.device)
+        atype = torch.from_numpy(self.atype_ext[:, :nloc]).to(self.device)
+        gr = torch.from_numpy(dd[1]).to(self.device)
+
+        def fn(descriptor, atype, gr):
+            descriptor = descriptor.detach().requires_grad_(True)
+            ret = fn0(descriptor, atype, gr=gr)["dipole"]
+            grad = torch.autograd.grad(ret.sum(), descriptor, create_graph=False)[0]
+            return ret, grad
+
+        ret_eager, grad_eager = fn(descriptor, atype, gr)
+        traced = make_fx(fn)(descriptor, atype, gr)
+        ret_traced, grad_traced = traced(descriptor, atype, gr)
+        np.testing.assert_allclose(
+            ret_eager.detach().cpu().numpy(),
+            ret_traced.detach().cpu().numpy(),
+            rtol=1e-10,
+            atol=1e-10,
+        )
+        np.testing.assert_allclose(
+            grad_eager.detach().cpu().numpy(),
+            grad_traced.detach().cpu().numpy(),
+            rtol=1e-10,
+            atol=1e-10,
+        )
diff --git a/source/tests/pt_expt/fitting/test_dos_fitting.py b/source/tests/pt_expt/fitting/test_dos_fitting.py
index e16b6f6569..3fe06a8618 100644
--- a/source/tests/pt_expt/fitting/test_dos_fitting.py
+++ b/source/tests/pt_expt/fitting/test_dos_fitting.py
@@ -1,8 +1,11 @@
 # SPDX-License-Identifier: LGPL-3.0-or-later
-import unittest
 
 import numpy as np
+import pytest
 import torch
+from torch.fx.experimental.proxy_tensor import (
+    make_fx,
+)
 
 from deepmd.dpmodel.descriptor import (
     DescrptSeA,
@@ -22,53 +25,54 @@
 )
 
 
-class TestDOSFittingNet(unittest.TestCase, TestCaseSingleFrameWithNlist):
-    def setUp(self) -> None:
+class TestDOSFittingNet(TestCaseSingleFrameWithNlist):
+    def setup_method(self) -> None:
         TestCaseSingleFrameWithNlist.setUp(self)
         self.device = env.DEVICE
 
-    def test_self_consistency(self) -> None:
+    @pytest.mark.parametrize("nfp", [0, 3])  # numb_fparam
+    @pytest.mark.parametrize("nap", [0, 4])  # numb_aparam
+    def test_self_consistency(self, nfp, nap) -> None:
         rng = np.random.default_rng(GLOBAL_SEED)
         nf, nloc, nnei = self.nlist.shape
         ds = DescrptSeA(self.rcut, self.rcut_smth, self.sel)
         dd = ds.call(self.coord_ext, self.atype_ext, self.nlist)
         atype = self.atype_ext[:, :nloc]
 
-        for nfp, nap in [(0, 0), (3, 0), (0, 4), (3, 4)]:
-            fn0 = DOSFittingNet(
-                self.nt,
-                ds.dim_out,
-                numb_dos=10,
-                numb_fparam=nfp,
-                numb_aparam=nap,
-            ).to(self.device)
-            fn1 = DOSFittingNet.deserialize(fn0.serialize()).to(self.device)
-            if nfp > 0:
-                ifp = torch.from_numpy(rng.normal(size=(self.nf, nfp))).to(self.device)
-            else:
-                ifp = None
-            if nap > 0:
-                iap = torch.from_numpy(rng.normal(size=(self.nf, self.nloc, nap))).to(
-                    self.device
-                )
-            else:
-                iap = None
-            ret0 = fn0(
-                torch.from_numpy(dd[0]).to(self.device),
-                torch.from_numpy(atype).to(self.device),
-                fparam=ifp,
-                aparam=iap,
-            )
-            ret1 = fn1(
-                torch.from_numpy(dd[0]).to(self.device),
-                torch.from_numpy(atype).to(self.device),
-                fparam=ifp,
-                aparam=iap,
-            )
-            np.testing.assert_allclose(
-                ret0["dos"].detach().cpu().numpy(),
-                ret1["dos"].detach().cpu().numpy(),
+        fn0 = DOSFittingNet(
+            self.nt,
+            ds.dim_out,
+            numb_dos=10,
+            numb_fparam=nfp,
+            numb_aparam=nap,
+        ).to(self.device)
+        fn1 = DOSFittingNet.deserialize(fn0.serialize()).to(self.device)
+        if nfp > 0:
+            ifp = torch.from_numpy(rng.normal(size=(self.nf, nfp))).to(self.device)
+        else:
+            ifp = None
+        if nap > 0:
+            iap = torch.from_numpy(rng.normal(size=(self.nf, self.nloc, nap))).to(
+                self.device
             )
+        else:
+            iap = None
+        ret0 = fn0(
+            torch.from_numpy(dd[0]).to(self.device),
+            torch.from_numpy(atype).to(self.device),
+            fparam=ifp,
+            aparam=iap,
+        )
+        ret1 = fn1(
+            torch.from_numpy(dd[0]).to(self.device),
+            torch.from_numpy(atype).to(self.device),
+            fparam=ifp,
+            aparam=iap,
+        )
+        np.testing.assert_allclose(
+            ret0["dos"].detach().cpu().numpy(),
+            ret1["dos"].detach().cpu().numpy(),
+        )
 
     def test_serialize_has_correct_type(self) -> None:
         ds = DescrptSeA(self.rcut, self.rcut_smth, self.sel)
@@ -78,9 +82,9 @@ def test_serialize_has_correct_type(self) -> None:
             numb_dos=10,
         ).to(self.device)
         serialized = fn.serialize()
-        self.assertEqual(serialized["type"], "dos")
+        assert serialized["type"] == "dos"
         fn2 = DOSFittingNet.deserialize(serialized).to(self.device)
-        self.assertIsInstance(fn2, DOSFittingNet)
+        assert isinstance(fn2, DOSFittingNet)
 
     def test_torch_export_simple(self) -> None:
         nf, nloc, nnei = self.nlist.shape
@@ -101,7 +105,7 @@ def test_torch_export_simple(self) -> None:
         atype = torch.from_numpy(self.atype_ext[:, :nloc]).to(self.device)
 
         ret = fn(descriptor, atype)
-        self.assertIn("dos", ret)
+        assert "dos" in ret
 
         exported = torch.export.export(
             fn,
@@ -109,7 +113,7 @@ def test_torch_export_simple(self) -> None:
             kwargs={},
             strict=False,
         )
-        self.assertIsNotNone(exported)
+        assert exported is not None
 
         ret_exported = exported.module()(descriptor, atype)
         np.testing.assert_allclose(
@@ -118,3 +122,46 @@ def test_torch_export_simple(self) -> None:
             rtol=1e-10,
             atol=1e-10,
         )
+
+    def test_make_fx(self) -> None:
+        nf, nloc, nnei = self.nlist.shape
+        ds = DescrptSeA(self.rcut, self.rcut_smth, self.sel)
+        rng = np.random.default_rng(GLOBAL_SEED)
+
+        fn0 = (
+            DOSFittingNet(
+                self.nt,
+                ds.dim_out,
+                numb_dos=10,
+                precision="float64",
+            )
+            .to(self.device)
+            .eval()
+        )
+
+        descriptor = torch.from_numpy(
+            rng.standard_normal((self.nf, self.nloc, ds.dim_out))
+        ).to(self.device)
+        atype = torch.from_numpy(self.atype_ext[:, :nloc]).to(self.device)
+
+        def fn(descriptor, atype):
+            descriptor = descriptor.detach().requires_grad_(True)
+            ret = fn0(descriptor, atype)["dos"]
+            grad = torch.autograd.grad(ret.sum(), descriptor, create_graph=False)[0]
+            return ret, grad
+
+        ret_eager, grad_eager = fn(descriptor, atype)
+        traced = make_fx(fn)(descriptor, atype)
+        ret_traced, grad_traced = traced(descriptor, atype)
+        np.testing.assert_allclose(
+            ret_eager.detach().cpu().numpy(),
+            ret_traced.detach().cpu().numpy(),
+            rtol=1e-10,
+            atol=1e-10,
+        )
+        np.testing.assert_allclose(
+            grad_eager.detach().cpu().numpy(),
+            grad_traced.detach().cpu().numpy(),
+            rtol=1e-10,
+            atol=1e-10,
+        )
diff --git a/source/tests/pt_expt/fitting/test_polar_fitting.py b/source/tests/pt_expt/fitting/test_polar_fitting.py
index 24b38b1fe9..1c150f7154 100644
--- a/source/tests/pt_expt/fitting/test_polar_fitting.py
+++ b/source/tests/pt_expt/fitting/test_polar_fitting.py
@@ -1,8 +1,11 @@
 # SPDX-License-Identifier: LGPL-3.0-or-later
-import unittest
 
 import numpy as np
+import pytest
 import torch
+from torch.fx.experimental.proxy_tensor import (
+    make_fx,
+)
 
 from deepmd.dpmodel.descriptor import (
     DescrptSeA,
@@ -22,57 +25,57 @@
 )
 
 
-class TestPolarFitting(unittest.TestCase, TestCaseSingleFrameWithNlist):
-    def setUp(self) -> None:
+class TestPolarFitting(TestCaseSingleFrameWithNlist):
+    def setup_method(self) -> None:
         TestCaseSingleFrameWithNlist.setUp(self)
         self.device = env.DEVICE
 
-    def test_self_consistency(self) -> None:
+    @pytest.mark.parametrize("nfp", [0, 3])  # numb_fparam
+    @pytest.mark.parametrize("nap", [0, 4])  # numb_aparam
+    def test_self_consistency(self, nfp, nap) -> None:
         rng = np.random.default_rng(GLOBAL_SEED)
         nf, nloc, nnei = self.nlist.shape
         ds = DescrptSeA(self.rcut, self.rcut_smth, self.sel)
         dd = ds.call(self.coord_ext, self.atype_ext, self.nlist)
         atype = self.atype_ext[:, :nloc]
-
         embedding_width = ds.get_dim_emb()
 
-        for nfp, nap in [(0, 0), (3, 0), (0, 4), (3, 4)]:
-            fn0 = PolarFitting(
-                self.nt,
-                ds.dim_out,
-                embedding_width,
-                numb_fparam=nfp,
-                numb_aparam=nap,
-            ).to(self.device)
-            fn1 = PolarFitting.deserialize(fn0.serialize()).to(self.device)
-            if nfp > 0:
-                ifp = torch.from_numpy(rng.normal(size=(self.nf, nfp))).to(self.device)
-            else:
-                ifp = None
-            if nap > 0:
-                iap = torch.from_numpy(rng.normal(size=(self.nf, self.nloc, nap))).to(
-                    self.device
-                )
-            else:
-                iap = None
-            ret0 = fn0(
-                torch.from_numpy(dd[0]).to(self.device),
-                torch.from_numpy(atype).to(self.device),
-                gr=torch.from_numpy(dd[1]).to(self.device),
-                fparam=ifp,
-                aparam=iap,
-            )
-            ret1 = fn1(
-                torch.from_numpy(dd[0]).to(self.device),
-                torch.from_numpy(atype).to(self.device),
-                gr=torch.from_numpy(dd[1]).to(self.device),
-                fparam=ifp,
-                aparam=iap,
-            )
-            np.testing.assert_allclose(
-                ret0["polarizability"].detach().cpu().numpy(),
-                ret1["polarizability"].detach().cpu().numpy(),
+        fn0 = PolarFitting(
+            self.nt,
+            ds.dim_out,
+            embedding_width,
+            numb_fparam=nfp,
+            numb_aparam=nap,
+        ).to(self.device)
+        fn1 = PolarFitting.deserialize(fn0.serialize()).to(self.device)
+        if nfp > 0:
+            ifp = torch.from_numpy(rng.normal(size=(self.nf, nfp))).to(self.device)
+        else:
+            ifp = None
+        if nap > 0:
+            iap = torch.from_numpy(rng.normal(size=(self.nf, self.nloc, nap))).to(
+                self.device
             )
+        else:
+            iap = None
+        ret0 = fn0(
+            torch.from_numpy(dd[0]).to(self.device),
+            torch.from_numpy(atype).to(self.device),
+            gr=torch.from_numpy(dd[1]).to(self.device),
+            fparam=ifp,
+            aparam=iap,
+        )
+        ret1 = fn1(
+            torch.from_numpy(dd[0]).to(self.device),
+            torch.from_numpy(atype).to(self.device),
+            gr=torch.from_numpy(dd[1]).to(self.device),
+            fparam=ifp,
+            aparam=iap,
+        )
+        np.testing.assert_allclose(
+            ret0["polarizability"].detach().cpu().numpy(),
+            ret1["polarizability"].detach().cpu().numpy(),
+        )
 
     def test_serialize_has_correct_type(self) -> None:
         ds = DescrptSeA(self.rcut, self.rcut_smth, self.sel)
@@ -83,9 +86,9 @@ def test_serialize_has_correct_type(self) -> None:
             embedding_width,
         ).to(self.device)
         serialized = fn.serialize()
-        self.assertEqual(serialized["type"], "polar")
+        assert serialized["type"] == "polar"
         fn2 = PolarFitting.deserialize(serialized).to(self.device)
-        self.assertIsInstance(fn2, PolarFitting)
+        assert isinstance(fn2, PolarFitting)
 
     def test_torch_export_simple(self) -> None:
         nf, nloc, nnei = self.nlist.shape
@@ -106,7 +109,7 @@ def test_torch_export_simple(self) -> None:
         gr = torch.from_numpy(dd[1]).to(self.device)
 
         ret = fn(descriptor, atype, gr=gr)
-        self.assertIn("polarizability", ret)
+        assert "polarizability" in ret
 
         exported = torch.export.export(
             fn,
@@ -114,7 +117,7 @@ def test_torch_export_simple(self) -> None:
             kwargs={"gr": gr},
             strict=False,
         )
-        self.assertIsNotNone(exported)
+        assert exported is not None
 
         ret_exported = exported.module()(descriptor, atype, gr=gr)
         np.testing.assert_allclose(
@@ -123,3 +126,46 @@ def test_torch_export_simple(self) -> None:
             rtol=1e-10,
             atol=1e-10,
         )
+
+    def test_make_fx(self) -> None:
+        nf, nloc, nnei = self.nlist.shape
+        ds = DescrptSeA(self.rcut, self.rcut_smth, self.sel)
+        dd = ds.call(self.coord_ext, self.atype_ext, self.nlist)
+        embedding_width = ds.get_dim_emb()
+
+        fn0 = (
+            PolarFitting(
+                self.nt,
+                ds.dim_out,
+                embedding_width,
+                precision="float64",
+            )
+            .to(self.device)
+            .eval()
+        )
+
+        descriptor = torch.from_numpy(dd[0]).to(self.device)
+        atype = torch.from_numpy(self.atype_ext[:, :nloc]).to(self.device)
+        gr = torch.from_numpy(dd[1]).to(self.device)
+
+        def fn(descriptor, atype, gr):
+            descriptor = descriptor.detach().requires_grad_(True)
+            ret = fn0(descriptor, atype, gr=gr)["polarizability"]
+            grad = torch.autograd.grad(ret.sum(), descriptor, create_graph=False)[0]
+            return ret, grad
+
+        ret_eager, grad_eager = fn(descriptor, atype, gr)
+        traced = make_fx(fn)(descriptor, atype, gr)
+        ret_traced, grad_traced = traced(descriptor, atype, gr)
+        np.testing.assert_allclose(
+            ret_eager.detach().cpu().numpy(),
+            ret_traced.detach().cpu().numpy(),
+            rtol=1e-10,
+            atol=1e-10,
+        )
+        np.testing.assert_allclose(
+            grad_eager.detach().cpu().numpy(),
+            grad_traced.detach().cpu().numpy(),
+            rtol=1e-10,
+            atol=1e-10,
+        )
diff --git a/source/tests/pt_expt/fitting/test_property_fitting.py b/source/tests/pt_expt/fitting/test_property_fitting.py
index 44a499ed9d..ca3dbc11af 100644
--- a/source/tests/pt_expt/fitting/test_property_fitting.py
+++ b/source/tests/pt_expt/fitting/test_property_fitting.py
@@ -1,8 +1,11 @@
 # SPDX-License-Identifier: LGPL-3.0-or-later
-import unittest
 
 import numpy as np
+import pytest
 import torch
+from torch.fx.experimental.proxy_tensor import (
+    make_fx,
+)
 
 from deepmd.dpmodel.descriptor import (
     DescrptSeA,
@@ -22,53 +25,54 @@
 )
 
 
-class TestPropertyFittingNet(unittest.TestCase, TestCaseSingleFrameWithNlist):
-    def setUp(self) -> None:
+class TestPropertyFittingNet(TestCaseSingleFrameWithNlist):
+    def setup_method(self) -> None:
         TestCaseSingleFrameWithNlist.setUp(self)
         self.device = env.DEVICE
 
-    def test_self_consistency(self) -> None:
+    @pytest.mark.parametrize("nfp", [0, 3])  # numb_fparam
+    @pytest.mark.parametrize("nap", [0, 4])  # numb_aparam
+    def test_self_consistency(self, nfp, nap) -> None:
         rng = np.random.default_rng(GLOBAL_SEED)
         nf, nloc, nnei = self.nlist.shape
         ds = DescrptSeA(self.rcut, self.rcut_smth, self.sel)
         dd = ds.call(self.coord_ext, self.atype_ext, self.nlist)
         atype = self.atype_ext[:, :nloc]
 
-        for nfp, nap in [(0, 0), (3, 0), (0, 4), (3, 4)]:
-            fn0 = PropertyFittingNet(
-                self.nt,
-                ds.dim_out,
-                task_dim=3,
-                numb_fparam=nfp,
-                numb_aparam=nap,
-            ).to(self.device)
-            fn1 = PropertyFittingNet.deserialize(fn0.serialize()).to(self.device)
-            if nfp > 0:
-                ifp = torch.from_numpy(rng.normal(size=(self.nf, nfp))).to(self.device)
-            else:
-                ifp = None
-            if nap > 0:
-                iap = torch.from_numpy(rng.normal(size=(self.nf, self.nloc, nap))).to(
-                    self.device
-                )
-            else:
-                iap = None
-            ret0 = fn0(
-                torch.from_numpy(dd[0]).to(self.device),
-                torch.from_numpy(atype).to(self.device),
-                fparam=ifp,
-                aparam=iap,
-            )
-            ret1 = fn1(
-                torch.from_numpy(dd[0]).to(self.device),
-                torch.from_numpy(atype).to(self.device),
-                fparam=ifp,
-                aparam=iap,
-            )
-            np.testing.assert_allclose(
-                ret0["property"].detach().cpu().numpy(),
-                ret1["property"].detach().cpu().numpy(),
+        fn0 = PropertyFittingNet(
+            self.nt,
+            ds.dim_out,
+            task_dim=3,
+            numb_fparam=nfp,
+            numb_aparam=nap,
+        ).to(self.device)
+        fn1 = PropertyFittingNet.deserialize(fn0.serialize()).to(self.device)
+        if nfp > 0:
+            ifp = torch.from_numpy(rng.normal(size=(self.nf, nfp))).to(self.device)
+        else:
+            ifp = None
+        if nap > 0:
+            iap = torch.from_numpy(rng.normal(size=(self.nf, self.nloc, nap))).to(
+                self.device
             )
+        else:
+            iap = None
+        ret0 = fn0(
+            torch.from_numpy(dd[0]).to(self.device),
+            torch.from_numpy(atype).to(self.device),
+            fparam=ifp,
+            aparam=iap,
+        )
+        ret1 = fn1(
+            torch.from_numpy(dd[0]).to(self.device),
+            torch.from_numpy(atype).to(self.device),
+            fparam=ifp,
+            aparam=iap,
+        )
+        np.testing.assert_allclose(
+            ret0["property"].detach().cpu().numpy(),
+            ret1["property"].detach().cpu().numpy(),
+        )
 
     def test_serialize_has_correct_type(self) -> None:
         ds = DescrptSeA(self.rcut, self.rcut_smth, self.sel)
@@ -78,9 +82,9 @@ def test_serialize_has_correct_type(self) -> None:
             task_dim=3,
         ).to(self.device)
         serialized = fn.serialize()
-        self.assertEqual(serialized["type"], "property")
+        assert serialized["type"] == "property"
         fn2 = PropertyFittingNet.deserialize(serialized).to(self.device)
-        self.assertIsInstance(fn2, PropertyFittingNet)
+        assert isinstance(fn2, PropertyFittingNet)
 
     def test_torch_export_simple(self) -> None:
         nf, nloc, nnei = self.nlist.shape
@@ -101,7 +105,7 @@ def test_torch_export_simple(self) -> None:
         atype = torch.from_numpy(self.atype_ext[:, :nloc]).to(self.device)
 
         ret = fn(descriptor, atype)
-        self.assertIn("property", ret)
+        assert "property" in ret
 
         exported = torch.export.export(
             fn,
@@ -109,7 +113,7 @@ def test_torch_export_simple(self) -> None:
             kwargs={},
             strict=False,
         )
-        self.assertIsNotNone(exported)
+        assert exported is not None
 
         ret_exported = exported.module()(descriptor, atype)
         np.testing.assert_allclose(
@@ -118,3 +122,46 @@ def test_torch_export_simple(self) -> None:
             rtol=1e-10,
             atol=1e-10,
         )
+
+    def test_make_fx(self) -> None:
+        nf, nloc, nnei = self.nlist.shape
+        ds = DescrptSeA(self.rcut, self.rcut_smth, self.sel)
+        rng = np.random.default_rng(GLOBAL_SEED)
+
+        fn0 = (
+            PropertyFittingNet(
+                self.nt,
+                ds.dim_out,
+                task_dim=3,
+                precision="float64",
+            )
+            .to(self.device)
+            .eval()
+        )
+
+        descriptor = torch.from_numpy(
+            rng.standard_normal((self.nf, self.nloc, ds.dim_out))
+        ).to(self.device)
+        atype = torch.from_numpy(self.atype_ext[:, :nloc]).to(self.device)
+
+        def fn(descriptor, atype):
+            descriptor = descriptor.detach().requires_grad_(True)
+            ret = fn0(descriptor, atype)["property"]
+            grad = torch.autograd.grad(ret.sum(), descriptor, create_graph=False)[0]
+            return ret, grad
+
+        ret_eager, grad_eager = fn(descriptor, atype)
+        traced = make_fx(fn)(descriptor, atype)
+        ret_traced, grad_traced = traced(descriptor, atype)
+        np.testing.assert_allclose(
+            ret_eager.detach().cpu().numpy(),
+            ret_traced.detach().cpu().numpy(),
+            rtol=1e-10,
+            atol=1e-10,
+        )
+        np.testing.assert_allclose(
+            grad_eager.detach().cpu().numpy(),
+            grad_traced.detach().cpu().numpy(),
+            rtol=1e-10,
+            atol=1e-10,
+        )

From 7289167045ce9c8d02ff8480a29b087c00ea4f33 Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Sun, 22 Feb 2026 21:31:19 +0800
Subject: [PATCH 03/63] feat(pt_expt): full models dipole, polar, dos, property
 and dp-zbl

---
 .../atomic_model/linear_atomic_model.py       |   2 +-
 .../atomic_model/pairtab_atomic_model.py      |  20 +-
 .../atomic_model/polar_atomic_model.py        |   4 +-
 deepmd/dpmodel/model/make_model.py            |   2 +-
 deepmd/pt_expt/common.py                      |   5 +
 deepmd/pt_expt/model/__init__.py              |  20 ++
 deepmd/pt_expt/model/dipole_model.py          | 151 +++++++++++
 deepmd/pt_expt/model/dos_model.py             | 139 ++++++++++
 deepmd/pt_expt/model/dp_zbl_model.py          | 153 +++++++++++
 deepmd/pt_expt/model/polar_model.py           | 139 ++++++++++
 deepmd/pt_expt/model/property_model.py        | 145 +++++++++++
 source/tests/consistent/model/test_dipole.py  |  21 ++
 source/tests/consistent/model/test_dos.py     |  21 ++
 source/tests/consistent/model/test_dpa1.py    |  21 ++
 source/tests/consistent/model/test_polar.py   |  21 ++
 .../tests/consistent/model/test_property.py   |  27 +-
 .../tests/consistent/model/test_zbl_ener.py   |  21 ++
 .../tests/pt_expt/model/test_dipole_model.py  | 187 ++++++++++++++
 source/tests/pt_expt/model/test_dos_model.py  | 187 ++++++++++++++
 .../tests/pt_expt/model/test_dp_zbl_model.py  | 237 ++++++++++++++++++
 .../tests/pt_expt/model/test_polar_model.py   | 187 ++++++++++++++
 .../pt_expt/model/test_property_model.py      | 190 ++++++++++++++
 22 files changed, 1887 insertions(+), 13 deletions(-)
 create mode 100644 deepmd/pt_expt/model/dipole_model.py
 create mode 100644 deepmd/pt_expt/model/dos_model.py
 create mode 100644 deepmd/pt_expt/model/dp_zbl_model.py
 create mode 100644 deepmd/pt_expt/model/polar_model.py
 create mode 100644 deepmd/pt_expt/model/property_model.py
 create mode 100644 source/tests/pt_expt/model/test_dipole_model.py
 create mode 100644 source/tests/pt_expt/model/test_dos_model.py
 create mode 100644 source/tests/pt_expt/model/test_dp_zbl_model.py
 create mode 100644 source/tests/pt_expt/model/test_polar_model.py
 create mode 100644 source/tests/pt_expt/model/test_property_model.py

diff --git a/deepmd/dpmodel/atomic_model/linear_atomic_model.py b/deepmd/dpmodel/atomic_model/linear_atomic_model.py
index b73dcb77fb..ce54a40333 100644
--- a/deepmd/dpmodel/atomic_model/linear_atomic_model.py
+++ b/deepmd/dpmodel/atomic_model/linear_atomic_model.py
@@ -512,4 +512,4 @@ def _compute_weight(
         # to handle masked atoms
         coef = xp.where(sigma != 0, coef, xp.zeros_like(coef))
         self.zbl_weight = coef
-        return [1 - xp.expand_dims(coef, -1), xp.expand_dims(coef, -1)]
+        return [1 - xp.expand_dims(coef, axis=-1), xp.expand_dims(coef, axis=-1)]
diff --git a/deepmd/dpmodel/atomic_model/pairtab_atomic_model.py b/deepmd/dpmodel/atomic_model/pairtab_atomic_model.py
index 6212696ddc..ed063f4727 100644
--- a/deepmd/dpmodel/atomic_model/pairtab_atomic_model.py
+++ b/deepmd/dpmodel/atomic_model/pairtab_atomic_model.py
@@ -192,9 +192,11 @@ def deserialize(cls, data: dict) -> "PairTabAtomicModel":
         tab_model = super().deserialize(data)
 
         tab_model.tab = tab
-        tab_model.tab_info = tab_model.tab.tab_info
-        nspline, ntypes = tab_model.tab_info[-2:].astype(int)
-        tab_model.tab_data = tab_model.tab.tab_data.reshape(ntypes, ntypes, nspline, 4)
+        # Extract nspline/ntypes from the numpy source before setting on the
+        # model, because dpmodel_setattr may convert to torch tensor.
+        nspline, ntypes = tab.tab_info[-2:].astype(int)
+        tab_model.tab_info = tab.tab_info
+        tab_model.tab_data = tab.tab_data.reshape(ntypes, ntypes, nspline, 4)
         return tab_model
 
     def forward_atomic(
@@ -281,7 +283,7 @@ def _pair_tabulated_inter(
         hi = 1.0 / hh
 
         # jax jit does not support convert to a Python int, so we need to convert to xp.int64.
-        nspline = (self.tab_info[2] + 0.1).astype(xp.int64)
+        nspline = xp.astype(self.tab_info[2] + 0.1, xp.int64)
 
         uu = (rr - rmin) * hi  # this is broadcasted to (nframes,nloc,nnei)
 
@@ -338,7 +340,7 @@ def _get_pairwise_dist(coords: Array, nlist: Array) -> Array:
         neighbor_atoms = coords[batch_indices, nlist]
         loc_atoms = coords[:, : nlist.shape[1], :]
         pairwise_dr = loc_atoms[:, :, None, :] - neighbor_atoms
-        pairwise_rr = safe_for_sqrt(xp.sum(xp.power(pairwise_dr, 2), axis=-1))
+        pairwise_rr = safe_for_sqrt(xp.sum(pairwise_dr**2, axis=-1))
 
         return pairwise_rr
 
@@ -384,16 +386,18 @@ def _extract_spline_coefficient(
         expanded_idx = xp.broadcast_to(
             idx[..., xp.newaxis, xp.newaxis], (*idx.shape, 1, 4)
         )
-        clipped_indices = xp.clip(expanded_idx, 0, nspline - 1).astype(int)
+        clipped_indices = xp.astype(xp.clip(expanded_idx, 0, nspline - 1), xp.int64)
 
         # (nframes, nloc, nnei, 4)
         final_coef = xp.squeeze(
-            xp_take_along_axis(expanded_tab_data, clipped_indices, 3)
+            xp_take_along_axis(expanded_tab_data, clipped_indices, 3), axis=3
         )
 
         # when the spline idx is beyond the table, all spline coefficients are set to `0`, and the resulting ener corresponding to the idx is also `0`.
         final_coef = xp.where(
-            expanded_idx.squeeze() > nspline, xp.zeros_like(final_coef), final_coef
+            xp.squeeze(expanded_idx, axis=3) > nspline,
+            xp.zeros_like(final_coef),
+            final_coef,
         )
         return final_coef
 
diff --git a/deepmd/dpmodel/atomic_model/polar_atomic_model.py b/deepmd/dpmodel/atomic_model/polar_atomic_model.py
index 2180e48265..fd32f26e5e 100644
--- a/deepmd/dpmodel/atomic_model/polar_atomic_model.py
+++ b/deepmd/dpmodel/atomic_model/polar_atomic_model.py
@@ -51,7 +51,7 @@ def apply_out_stat(
             for kk in self.bias_keys:
                 ntypes = out_bias[kk].shape[0]
                 temp = xp.mean(
-                    xp.diagonal(out_bias[kk].reshape(ntypes, 3, 3), axis1=1, axis2=2),
+                    xp.diagonal(out_bias[kk].reshape(ntypes, 3, 3), 0, 1, 2),
                     axis=1,
                 )
                 modified_bias = temp[atype]
@@ -61,7 +61,7 @@ def apply_out_stat(
                     modified_bias[..., xp.newaxis] * (self.fitting.scale[atype])
                 )
 
-                eye = xp.eye(3, dtype=dtype)
+                eye = xp.eye(3, dtype=dtype, device=array_api_compat.device(atype))
                 eye = xp.tile(eye, (nframes, nloc, 1, 1))
                 # (nframes, nloc, 3, 3)
                 modified_bias = modified_bias[..., xp.newaxis] * eye
diff --git a/deepmd/dpmodel/model/make_model.py b/deepmd/dpmodel/model/make_model.py
index 71169dc64f..37da9cf056 100644
--- a/deepmd/dpmodel/model/make_model.py
+++ b/deepmd/dpmodel/model/make_model.py
@@ -555,7 +555,7 @@ def _format_nlist(
                 m_real_nei = nlist >= 0
                 ret = xp.where(m_real_nei, nlist, 0)
                 coord0 = extended_coord[:, :n_nloc, :]
-                index = ret.reshape(n_nf, n_nloc * n_nnei, 1).repeat(3, axis=2)
+                index = xp.tile(ret.reshape(n_nf, n_nloc * n_nnei, 1), (1, 1, 3))
                 coord1 = xp.take_along_axis(extended_coord, index, axis=1)
                 coord1 = coord1.reshape(n_nf, n_nloc, n_nnei, 3)
                 rr = xp.linalg.norm(coord0[:, :, None, :] - coord1, axis=-1)
diff --git a/deepmd/pt_expt/common.py b/deepmd/pt_expt/common.py
index d00e016f6c..d46da28ba8 100644
--- a/deepmd/pt_expt/common.py
+++ b/deepmd/pt_expt/common.py
@@ -297,6 +297,11 @@ def dpmodel_setattr(obj: torch.nn.Module, name: str, value: Any) -> tuple[bool,
         if name in obj._buffers:
             obj._buffers[name] = tensor
             return True, tensor
+        # If the attribute already exists as a regular attribute (e.g. set to
+        # None during __init__ and later reassigned as an ndarray in
+        # deserialize), remove it first so register_buffer doesn't conflict.
+        if hasattr(obj, name) and name not in obj._buffers:
+            delattr(obj, name)
         obj.register_buffer(name, tensor)
         return True, tensor
 
diff --git a/deepmd/pt_expt/model/__init__.py b/deepmd/pt_expt/model/__init__.py
index 5d1c5ffb5d..858bdef6f7 100644
--- a/deepmd/pt_expt/model/__init__.py
+++ b/deepmd/pt_expt/model/__init__.py
@@ -1,8 +1,28 @@
 # SPDX-License-Identifier: LGPL-3.0-or-later
+from .dipole_model import (
+    DipoleModel,
+)
+from .dos_model import (
+    DOSModel,
+)
+from .dp_zbl_model import (
+    DPZBLModel,
+)
 from .ener_model import (
     EnergyModel,
 )
+from .polar_model import (
+    PolarModel,
+)
+from .property_model import (
+    PropertyModel,
+)
 
 __all__ = [
+    "DOSModel",
+    "DPZBLModel",
+    "DipoleModel",
     "EnergyModel",
+    "PolarModel",
+    "PropertyModel",
 ]
diff --git a/deepmd/pt_expt/model/dipole_model.py b/deepmd/pt_expt/model/dipole_model.py
new file mode 100644
index 0000000000..5839120c72
--- /dev/null
+++ b/deepmd/pt_expt/model/dipole_model.py
@@ -0,0 +1,151 @@
+# SPDX-License-Identifier: LGPL-3.0-or-later
+from typing import (
+    Any,
+)
+
+import torch
+from torch.fx.experimental.proxy_tensor import (
+    make_fx,
+)
+
+from deepmd.dpmodel.atomic_model import (
+    DPDipoleAtomicModel,
+)
+from deepmd.dpmodel.model.dp_model import (
+    DPModelCommon,
+)
+
+from .make_model import (
+    make_model,
+)
+
+DPDipoleModel_ = make_model(DPDipoleAtomicModel)
+
+
+class DipoleModel(DPModelCommon, DPDipoleModel_):
+    model_type = "dipole"
+
+    def __init__(
+        self,
+        *args: Any,
+        **kwargs: Any,
+    ) -> None:
+        DPModelCommon.__init__(self)
+        DPDipoleModel_.__init__(self, *args, **kwargs)
+
+    def forward(
+        self,
+        coord: torch.Tensor,
+        atype: torch.Tensor,
+        box: torch.Tensor | None = None,
+        fparam: torch.Tensor | None = None,
+        aparam: torch.Tensor | None = None,
+        do_atomic_virial: bool = False,
+    ) -> dict[str, torch.Tensor]:
+        model_ret = self.call_common(
+            coord,
+            atype,
+            box,
+            fparam=fparam,
+            aparam=aparam,
+            do_atomic_virial=do_atomic_virial,
+        )
+        model_predict = {}
+        model_predict["dipole"] = model_ret["dipole"]
+        model_predict["global_dipole"] = model_ret["dipole_redu"]
+        if self.do_grad_r("dipole") and model_ret["dipole_derv_r"] is not None:
+            model_predict["force"] = model_ret["dipole_derv_r"]
+        if self.do_grad_c("dipole") and model_ret["dipole_derv_c_redu"] is not None:
+            model_predict["virial"] = model_ret["dipole_derv_c_redu"]
+            if do_atomic_virial and model_ret["dipole_derv_c"] is not None:
+                model_predict["atom_virial"] = model_ret["dipole_derv_c"]
+        if "mask" in model_ret:
+            model_predict["mask"] = model_ret["mask"]
+        return model_predict
+
+    def _forward_lower(
+        self,
+        extended_coord: torch.Tensor,
+        extended_atype: torch.Tensor,
+        nlist: torch.Tensor,
+        mapping: torch.Tensor | None = None,
+        fparam: torch.Tensor | None = None,
+        aparam: torch.Tensor | None = None,
+        do_atomic_virial: bool = False,
+    ) -> dict[str, torch.Tensor]:
+        model_ret = self.call_common_lower(
+            extended_coord,
+            extended_atype,
+            nlist,
+            mapping,
+            fparam=fparam,
+            aparam=aparam,
+            do_atomic_virial=do_atomic_virial,
+        )
+        model_predict = {}
+        model_predict["dipole"] = model_ret["dipole"]
+        model_predict["global_dipole"] = model_ret["dipole_redu"]
+        if self.do_grad_r("dipole") and model_ret.get("dipole_derv_r") is not None:
+            model_predict["extended_force"] = model_ret["dipole_derv_r"]
+        if self.do_grad_c("dipole") and model_ret.get("dipole_derv_c_redu") is not None:
+            model_predict["virial"] = model_ret["dipole_derv_c_redu"]
+            if do_atomic_virial and model_ret.get("dipole_derv_c") is not None:
+                model_predict["extended_virial"] = model_ret["dipole_derv_c"]
+        if "mask" in model_ret:
+            model_predict["mask"] = model_ret["mask"]
+        return model_predict
+
+    def forward_lower(
+        self,
+        extended_coord: torch.Tensor,
+        extended_atype: torch.Tensor,
+        nlist: torch.Tensor,
+        mapping: torch.Tensor | None = None,
+        fparam: torch.Tensor | None = None,
+        aparam: torch.Tensor | None = None,
+        do_atomic_virial: bool = False,
+    ) -> dict[str, torch.Tensor]:
+        return self._forward_lower(
+            extended_coord,
+            extended_atype,
+            nlist,
+            mapping,
+            fparam=fparam,
+            aparam=aparam,
+            do_atomic_virial=do_atomic_virial,
+        )
+
+    def forward_lower_exportable(
+        self,
+        extended_coord: torch.Tensor,
+        extended_atype: torch.Tensor,
+        nlist: torch.Tensor,
+        mapping: torch.Tensor | None = None,
+        fparam: torch.Tensor | None = None,
+        aparam: torch.Tensor | None = None,
+        do_atomic_virial: bool = False,
+    ) -> torch.nn.Module:
+        model = self
+
+        def fn(
+            extended_coord: torch.Tensor,
+            extended_atype: torch.Tensor,
+            nlist: torch.Tensor,
+            mapping: torch.Tensor | None,
+            fparam: torch.Tensor | None,
+            aparam: torch.Tensor | None,
+        ) -> dict[str, torch.Tensor]:
+            extended_coord = extended_coord.detach().requires_grad_(True)
+            return model._forward_lower(
+                extended_coord,
+                extended_atype,
+                nlist,
+                mapping,
+                fparam=fparam,
+                aparam=aparam,
+                do_atomic_virial=do_atomic_virial,
+            )
+
+        return make_fx(fn)(
+            extended_coord, extended_atype, nlist, mapping, fparam, aparam
+        )
diff --git a/deepmd/pt_expt/model/dos_model.py b/deepmd/pt_expt/model/dos_model.py
new file mode 100644
index 0000000000..ac4b76f51d
--- /dev/null
+++ b/deepmd/pt_expt/model/dos_model.py
@@ -0,0 +1,139 @@
+# SPDX-License-Identifier: LGPL-3.0-or-later
+from typing import (
+    Any,
+)
+
+import torch
+from torch.fx.experimental.proxy_tensor import (
+    make_fx,
+)
+
+from deepmd.dpmodel.atomic_model import (
+    DPDOSAtomicModel,
+)
+from deepmd.dpmodel.model.dp_model import (
+    DPModelCommon,
+)
+
+from .make_model import (
+    make_model,
+)
+
+DPDOSModel_ = make_model(DPDOSAtomicModel)
+
+
+class DOSModel(DPModelCommon, DPDOSModel_):
+    model_type = "dos"
+
+    def __init__(
+        self,
+        *args: Any,
+        **kwargs: Any,
+    ) -> None:
+        DPModelCommon.__init__(self)
+        DPDOSModel_.__init__(self, *args, **kwargs)
+
+    def forward(
+        self,
+        coord: torch.Tensor,
+        atype: torch.Tensor,
+        box: torch.Tensor | None = None,
+        fparam: torch.Tensor | None = None,
+        aparam: torch.Tensor | None = None,
+        do_atomic_virial: bool = False,
+    ) -> dict[str, torch.Tensor]:
+        model_ret = self.call_common(
+            coord,
+            atype,
+            box,
+            fparam=fparam,
+            aparam=aparam,
+            do_atomic_virial=do_atomic_virial,
+        )
+        model_predict = {}
+        model_predict["atom_dos"] = model_ret["dos"]
+        model_predict["dos"] = model_ret["dos_redu"]
+        if "mask" in model_ret:
+            model_predict["mask"] = model_ret["mask"]
+        return model_predict
+
+    def _forward_lower(
+        self,
+        extended_coord: torch.Tensor,
+        extended_atype: torch.Tensor,
+        nlist: torch.Tensor,
+        mapping: torch.Tensor | None = None,
+        fparam: torch.Tensor | None = None,
+        aparam: torch.Tensor | None = None,
+        do_atomic_virial: bool = False,
+    ) -> dict[str, torch.Tensor]:
+        model_ret = self.call_common_lower(
+            extended_coord,
+            extended_atype,
+            nlist,
+            mapping,
+            fparam=fparam,
+            aparam=aparam,
+            do_atomic_virial=do_atomic_virial,
+        )
+        model_predict = {}
+        model_predict["atom_dos"] = model_ret["dos"]
+        model_predict["dos"] = model_ret["dos_redu"]
+        if "mask" in model_ret:
+            model_predict["mask"] = model_ret["mask"]
+        return model_predict
+
+    def forward_lower(
+        self,
+        extended_coord: torch.Tensor,
+        extended_atype: torch.Tensor,
+        nlist: torch.Tensor,
+        mapping: torch.Tensor | None = None,
+        fparam: torch.Tensor | None = None,
+        aparam: torch.Tensor | None = None,
+        do_atomic_virial: bool = False,
+    ) -> dict[str, torch.Tensor]:
+        return self._forward_lower(
+            extended_coord,
+            extended_atype,
+            nlist,
+            mapping,
+            fparam=fparam,
+            aparam=aparam,
+            do_atomic_virial=do_atomic_virial,
+        )
+
+    def forward_lower_exportable(
+        self,
+        extended_coord: torch.Tensor,
+        extended_atype: torch.Tensor,
+        nlist: torch.Tensor,
+        mapping: torch.Tensor | None = None,
+        fparam: torch.Tensor | None = None,
+        aparam: torch.Tensor | None = None,
+        do_atomic_virial: bool = False,
+    ) -> torch.nn.Module:
+        model = self
+
+        def fn(
+            extended_coord: torch.Tensor,
+            extended_atype: torch.Tensor,
+            nlist: torch.Tensor,
+            mapping: torch.Tensor | None,
+            fparam: torch.Tensor | None,
+            aparam: torch.Tensor | None,
+        ) -> dict[str, torch.Tensor]:
+            extended_coord = extended_coord.detach().requires_grad_(True)
+            return model._forward_lower(
+                extended_coord,
+                extended_atype,
+                nlist,
+                mapping,
+                fparam=fparam,
+                aparam=aparam,
+                do_atomic_virial=do_atomic_virial,
+            )
+
+        return make_fx(fn)(
+            extended_coord, extended_atype, nlist, mapping, fparam, aparam
+        )
diff --git a/deepmd/pt_expt/model/dp_zbl_model.py b/deepmd/pt_expt/model/dp_zbl_model.py
new file mode 100644
index 0000000000..857498aab9
--- /dev/null
+++ b/deepmd/pt_expt/model/dp_zbl_model.py
@@ -0,0 +1,153 @@
+# SPDX-License-Identifier: LGPL-3.0-or-later
+from typing import (
+    Any,
+)
+
+import torch
+from torch.fx.experimental.proxy_tensor import (
+    make_fx,
+)
+
+from deepmd.dpmodel.atomic_model.linear_atomic_model import (
+    DPZBLLinearEnergyAtomicModel,
+)
+from deepmd.dpmodel.model.dp_model import (
+    DPModelCommon,
+)
+
+from .make_model import (
+    make_model,
+)
+
+DPZBLModel_ = make_model(DPZBLLinearEnergyAtomicModel)
+
+
+class DPZBLModel(DPModelCommon, DPZBLModel_):
+    model_type = "zbl"
+
+    def __init__(
+        self,
+        *args: Any,
+        **kwargs: Any,
+    ) -> None:
+        DPModelCommon.__init__(self)
+        DPZBLModel_.__init__(self, *args, **kwargs)
+
+    def forward(
+        self,
+        coord: torch.Tensor,
+        atype: torch.Tensor,
+        box: torch.Tensor | None = None,
+        fparam: torch.Tensor | None = None,
+        aparam: torch.Tensor | None = None,
+        do_atomic_virial: bool = False,
+    ) -> dict[str, torch.Tensor]:
+        model_ret = self.call_common(
+            coord,
+            atype,
+            box,
+            fparam=fparam,
+            aparam=aparam,
+            do_atomic_virial=do_atomic_virial,
+        )
+        model_predict = {}
+        model_predict["atom_energy"] = model_ret["energy"]
+        model_predict["energy"] = model_ret["energy_redu"]
+        if self.do_grad_r("energy") and model_ret["energy_derv_r"] is not None:
+            model_predict["force"] = model_ret["energy_derv_r"].squeeze(-2)
+        if self.do_grad_c("energy") and model_ret["energy_derv_c_redu"] is not None:
+            model_predict["virial"] = model_ret["energy_derv_c_redu"].squeeze(-2)
+            if do_atomic_virial and model_ret["energy_derv_c"] is not None:
+                model_predict["atom_virial"] = model_ret["energy_derv_c"].squeeze(-2)
+        if "mask" in model_ret:
+            model_predict["mask"] = model_ret["mask"]
+        return model_predict
+
+    def _forward_lower(
+        self,
+        extended_coord: torch.Tensor,
+        extended_atype: torch.Tensor,
+        nlist: torch.Tensor,
+        mapping: torch.Tensor | None = None,
+        fparam: torch.Tensor | None = None,
+        aparam: torch.Tensor | None = None,
+        do_atomic_virial: bool = False,
+    ) -> dict[str, torch.Tensor]:
+        model_ret = self.call_common_lower(
+            extended_coord,
+            extended_atype,
+            nlist,
+            mapping,
+            fparam=fparam,
+            aparam=aparam,
+            do_atomic_virial=do_atomic_virial,
+        )
+        model_predict = {}
+        model_predict["atom_energy"] = model_ret["energy"]
+        model_predict["energy"] = model_ret["energy_redu"]
+        if self.do_grad_r("energy") and model_ret.get("energy_derv_r") is not None:
+            model_predict["extended_force"] = model_ret["energy_derv_r"].squeeze(-2)
+        if self.do_grad_c("energy") and model_ret.get("energy_derv_c_redu") is not None:
+            model_predict["virial"] = model_ret["energy_derv_c_redu"].squeeze(-2)
+            if do_atomic_virial and model_ret.get("energy_derv_c") is not None:
+                model_predict["extended_virial"] = model_ret["energy_derv_c"].squeeze(
+                    -2
+                )
+        if "mask" in model_ret:
+            model_predict["mask"] = model_ret["mask"]
+        return model_predict
+
+    def forward_lower(
+        self,
+        extended_coord: torch.Tensor,
+        extended_atype: torch.Tensor,
+        nlist: torch.Tensor,
+        mapping: torch.Tensor | None = None,
+        fparam: torch.Tensor | None = None,
+        aparam: torch.Tensor | None = None,
+        do_atomic_virial: bool = False,
+    ) -> dict[str, torch.Tensor]:
+        return self._forward_lower(
+            extended_coord,
+            extended_atype,
+            nlist,
+            mapping,
+            fparam=fparam,
+            aparam=aparam,
+            do_atomic_virial=do_atomic_virial,
+        )
+
+    def forward_lower_exportable(
+        self,
+        extended_coord: torch.Tensor,
+        extended_atype: torch.Tensor,
+        nlist: torch.Tensor,
+        mapping: torch.Tensor | None = None,
+        fparam: torch.Tensor | None = None,
+        aparam: torch.Tensor | None = None,
+        do_atomic_virial: bool = False,
+    ) -> torch.nn.Module:
+        model = self
+
+        def fn(
+            extended_coord: torch.Tensor,
+            extended_atype: torch.Tensor,
+            nlist: torch.Tensor,
+            mapping: torch.Tensor | None,
+            fparam: torch.Tensor | None,
+            aparam: torch.Tensor | None,
+        ) -> dict[str, torch.Tensor]:
+            extended_coord = extended_coord.detach().requires_grad_(True)
+            return model._forward_lower(
+                extended_coord,
+                extended_atype,
+                nlist,
+                mapping,
+                fparam=fparam,
+                aparam=aparam,
+                do_atomic_virial=do_atomic_virial,
+            )
+
+        return make_fx(fn)(
+            extended_coord, extended_atype, nlist, mapping, fparam, aparam
+        )
diff --git a/deepmd/pt_expt/model/polar_model.py b/deepmd/pt_expt/model/polar_model.py
new file mode 100644
index 0000000000..8644940458
--- /dev/null
+++ b/deepmd/pt_expt/model/polar_model.py
@@ -0,0 +1,139 @@
+# SPDX-License-Identifier: LGPL-3.0-or-later
+from typing import (
+    Any,
+)
+
+import torch
+from torch.fx.experimental.proxy_tensor import (
+    make_fx,
+)
+
+from deepmd.dpmodel.atomic_model import (
+    DPPolarAtomicModel,
+)
+from deepmd.dpmodel.model.dp_model import (
+    DPModelCommon,
+)
+
+from .make_model import (
+    make_model,
+)
+
+DPPolarModel_ = make_model(DPPolarAtomicModel)
+
+
+class PolarModel(DPModelCommon, DPPolarModel_):
+    model_type = "polar"
+
+    def __init__(
+        self,
+        *args: Any,
+        **kwargs: Any,
+    ) -> None:
+        DPModelCommon.__init__(self)
+        DPPolarModel_.__init__(self, *args, **kwargs)
+
+    def forward(
+        self,
+        coord: torch.Tensor,
+        atype: torch.Tensor,
+        box: torch.Tensor | None = None,
+        fparam: torch.Tensor | None = None,
+        aparam: torch.Tensor | None = None,
+        do_atomic_virial: bool = False,
+    ) -> dict[str, torch.Tensor]:
+        model_ret = self.call_common(
+            coord,
+            atype,
+            box,
+            fparam=fparam,
+            aparam=aparam,
+            do_atomic_virial=do_atomic_virial,
+        )
+        model_predict = {}
+        model_predict["polar"] = model_ret["polarizability"]
+        model_predict["global_polar"] = model_ret["polarizability_redu"]
+        if "mask" in model_ret:
+            model_predict["mask"] = model_ret["mask"]
+        return model_predict
+
+    def _forward_lower(
+        self,
+        extended_coord: torch.Tensor,
+        extended_atype: torch.Tensor,
+        nlist: torch.Tensor,
+        mapping: torch.Tensor | None = None,
+        fparam: torch.Tensor | None = None,
+        aparam: torch.Tensor | None = None,
+        do_atomic_virial: bool = False,
+    ) -> dict[str, torch.Tensor]:
+        model_ret = self.call_common_lower(
+            extended_coord,
+            extended_atype,
+            nlist,
+            mapping,
+            fparam=fparam,
+            aparam=aparam,
+            do_atomic_virial=do_atomic_virial,
+        )
+        model_predict = {}
+        model_predict["polar"] = model_ret["polarizability"]
+        model_predict["global_polar"] = model_ret["polarizability_redu"]
+        if "mask" in model_ret:
+            model_predict["mask"] = model_ret["mask"]
+        return model_predict
+
+    def forward_lower(
+        self,
+        extended_coord: torch.Tensor,
+        extended_atype: torch.Tensor,
+        nlist: torch.Tensor,
+        mapping: torch.Tensor | None = None,
+        fparam: torch.Tensor | None = None,
+        aparam: torch.Tensor | None = None,
+        do_atomic_virial: bool = False,
+    ) -> dict[str, torch.Tensor]:
+        return self._forward_lower(
+            extended_coord,
+            extended_atype,
+            nlist,
+            mapping,
+            fparam=fparam,
+            aparam=aparam,
+            do_atomic_virial=do_atomic_virial,
+        )
+
+    def forward_lower_exportable(
+        self,
+        extended_coord: torch.Tensor,
+        extended_atype: torch.Tensor,
+        nlist: torch.Tensor,
+        mapping: torch.Tensor | None = None,
+        fparam: torch.Tensor | None = None,
+        aparam: torch.Tensor | None = None,
+        do_atomic_virial: bool = False,
+    ) -> torch.nn.Module:
+        model = self
+
+        def fn(
+            extended_coord: torch.Tensor,
+            extended_atype: torch.Tensor,
+            nlist: torch.Tensor,
+            mapping: torch.Tensor | None,
+            fparam: torch.Tensor | None,
+            aparam: torch.Tensor | None,
+        ) -> dict[str, torch.Tensor]:
+            extended_coord = extended_coord.detach().requires_grad_(True)
+            return model._forward_lower(
+                extended_coord,
+                extended_atype,
+                nlist,
+                mapping,
+                fparam=fparam,
+                aparam=aparam,
+                do_atomic_virial=do_atomic_virial,
+            )
+
+        return make_fx(fn)(
+            extended_coord, extended_atype, nlist, mapping, fparam, aparam
+        )
diff --git a/deepmd/pt_expt/model/property_model.py b/deepmd/pt_expt/model/property_model.py
new file mode 100644
index 0000000000..1f78de4fdc
--- /dev/null
+++ b/deepmd/pt_expt/model/property_model.py
@@ -0,0 +1,145 @@
+# SPDX-License-Identifier: LGPL-3.0-or-later
+from typing import (
+    Any,
+)
+
+import torch
+from torch.fx.experimental.proxy_tensor import (
+    make_fx,
+)
+
+from deepmd.dpmodel.atomic_model import (
+    DPPropertyAtomicModel,
+)
+from deepmd.dpmodel.model.dp_model import (
+    DPModelCommon,
+)
+
+from .make_model import (
+    make_model,
+)
+
+DPPropertyModel_ = make_model(DPPropertyAtomicModel)
+
+
+class PropertyModel(DPModelCommon, DPPropertyModel_):
+    model_type = "property"
+
+    def __init__(
+        self,
+        *args: Any,
+        **kwargs: Any,
+    ) -> None:
+        DPModelCommon.__init__(self)
+        DPPropertyModel_.__init__(self, *args, **kwargs)
+
+    def get_var_name(self) -> str:
+        """Get the name of the property."""
+        return self.get_fitting_net().var_name
+
+    def forward(
+        self,
+        coord: torch.Tensor,
+        atype: torch.Tensor,
+        box: torch.Tensor | None = None,
+        fparam: torch.Tensor | None = None,
+        aparam: torch.Tensor | None = None,
+        do_atomic_virial: bool = False,
+    ) -> dict[str, torch.Tensor]:
+        model_ret = self.call_common(
+            coord,
+            atype,
+            box,
+            fparam=fparam,
+            aparam=aparam,
+            do_atomic_virial=do_atomic_virial,
+        )
+        var_name = self.get_var_name()
+        model_predict = {}
+        model_predict[f"atom_{var_name}"] = model_ret[var_name]
+        model_predict[var_name] = model_ret[f"{var_name}_redu"]
+        if "mask" in model_ret:
+            model_predict["mask"] = model_ret["mask"]
+        return model_predict
+
+    def _forward_lower(
+        self,
+        extended_coord: torch.Tensor,
+        extended_atype: torch.Tensor,
+        nlist: torch.Tensor,
+        mapping: torch.Tensor | None = None,
+        fparam: torch.Tensor | None = None,
+        aparam: torch.Tensor | None = None,
+        do_atomic_virial: bool = False,
+    ) -> dict[str, torch.Tensor]:
+        model_ret = self.call_common_lower(
+            extended_coord,
+            extended_atype,
+            nlist,
+            mapping,
+            fparam=fparam,
+            aparam=aparam,
+            do_atomic_virial=do_atomic_virial,
+        )
+        var_name = self.get_var_name()
+        model_predict = {}
+        model_predict[f"atom_{var_name}"] = model_ret[var_name]
+        model_predict[var_name] = model_ret[f"{var_name}_redu"]
+        if "mask" in model_ret:
+            model_predict["mask"] = model_ret["mask"]
+        return model_predict
+
+    def forward_lower(
+        self,
+        extended_coord: torch.Tensor,
+        extended_atype: torch.Tensor,
+        nlist: torch.Tensor,
+        mapping: torch.Tensor | None = None,
+        fparam: torch.Tensor | None = None,
+        aparam: torch.Tensor | None = None,
+        do_atomic_virial: bool = False,
+    ) -> dict[str, torch.Tensor]:
+        return self._forward_lower(
+            extended_coord,
+            extended_atype,
+            nlist,
+            mapping,
+            fparam=fparam,
+            aparam=aparam,
+            do_atomic_virial=do_atomic_virial,
+        )
+
+    def forward_lower_exportable(
+        self,
+        extended_coord: torch.Tensor,
+        extended_atype: torch.Tensor,
+        nlist: torch.Tensor,
+        mapping: torch.Tensor | None = None,
+        fparam: torch.Tensor | None = None,
+        aparam: torch.Tensor | None = None,
+        do_atomic_virial: bool = False,
+    ) -> torch.nn.Module:
+        model = self
+
+        def fn(
+            extended_coord: torch.Tensor,
+            extended_atype: torch.Tensor,
+            nlist: torch.Tensor,
+            mapping: torch.Tensor | None,
+            fparam: torch.Tensor | None,
+            aparam: torch.Tensor | None,
+        ) -> dict[str, torch.Tensor]:
+            extended_coord = extended_coord.detach().requires_grad_(True)
+            return model._forward_lower(
+                extended_coord,
+                extended_atype,
+                nlist,
+                mapping,
+                fparam=fparam,
+                aparam=aparam,
+                do_atomic_virial=do_atomic_virial,
+            )
+
+        return make_fx(fn)(
+            extended_coord, extended_atype, nlist, mapping, fparam, aparam
+        )
diff --git a/source/tests/consistent/model/test_dipole.py b/source/tests/consistent/model/test_dipole.py
index bcd199a633..e8de96a02d 100644
--- a/source/tests/consistent/model/test_dipole.py
+++ b/source/tests/consistent/model/test_dipole.py
@@ -15,6 +15,7 @@
 from ..common import (
     INSTALLED_JAX,
     INSTALLED_PT,
+    INSTALLED_PT_EXPT,
     INSTALLED_TF,
     CommonTest,
 )
@@ -36,6 +37,10 @@
     from deepmd.jax.model.model import get_model as get_model_jax
 else:
     DipoleModelJAX = None
+if INSTALLED_PT_EXPT:
+    from deepmd.pt_expt.model import DipoleModel as DipoleModelPTExpt
+else:
+    DipoleModelPTExpt = None
 from deepmd.utils.argcheck import (
     model_args,
 )
@@ -71,6 +76,7 @@ def data(self) -> dict:
     tf_class = DipoleModelTF
     dp_class = DipoleModelDP
     pt_class = DipoleModelPT
+    pt_expt_class = DipoleModelPTExpt
     jax_class = DipoleModelJAX
     args = model_args()
     atol = 1e-8
@@ -84,6 +90,8 @@ def get_reference_backend(self):
             return self.RefBackend.PT
         if not self.skip_tf:
             return self.RefBackend.TF
+        if not self.skip_pt_expt and self.pt_expt_class is not None:
+            return self.RefBackend.PT_EXPT
         if not self.skip_dp:
             return self.RefBackend.DP
         raise ValueError("No available reference")
@@ -105,6 +113,9 @@ def pass_data_to_cls(self, cls, data) -> Any:
             model = get_model_pt(data)
             model.atomic_model.out_bias.uniform_()
             return model
+        elif cls is DipoleModelPTExpt:
+            dp_model = get_model_dp(data)
+            return DipoleModelPTExpt.deserialize(dp_model.serialize())
         elif cls is DipoleModelJAX:
             return get_model_jax(data)
         return cls(**data, **self.additional_data)
@@ -177,6 +188,15 @@ def eval_pt(self, pt_obj: Any) -> Any:
             self.box,
         )
 
+    def eval_pt_expt(self, pt_expt_obj: Any) -> Any:
+        return self.eval_pt_expt_model(
+            pt_expt_obj,
+            self.natoms,
+            self.coords,
+            self.atype,
+            self.box,
+        )
+
     def eval_jax(self, jax_obj: Any) -> Any:
         return self.eval_jax_model(
             jax_obj,
@@ -196,6 +216,7 @@ def extract_ret(self, ret: Any, backend) -> tuple[np.ndarray, ...]:
         elif backend in {
             self.RefBackend.DP,
             self.RefBackend.PT,
+            self.RefBackend.PT_EXPT,
             self.RefBackend.JAX,
         }:
             return (
diff --git a/source/tests/consistent/model/test_dos.py b/source/tests/consistent/model/test_dos.py
index f967973913..12472babb5 100644
--- a/source/tests/consistent/model/test_dos.py
+++ b/source/tests/consistent/model/test_dos.py
@@ -15,6 +15,7 @@
 from ..common import (
     INSTALLED_JAX,
     INSTALLED_PT,
+    INSTALLED_PT_EXPT,
     INSTALLED_TF,
     CommonTest,
 )
@@ -36,6 +37,10 @@
     from deepmd.jax.model.model import get_model as get_model_jax
 else:
     DOSModelJAX = None
+if INSTALLED_PT_EXPT:
+    from deepmd.pt_expt.model import DOSModel as DOSModelPTExpt
+else:
+    DOSModelPTExpt = None
 from deepmd.utils.argcheck import (
     model_args,
 )
@@ -72,6 +77,7 @@ def data(self) -> dict:
     tf_class = DOSModelTF
     dp_class = DOSModelDP
     pt_class = DOSModelPT
+    pt_expt_class = DOSModelPTExpt
     jax_class = DOSModelJAX
     args = model_args()
 
@@ -84,6 +90,8 @@ def get_reference_backend(self):
             return self.RefBackend.PT
         if not self.skip_tf:
             return self.RefBackend.TF
+        if not self.skip_pt_expt and self.pt_expt_class is not None:
+            return self.RefBackend.PT_EXPT
         if not self.skip_dp:
             return self.RefBackend.DP
         raise ValueError("No available reference")
@@ -105,6 +113,9 @@ def pass_data_to_cls(self, cls, data) -> Any:
             model = get_model_pt(data)
             model.atomic_model.out_bias.uniform_()
             return model
+        elif cls is DOSModelPTExpt:
+            dp_model = get_model_dp(data)
+            return DOSModelPTExpt.deserialize(dp_model.serialize())
         elif cls is DOSModelJAX:
             return get_model_jax(data)
         return cls(**data, **self.additional_data)
@@ -171,6 +182,15 @@ def eval_pt(self, pt_obj: Any) -> Any:
             self.box,
         )
 
+    def eval_pt_expt(self, pt_expt_obj: Any) -> Any:
+        return self.eval_pt_expt_model(
+            pt_expt_obj,
+            self.natoms,
+            self.coords,
+            self.atype,
+            self.box,
+        )
+
     def eval_jax(self, jax_obj: Any) -> Any:
         return self.eval_jax_model(
             jax_obj,
@@ -190,6 +210,7 @@ def extract_ret(self, ret: Any, backend) -> tuple[np.ndarray, ...]:
         elif backend in {
             self.RefBackend.DP,
             self.RefBackend.PT,
+            self.RefBackend.PT_EXPT,
             self.RefBackend.JAX,
         }:
             return (
diff --git a/source/tests/consistent/model/test_dpa1.py b/source/tests/consistent/model/test_dpa1.py
index bacca12413..1662da1ccd 100644
--- a/source/tests/consistent/model/test_dpa1.py
+++ b/source/tests/consistent/model/test_dpa1.py
@@ -16,6 +16,7 @@
     INSTALLED_JAX,
     INSTALLED_PD,
     INSTALLED_PT,
+    INSTALLED_PT_EXPT,
     INSTALLED_TF,
     SKIP_FLAG,
     CommonTest,
@@ -43,6 +44,10 @@
     from deepmd.pd.model.model.ener_model import EnergyModel as EnergyModelPD
 else:
     EnergyModelPD = None
+if INSTALLED_PT_EXPT:
+    from deepmd.pt_expt.model import EnergyModel as EnergyModelPTExpt
+else:
+    EnergyModelPTExpt = None
 if INSTALLED_JAX:
     from deepmd.jax.model.ener_model import EnergyModel as EnergyModelJAX
     from deepmd.jax.model.model import get_model as get_model_jax
@@ -97,6 +102,7 @@ def data(self) -> dict:
     dp_class = EnergyModelDP
     pt_class = EnergyModelPT
     pd_class = EnergyModelPD
+    pt_expt_class = EnergyModelPTExpt
     jax_class = EnergyModelJAX
     args = model_args()
 
@@ -109,6 +115,8 @@ def get_reference_backend(self):
             return self.RefBackend.PT
         if not self.skip_tf:
             return self.RefBackend.TF
+        if not self.skip_pt_expt and self.pt_expt_class is not None:
+            return self.RefBackend.PT_EXPT
         if not self.skip_pd:
             return self.RefBackend.PD
         if not self.skip_jax:
@@ -128,6 +136,9 @@ def pass_data_to_cls(self, cls, data) -> Any:
             return get_model_dp(data)
         elif cls is EnergyModelPT:
             return get_model_pt(data)
+        elif cls is EnergyModelPTExpt:
+            dp_model = get_model_dp(data)
+            return EnergyModelPTExpt.deserialize(dp_model.serialize())
         elif cls is EnergyModelPD:
             return get_model_pd(data)
         elif cls is EnergyModelJAX:
@@ -201,6 +212,15 @@ def eval_pt(self, pt_obj: Any) -> Any:
             self.box,
         )
 
+    def eval_pt_expt(self, pt_expt_obj: Any) -> Any:
+        return self.eval_pt_expt_model(
+            pt_expt_obj,
+            self.natoms,
+            self.coords,
+            self.atype,
+            self.box,
+        )
+
     def eval_pd(self, pd_obj: Any) -> Any:
         return self.eval_pd_model(
             pd_obj,
@@ -239,6 +259,7 @@ def extract_ret(self, ret: Any, backend) -> tuple[np.ndarray, ...]:
             )
         elif backend in {
             self.RefBackend.PT,
+            self.RefBackend.PT_EXPT,
             self.RefBackend.PD,
             self.RefBackend.JAX,
         }:
diff --git a/source/tests/consistent/model/test_polar.py b/source/tests/consistent/model/test_polar.py
index 0b9b94a599..1389cb33d7 100644
--- a/source/tests/consistent/model/test_polar.py
+++ b/source/tests/consistent/model/test_polar.py
@@ -15,6 +15,7 @@
 from ..common import (
     INSTALLED_JAX,
     INSTALLED_PT,
+    INSTALLED_PT_EXPT,
     INSTALLED_TF,
     CommonTest,
 )
@@ -36,6 +37,10 @@
     from deepmd.jax.model.polar_model import PolarModel as PolarModelJAX
 else:
     PolarModelJAX = None
+if INSTALLED_PT_EXPT:
+    from deepmd.pt_expt.model import PolarModel as PolarModelPTExpt
+else:
+    PolarModelPTExpt = None
 from deepmd.utils.argcheck import (
     model_args,
 )
@@ -71,6 +76,7 @@ def data(self) -> dict:
     tf_class = PolarModelTF
     dp_class = PolarModelDP
     pt_class = PolarModelPT
+    pt_expt_class = PolarModelPTExpt
     jax_class = PolarModelJAX
     args = model_args()
     atol = 1e-8
@@ -84,6 +90,8 @@ def get_reference_backend(self):
             return self.RefBackend.PT
         if not self.skip_tf:
             return self.RefBackend.TF
+        if not self.skip_pt_expt and self.pt_expt_class is not None:
+            return self.RefBackend.PT_EXPT
         if not self.skip_dp:
             return self.RefBackend.DP
         raise ValueError("No available reference")
@@ -105,6 +113,9 @@ def pass_data_to_cls(self, cls, data) -> Any:
             model = get_model_pt(data)
             model.atomic_model.out_bias.uniform_()
             return model
+        elif cls is PolarModelPTExpt:
+            dp_model = get_model_dp(data)
+            return PolarModelPTExpt.deserialize(dp_model.serialize())
         elif cls is PolarModelJAX:
             return get_model_jax(data)
         return cls(**data, **self.additional_data)
@@ -171,6 +182,15 @@ def eval_pt(self, pt_obj: Any) -> Any:
             self.box,
         )
 
+    def eval_pt_expt(self, pt_expt_obj: Any) -> Any:
+        return self.eval_pt_expt_model(
+            pt_expt_obj,
+            self.natoms,
+            self.coords,
+            self.atype,
+            self.box,
+        )
+
     def eval_jax(self, jax_obj: Any) -> Any:
         return self.eval_jax_model(
             jax_obj,
@@ -190,6 +210,7 @@ def extract_ret(self, ret: Any, backend) -> tuple[np.ndarray, ...]:
         elif backend in {
             self.RefBackend.DP,
             self.RefBackend.PT,
+            self.RefBackend.PT_EXPT,
             self.RefBackend.JAX,
         }:
             return (
diff --git a/source/tests/consistent/model/test_property.py b/source/tests/consistent/model/test_property.py
index 33e63af98e..ca2507a980 100644
--- a/source/tests/consistent/model/test_property.py
+++ b/source/tests/consistent/model/test_property.py
@@ -15,6 +15,7 @@
 from ..common import (
     INSTALLED_JAX,
     INSTALLED_PT,
+    INSTALLED_PT_EXPT,
     CommonTest,
 )
 from .common import (
@@ -31,6 +32,10 @@
     from deepmd.jax.model.property_model import PropertyModel as PropertyModelJAX
 else:
     PropertyModelJAX = None
+if INSTALLED_PT_EXPT:
+    from deepmd.pt_expt.model import PropertyModel as PropertyModelPTExpt
+else:
+    PropertyModelPTExpt = None
 from deepmd.utils.argcheck import (
     model_args,
 )
@@ -67,6 +72,7 @@ def data(self) -> dict:
     tf_class = None
     dp_class = PropertyModelDP
     pt_class = PropertyModelPT
+    pt_expt_class = PropertyModelPTExpt
     jax_class = PropertyModelJAX
     args = model_args()
 
@@ -79,6 +85,8 @@ def get_reference_backend(self):
             return self.RefBackend.PT
         if not self.skip_tf:
             return self.RefBackend.TF
+        if not self.skip_pt_expt and self.pt_expt_class is not None:
+            return self.RefBackend.PT_EXPT
         if not self.skip_dp:
             return self.RefBackend.DP
         raise ValueError("No available reference")
@@ -100,6 +108,9 @@ def pass_data_to_cls(self, cls, data) -> Any:
             model = get_model_pt(data)
             model.atomic_model.out_bias.uniform_()
             return model
+        elif cls is PropertyModelPTExpt:
+            dp_model = get_model_dp(data)
+            return PropertyModelPTExpt.deserialize(dp_model.serialize())
         elif cls is PropertyModelJAX:
             return get_model_jax(data)
         return cls(**data, **self.additional_data)
@@ -172,6 +183,15 @@ def eval_pt(self, pt_obj: Any) -> Any:
             self.box,
         )
 
+    def eval_pt_expt(self, pt_expt_obj: Any) -> Any:
+        return self.eval_pt_expt_model(
+            pt_expt_obj,
+            self.natoms,
+            self.coords,
+            self.atype,
+            self.box,
+        )
+
     def eval_jax(self, jax_obj: Any) -> Any:
         return self.eval_jax_model(
             jax_obj,
@@ -184,7 +204,12 @@ def eval_jax(self, jax_obj: Any) -> Any:
     def extract_ret(self, ret: Any, backend) -> tuple[np.ndarray, ...]:
         # shape not matched. ravel...
         property_name = self.data["fitting_net"]["property_name"]
-        if backend in {self.RefBackend.DP, self.RefBackend.PT, self.RefBackend.JAX}:
+        if backend in {
+            self.RefBackend.DP,
+            self.RefBackend.PT,
+            self.RefBackend.PT_EXPT,
+            self.RefBackend.JAX,
+        }:
             return (
                 ret[property_name].ravel(),
                 ret[f"atom_{property_name}"].ravel(),
diff --git a/source/tests/consistent/model/test_zbl_ener.py b/source/tests/consistent/model/test_zbl_ener.py
index 2783bb4a02..d6ceba73d3 100644
--- a/source/tests/consistent/model/test_zbl_ener.py
+++ b/source/tests/consistent/model/test_zbl_ener.py
@@ -15,6 +15,7 @@
 from ..common import (
     INSTALLED_JAX,
     INSTALLED_PT,
+    INSTALLED_PT_EXPT,
     SKIP_FLAG,
     CommonTest,
     parameterized,
@@ -33,6 +34,10 @@
     from deepmd.jax.model.model import get_model as get_model_jax
 else:
     DPZBLModelJAX = None
+if INSTALLED_PT_EXPT:
+    from deepmd.pt_expt.model import DPZBLModel as DPZBLModelPTExpt
+else:
+    DPZBLModelPTExpt = None
 import os
 
 from deepmd.utils.argcheck import (
@@ -92,6 +97,7 @@ def data(self) -> dict:
 
     dp_class = DPZBLModelDP
     pt_class = DPZBLModelPT
+    pt_expt_class = DPZBLModelPTExpt
     jax_class = DPZBLModelJAX
     args = model_args()
 
@@ -104,6 +110,8 @@ def get_reference_backend(self):
             return self.RefBackend.PT
         if not self.skip_tf:
             return self.RefBackend.TF
+        if not self.skip_pt_expt and self.pt_expt_class is not None:
+            return self.RefBackend.PT_EXPT
         if not self.skip_jax:
             return self.RefBackend.JAX
         if not self.skip_dp:
@@ -125,6 +133,9 @@ def pass_data_to_cls(self, cls, data) -> Any:
             return get_model_dp(data)
         elif cls is DPZBLModelPT:
             return get_model_pt(data)
+        elif cls is DPZBLModelPTExpt:
+            dp_model = get_model_dp(data)
+            return DPZBLModelPTExpt.deserialize(dp_model.serialize())
         elif cls is DPZBLModelJAX:
             return get_model_jax(data)
         return cls(**data, **self.additional_data)
@@ -196,6 +207,15 @@ def eval_pt(self, pt_obj: Any) -> Any:
             self.box,
         )
 
+    def eval_pt_expt(self, pt_expt_obj: Any) -> Any:
+        return self.eval_pt_expt_model(
+            pt_expt_obj,
+            self.natoms,
+            self.coords,
+            self.atype,
+            self.box,
+        )
+
     def eval_jax(self, jax_obj: Any) -> Any:
         return self.eval_jax_model(
             jax_obj,
@@ -218,6 +238,7 @@ def extract_ret(self, ret: Any, backend) -> tuple[np.ndarray, ...]:
             )
         elif backend in {
             self.RefBackend.PT,
+            self.RefBackend.PT_EXPT,
             self.RefBackend.JAX,
         }:
             return (
diff --git a/source/tests/pt_expt/model/test_dipole_model.py b/source/tests/pt_expt/model/test_dipole_model.py
new file mode 100644
index 0000000000..74752af535
--- /dev/null
+++ b/source/tests/pt_expt/model/test_dipole_model.py
@@ -0,0 +1,187 @@
+# SPDX-License-Identifier: LGPL-3.0-or-later
+import unittest
+
+import numpy as np
+import torch
+
+from deepmd.dpmodel.descriptor import DescrptSeA as DPDescrptSeA
+from deepmd.dpmodel.fitting import DipoleFitting as DPDipoleFitting
+from deepmd.dpmodel.model.dipole_model import DipoleModel as DPDipoleModel
+from deepmd.dpmodel.utils.nlist import (
+    build_neighbor_list,
+    extend_coord_with_ghosts,
+)
+from deepmd.dpmodel.utils.region import (
+    normalize_coord,
+)
+from deepmd.pt_expt.model import (
+    DipoleModel,
+)
+from deepmd.pt_expt.utils import (
+    env,
+)
+
+from ...seed import (
+    GLOBAL_SEED,
+)
+
+
+class TestDipoleModel(unittest.TestCase):
+    def setUp(self) -> None:
+        self.device = env.DEVICE
+        self.natoms = 5
+        self.rcut = 4.0
+        self.rcut_smth = 0.5
+        self.sel = [8, 6]
+        self.nt = 2
+        self.type_map = ["foo", "bar"]
+
+        generator = torch.Generator(device=self.device).manual_seed(GLOBAL_SEED)
+        cell = torch.rand(
+            [3, 3], dtype=torch.float64, device=self.device, generator=generator
+        )
+        cell = (cell + cell.T) + 5.0 * torch.eye(3, device=self.device)
+        self.cell = cell.unsqueeze(0)
+        coord = torch.rand(
+            [self.natoms, 3],
+            dtype=torch.float64,
+            device=self.device,
+            generator=generator,
+        )
+        coord = torch.matmul(coord, cell)
+        self.coord = coord.unsqueeze(0).to(self.device)
+        self.atype = torch.tensor(
+            [[0, 0, 0, 1, 1]], dtype=torch.int64, device=self.device
+        )
+
+    def _make_dp_model(self):
+        ds = DPDescrptSeA(self.rcut, self.rcut_smth, self.sel)
+        ft = DPDipoleFitting(
+            self.nt,
+            ds.get_dim_out(),
+            embedding_width=ds.get_dim_emb(),
+            seed=GLOBAL_SEED,
+        )
+        return DPDipoleModel(ds, ft, type_map=self.type_map)
+
+    def _prepare_lower_inputs(self):
+        coord_np = self.coord.detach().cpu().numpy()
+        atype_np = self.atype.detach().cpu().numpy()
+        cell_np = self.cell.reshape(1, 9).detach().cpu().numpy()
+        coord_normalized = normalize_coord(
+            coord_np.reshape(1, self.natoms, 3),
+            cell_np.reshape(1, 3, 3),
+        )
+        extended_coord, extended_atype, mapping = extend_coord_with_ghosts(
+            coord_normalized, atype_np, cell_np, self.rcut
+        )
+        nlist = build_neighbor_list(
+            extended_coord,
+            extended_atype,
+            self.natoms,
+            self.rcut,
+            self.sel,
+            distinguish_types=True,
+        )
+        extended_coord = extended_coord.reshape(1, -1, 3)
+        return (
+            torch.tensor(extended_coord, dtype=torch.float64, device=self.device),
+            torch.tensor(extended_atype, dtype=torch.int64, device=self.device),
+            torch.tensor(nlist, dtype=torch.int64, device=self.device),
+            torch.tensor(mapping, dtype=torch.int64, device=self.device),
+        )
+
+    def test_dp_consistency(self) -> None:
+        md_dp = self._make_dp_model()
+        md_pt = DipoleModel.deserialize(md_dp.serialize()).to(self.device)
+        md_pt.eval()
+
+        coord_np = self.coord.detach().cpu().numpy()
+        atype_np = self.atype.detach().cpu().numpy()
+        cell_np = self.cell.reshape(1, 9).detach().cpu().numpy()
+        ret_dp = md_dp(coord_np.reshape(1, -1), atype_np, cell_np)
+
+        coord = self.coord.clone().requires_grad_(True)
+        ret_pt = md_pt(coord, self.atype, self.cell.reshape(1, 9))
+
+        np.testing.assert_allclose(
+            ret_dp["global_dipole"],
+            ret_pt["global_dipole"].detach().cpu().numpy(),
+            rtol=1e-10,
+            atol=1e-10,
+        )
+        np.testing.assert_allclose(
+            ret_dp["dipole"],
+            ret_pt["dipole"].detach().cpu().numpy(),
+            rtol=1e-10,
+            atol=1e-10,
+        )
+
+    def test_output_keys(self) -> None:
+        md_dp = self._make_dp_model()
+        md_pt = DipoleModel.deserialize(md_dp.serialize()).to(self.device)
+        md_pt.eval()
+        coord = self.coord.clone().requires_grad_(True)
+        ret = md_pt(coord, self.atype, self.cell.reshape(1, 9))
+        self.assertIn("dipole", ret)
+        self.assertIn("global_dipole", ret)
+
+    def test_forward_lower_exportable(self) -> None:
+        md_dp = self._make_dp_model()
+        md_pt = DipoleModel.deserialize(md_dp.serialize()).to(self.device)
+        md_pt.eval()
+
+        ext_coord, ext_atype, nlist_t, mapping_t = self._prepare_lower_inputs()
+        fparam = None
+        aparam = None
+
+        ret_eager = md_pt._forward_lower(
+            ext_coord.requires_grad_(True),
+            ext_atype,
+            nlist_t,
+            mapping_t,
+            fparam=fparam,
+            aparam=aparam,
+        )
+
+        traced = md_pt.forward_lower_exportable(
+            ext_coord,
+            ext_atype,
+            nlist_t,
+            mapping_t,
+            fparam=fparam,
+            aparam=aparam,
+        )
+        self.assertIsInstance(traced, torch.nn.Module)
+
+        exported = torch.export.export(
+            traced,
+            (ext_coord, ext_atype, nlist_t, mapping_t, fparam, aparam),
+            strict=False,
+        )
+        self.assertIsNotNone(exported)
+
+        ret_traced = traced(ext_coord, ext_atype, nlist_t, mapping_t, fparam, aparam)
+        ret_exported = exported.module()(
+            ext_coord, ext_atype, nlist_t, mapping_t, fparam, aparam
+        )
+
+        for key in ("dipole", "global_dipole"):
+            np.testing.assert_allclose(
+                ret_eager[key].detach().cpu().numpy(),
+                ret_traced[key].detach().cpu().numpy(),
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"traced vs eager: {key}",
+            )
+            np.testing.assert_allclose(
+                ret_eager[key].detach().cpu().numpy(),
+                ret_exported[key].detach().cpu().numpy(),
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"exported vs eager: {key}",
+            )
+
+
+if __name__ == "__main__":
+    unittest.main()
diff --git a/source/tests/pt_expt/model/test_dos_model.py b/source/tests/pt_expt/model/test_dos_model.py
new file mode 100644
index 0000000000..37c8262fda
--- /dev/null
+++ b/source/tests/pt_expt/model/test_dos_model.py
@@ -0,0 +1,187 @@
+# SPDX-License-Identifier: LGPL-3.0-or-later
+import unittest
+
+import numpy as np
+import torch
+
+from deepmd.dpmodel.descriptor import DescrptSeA as DPDescrptSeA
+from deepmd.dpmodel.fitting import DOSFittingNet as DPDOSFittingNet
+from deepmd.dpmodel.model.dos_model import DOSModel as DPDOSModel
+from deepmd.dpmodel.utils.nlist import (
+    build_neighbor_list,
+    extend_coord_with_ghosts,
+)
+from deepmd.dpmodel.utils.region import (
+    normalize_coord,
+)
+from deepmd.pt_expt.model import (
+    DOSModel,
+)
+from deepmd.pt_expt.utils import (
+    env,
+)
+
+from ...seed import (
+    GLOBAL_SEED,
+)
+
+
+class TestDOSModel(unittest.TestCase):
+    def setUp(self) -> None:
+        self.device = env.DEVICE
+        self.natoms = 5
+        self.rcut = 4.0
+        self.rcut_smth = 0.5
+        self.sel = [8, 6]
+        self.nt = 2
+        self.type_map = ["foo", "bar"]
+
+        generator = torch.Generator(device=self.device).manual_seed(GLOBAL_SEED)
+        cell = torch.rand(
+            [3, 3], dtype=torch.float64, device=self.device, generator=generator
+        )
+        cell = (cell + cell.T) + 5.0 * torch.eye(3, device=self.device)
+        self.cell = cell.unsqueeze(0)
+        coord = torch.rand(
+            [self.natoms, 3],
+            dtype=torch.float64,
+            device=self.device,
+            generator=generator,
+        )
+        coord = torch.matmul(coord, cell)
+        self.coord = coord.unsqueeze(0).to(self.device)
+        self.atype = torch.tensor(
+            [[0, 0, 0, 1, 1]], dtype=torch.int64, device=self.device
+        )
+
+    def _make_dp_model(self):
+        ds = DPDescrptSeA(self.rcut, self.rcut_smth, self.sel)
+        ft = DPDOSFittingNet(
+            self.nt,
+            ds.get_dim_out(),
+            numb_dos=10,
+            seed=GLOBAL_SEED,
+        )
+        return DPDOSModel(ds, ft, type_map=self.type_map)
+
+    def _prepare_lower_inputs(self):
+        coord_np = self.coord.detach().cpu().numpy()
+        atype_np = self.atype.detach().cpu().numpy()
+        cell_np = self.cell.reshape(1, 9).detach().cpu().numpy()
+        coord_normalized = normalize_coord(
+            coord_np.reshape(1, self.natoms, 3),
+            cell_np.reshape(1, 3, 3),
+        )
+        extended_coord, extended_atype, mapping = extend_coord_with_ghosts(
+            coord_normalized, atype_np, cell_np, self.rcut
+        )
+        nlist = build_neighbor_list(
+            extended_coord,
+            extended_atype,
+            self.natoms,
+            self.rcut,
+            self.sel,
+            distinguish_types=True,
+        )
+        extended_coord = extended_coord.reshape(1, -1, 3)
+        return (
+            torch.tensor(extended_coord, dtype=torch.float64, device=self.device),
+            torch.tensor(extended_atype, dtype=torch.int64, device=self.device),
+            torch.tensor(nlist, dtype=torch.int64, device=self.device),
+            torch.tensor(mapping, dtype=torch.int64, device=self.device),
+        )
+
+    def test_dp_consistency(self) -> None:
+        md_dp = self._make_dp_model()
+        md_pt = DOSModel.deserialize(md_dp.serialize()).to(self.device)
+        md_pt.eval()
+
+        coord_np = self.coord.detach().cpu().numpy()
+        atype_np = self.atype.detach().cpu().numpy()
+        cell_np = self.cell.reshape(1, 9).detach().cpu().numpy()
+        ret_dp = md_dp(coord_np.reshape(1, -1), atype_np, cell_np)
+
+        coord = self.coord.clone().requires_grad_(True)
+        ret_pt = md_pt(coord, self.atype, self.cell.reshape(1, 9))
+
+        np.testing.assert_allclose(
+            ret_dp["dos"],
+            ret_pt["dos"].detach().cpu().numpy(),
+            rtol=1e-10,
+            atol=1e-10,
+        )
+        np.testing.assert_allclose(
+            ret_dp["atom_dos"],
+            ret_pt["atom_dos"].detach().cpu().numpy(),
+            rtol=1e-10,
+            atol=1e-10,
+        )
+
+    def test_output_keys(self) -> None:
+        md_dp = self._make_dp_model()
+        md_pt = DOSModel.deserialize(md_dp.serialize()).to(self.device)
+        md_pt.eval()
+        coord = self.coord.clone().requires_grad_(True)
+        ret = md_pt(coord, self.atype, self.cell.reshape(1, 9))
+        self.assertIn("dos", ret)
+        self.assertIn("atom_dos", ret)
+
+    def test_forward_lower_exportable(self) -> None:
+        md_dp = self._make_dp_model()
+        md_pt = DOSModel.deserialize(md_dp.serialize()).to(self.device)
+        md_pt.eval()
+
+        ext_coord, ext_atype, nlist_t, mapping_t = self._prepare_lower_inputs()
+        fparam = None
+        aparam = None
+
+        ret_eager = md_pt._forward_lower(
+            ext_coord.requires_grad_(True),
+            ext_atype,
+            nlist_t,
+            mapping_t,
+            fparam=fparam,
+            aparam=aparam,
+        )
+
+        traced = md_pt.forward_lower_exportable(
+            ext_coord,
+            ext_atype,
+            nlist_t,
+            mapping_t,
+            fparam=fparam,
+            aparam=aparam,
+        )
+        self.assertIsInstance(traced, torch.nn.Module)
+
+        exported = torch.export.export(
+            traced,
+            (ext_coord, ext_atype, nlist_t, mapping_t, fparam, aparam),
+            strict=False,
+        )
+        self.assertIsNotNone(exported)
+
+        ret_traced = traced(ext_coord, ext_atype, nlist_t, mapping_t, fparam, aparam)
+        ret_exported = exported.module()(
+            ext_coord, ext_atype, nlist_t, mapping_t, fparam, aparam
+        )
+
+        for key in ("atom_dos", "dos"):
+            np.testing.assert_allclose(
+                ret_eager[key].detach().cpu().numpy(),
+                ret_traced[key].detach().cpu().numpy(),
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"traced vs eager: {key}",
+            )
+            np.testing.assert_allclose(
+                ret_eager[key].detach().cpu().numpy(),
+                ret_exported[key].detach().cpu().numpy(),
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"exported vs eager: {key}",
+            )
+
+
+if __name__ == "__main__":
+    unittest.main()
diff --git a/source/tests/pt_expt/model/test_dp_zbl_model.py b/source/tests/pt_expt/model/test_dp_zbl_model.py
new file mode 100644
index 0000000000..534fc01d78
--- /dev/null
+++ b/source/tests/pt_expt/model/test_dp_zbl_model.py
@@ -0,0 +1,237 @@
+# SPDX-License-Identifier: LGPL-3.0-or-later
+import os
+import unittest
+
+import numpy as np
+import torch
+
+from deepmd.dpmodel.atomic_model import (
+    DPAtomicModel,
+)
+from deepmd.dpmodel.atomic_model.pairtab_atomic_model import (
+    PairTabAtomicModel,
+)
+from deepmd.dpmodel.descriptor import DescrptDPA1 as DPDescrptDPA1
+from deepmd.dpmodel.fitting import InvarFitting as DPInvarFitting
+from deepmd.dpmodel.model.dp_zbl_model import DPZBLModel as DPDPZBLModel
+from deepmd.dpmodel.utils.nlist import (
+    build_neighbor_list,
+    extend_coord_with_ghosts,
+)
+from deepmd.dpmodel.utils.region import (
+    normalize_coord,
+)
+from deepmd.pt_expt.model import (
+    DPZBLModel,
+)
+from deepmd.pt_expt.utils import (
+    env,
+)
+
+from ...seed import (
+    GLOBAL_SEED,
+)
+
+TESTS_DIR = os.path.dirname(os.path.dirname(os.path.dirname(__file__)))
+TAB_FILE = os.path.join(
+    TESTS_DIR,
+    "pt",
+    "model",
+    "water",
+    "data",
+    "zbl_tab_potential",
+    "H2O_tab_potential.txt",
+)
+
+
+class TestDPZBLModel(unittest.TestCase):
+    def setUp(self) -> None:
+        self.device = env.DEVICE
+        self.natoms = 5
+        self.rcut = 4.0
+        self.rcut_smth = 0.5
+        self.sel = 20
+        self.nt = 3
+        self.type_map = ["O", "H", "B"]
+
+        generator = torch.Generator(device=self.device).manual_seed(GLOBAL_SEED)
+        cell = torch.rand(
+            [3, 3], dtype=torch.float64, device=self.device, generator=generator
+        )
+        cell = (cell + cell.T) + 5.0 * torch.eye(3, device=self.device)
+        self.cell = cell.unsqueeze(0)
+        coord = torch.rand(
+            [self.natoms, 3],
+            dtype=torch.float64,
+            device=self.device,
+            generator=generator,
+        )
+        coord = torch.matmul(coord, cell)
+        self.coord = coord.unsqueeze(0).to(self.device)
+        self.atype = torch.tensor(
+            [[0, 0, 1, 1, 2]], dtype=torch.int64, device=self.device
+        )
+
+    def _make_dp_model(self):
+        ds = DPDescrptDPA1(
+            rcut_smth=self.rcut_smth,
+            rcut=self.rcut,
+            sel=self.sel,
+            ntypes=self.nt,
+            neuron=[3, 6],
+            axis_neuron=2,
+            attn=4,
+            attn_layer=2,
+            attn_dotr=True,
+            attn_mask=False,
+            activation_function="tanh",
+            set_davg_zero=True,
+            type_one_side=True,
+            seed=GLOBAL_SEED,
+        )
+        ft = DPInvarFitting(
+            "energy",
+            self.nt,
+            ds.get_dim_out(),
+            1,
+            mixed_types=ds.mixed_types(),
+            seed=GLOBAL_SEED,
+        )
+        dp_model = DPAtomicModel(ds, ft, type_map=self.type_map)
+        zbl_model = PairTabAtomicModel(
+            tab_file=TAB_FILE,
+            rcut=self.rcut,
+            sel=self.sel,
+            type_map=self.type_map,
+        )
+        return DPDPZBLModel(
+            dp_model,
+            zbl_model,
+            sw_rmin=0.2,
+            sw_rmax=4.0,
+            type_map=self.type_map,
+        )
+
+    def _prepare_lower_inputs(self):
+        coord_np = self.coord.detach().cpu().numpy()
+        atype_np = self.atype.detach().cpu().numpy()
+        cell_np = self.cell.reshape(1, 9).detach().cpu().numpy()
+        coord_normalized = normalize_coord(
+            coord_np.reshape(1, self.natoms, 3),
+            cell_np.reshape(1, 3, 3),
+        )
+        extended_coord, extended_atype, mapping = extend_coord_with_ghosts(
+            coord_normalized, atype_np, cell_np, self.rcut
+        )
+        nlist = build_neighbor_list(
+            extended_coord,
+            extended_atype,
+            self.natoms,
+            self.rcut,
+            [self.sel],
+            distinguish_types=False,
+        )
+        extended_coord = extended_coord.reshape(1, -1, 3)
+        return (
+            torch.tensor(extended_coord, dtype=torch.float64, device=self.device),
+            torch.tensor(extended_atype, dtype=torch.int64, device=self.device),
+            torch.tensor(nlist, dtype=torch.int64, device=self.device),
+            torch.tensor(mapping, dtype=torch.int64, device=self.device),
+        )
+
+    def test_dp_consistency(self) -> None:
+        md_dp = self._make_dp_model()
+        md_pt = DPZBLModel.deserialize(md_dp.serialize()).to(self.device)
+        md_pt.eval()
+
+        coord_np = self.coord.detach().cpu().numpy()
+        atype_np = self.atype.detach().cpu().numpy()
+        cell_np = self.cell.reshape(1, 9).detach().cpu().numpy()
+        ret_dp = md_dp(coord_np.reshape(1, -1), atype_np, cell_np)
+
+        coord = self.coord.clone().requires_grad_(True)
+        ret_pt = md_pt(coord, self.atype, self.cell.reshape(1, 9))
+
+        np.testing.assert_allclose(
+            ret_dp["energy"],
+            ret_pt["energy"].detach().cpu().numpy(),
+            rtol=1e-10,
+            atol=1e-10,
+        )
+        np.testing.assert_allclose(
+            ret_dp["atom_energy"],
+            ret_pt["atom_energy"].detach().cpu().numpy(),
+            rtol=1e-10,
+            atol=1e-10,
+        )
+
+    def test_output_keys(self) -> None:
+        md_dp = self._make_dp_model()
+        md_pt = DPZBLModel.deserialize(md_dp.serialize()).to(self.device)
+        md_pt.eval()
+        coord = self.coord.clone().requires_grad_(True)
+        ret = md_pt(coord, self.atype, self.cell.reshape(1, 9))
+        self.assertIn("energy", ret)
+        self.assertIn("atom_energy", ret)
+        self.assertIn("force", ret)
+        self.assertIn("virial", ret)
+
+    def test_forward_lower_exportable(self) -> None:
+        md_dp = self._make_dp_model()
+        md_pt = DPZBLModel.deserialize(md_dp.serialize()).to(self.device)
+        md_pt.eval()
+
+        ext_coord, ext_atype, nlist_t, mapping_t = self._prepare_lower_inputs()
+        fparam = None
+        aparam = None
+
+        ret_eager = md_pt._forward_lower(
+            ext_coord.requires_grad_(True),
+            ext_atype,
+            nlist_t,
+            mapping_t,
+            fparam=fparam,
+            aparam=aparam,
+        )
+
+        traced = md_pt.forward_lower_exportable(
+            ext_coord,
+            ext_atype,
+            nlist_t,
+            mapping_t,
+            fparam=fparam,
+            aparam=aparam,
+        )
+        self.assertIsInstance(traced, torch.nn.Module)
+
+        exported = torch.export.export(
+            traced,
+            (ext_coord, ext_atype, nlist_t, mapping_t, fparam, aparam),
+            strict=False,
+        )
+        self.assertIsNotNone(exported)
+
+        ret_traced = traced(ext_coord, ext_atype, nlist_t, mapping_t, fparam, aparam)
+        ret_exported = exported.module()(
+            ext_coord, ext_atype, nlist_t, mapping_t, fparam, aparam
+        )
+
+        for key in ("atom_energy", "energy"):
+            np.testing.assert_allclose(
+                ret_eager[key].detach().cpu().numpy(),
+                ret_traced[key].detach().cpu().numpy(),
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"traced vs eager: {key}",
+            )
+            np.testing.assert_allclose(
+                ret_eager[key].detach().cpu().numpy(),
+                ret_exported[key].detach().cpu().numpy(),
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"exported vs eager: {key}",
+            )
+
+
+if __name__ == "__main__":
+    unittest.main()
diff --git a/source/tests/pt_expt/model/test_polar_model.py b/source/tests/pt_expt/model/test_polar_model.py
new file mode 100644
index 0000000000..f18b831d44
--- /dev/null
+++ b/source/tests/pt_expt/model/test_polar_model.py
@@ -0,0 +1,187 @@
+# SPDX-License-Identifier: LGPL-3.0-or-later
+import unittest
+
+import numpy as np
+import torch
+
+from deepmd.dpmodel.descriptor import DescrptSeA as DPDescrptSeA
+from deepmd.dpmodel.fitting import PolarFitting as DPPolarFitting
+from deepmd.dpmodel.model.polar_model import PolarModel as DPPolarModel
+from deepmd.dpmodel.utils.nlist import (
+    build_neighbor_list,
+    extend_coord_with_ghosts,
+)
+from deepmd.dpmodel.utils.region import (
+    normalize_coord,
+)
+from deepmd.pt_expt.model import (
+    PolarModel,
+)
+from deepmd.pt_expt.utils import (
+    env,
+)
+
+from ...seed import (
+    GLOBAL_SEED,
+)
+
+
+class TestPolarModel(unittest.TestCase):
+    def setUp(self) -> None:
+        self.device = env.DEVICE
+        self.natoms = 5
+        self.rcut = 4.0
+        self.rcut_smth = 0.5
+        self.sel = [8, 6]
+        self.nt = 2
+        self.type_map = ["foo", "bar"]
+
+        generator = torch.Generator(device=self.device).manual_seed(GLOBAL_SEED)
+        cell = torch.rand(
+            [3, 3], dtype=torch.float64, device=self.device, generator=generator
+        )
+        cell = (cell + cell.T) + 5.0 * torch.eye(3, device=self.device)
+        self.cell = cell.unsqueeze(0)
+        coord = torch.rand(
+            [self.natoms, 3],
+            dtype=torch.float64,
+            device=self.device,
+            generator=generator,
+        )
+        coord = torch.matmul(coord, cell)
+        self.coord = coord.unsqueeze(0).to(self.device)
+        self.atype = torch.tensor(
+            [[0, 0, 0, 1, 1]], dtype=torch.int64, device=self.device
+        )
+
+    def _make_dp_model(self):
+        ds = DPDescrptSeA(self.rcut, self.rcut_smth, self.sel)
+        ft = DPPolarFitting(
+            self.nt,
+            ds.get_dim_out(),
+            embedding_width=ds.get_dim_emb(),
+            seed=GLOBAL_SEED,
+        )
+        return DPPolarModel(ds, ft, type_map=self.type_map)
+
+    def _prepare_lower_inputs(self):
+        coord_np = self.coord.detach().cpu().numpy()
+        atype_np = self.atype.detach().cpu().numpy()
+        cell_np = self.cell.reshape(1, 9).detach().cpu().numpy()
+        coord_normalized = normalize_coord(
+            coord_np.reshape(1, self.natoms, 3),
+            cell_np.reshape(1, 3, 3),
+        )
+        extended_coord, extended_atype, mapping = extend_coord_with_ghosts(
+            coord_normalized, atype_np, cell_np, self.rcut
+        )
+        nlist = build_neighbor_list(
+            extended_coord,
+            extended_atype,
+            self.natoms,
+            self.rcut,
+            self.sel,
+            distinguish_types=True,
+        )
+        extended_coord = extended_coord.reshape(1, -1, 3)
+        return (
+            torch.tensor(extended_coord, dtype=torch.float64, device=self.device),
+            torch.tensor(extended_atype, dtype=torch.int64, device=self.device),
+            torch.tensor(nlist, dtype=torch.int64, device=self.device),
+            torch.tensor(mapping, dtype=torch.int64, device=self.device),
+        )
+
+    def test_dp_consistency(self) -> None:
+        md_dp = self._make_dp_model()
+        md_pt = PolarModel.deserialize(md_dp.serialize()).to(self.device)
+        md_pt.eval()
+
+        coord_np = self.coord.detach().cpu().numpy()
+        atype_np = self.atype.detach().cpu().numpy()
+        cell_np = self.cell.reshape(1, 9).detach().cpu().numpy()
+        ret_dp = md_dp(coord_np.reshape(1, -1), atype_np, cell_np)
+
+        coord = self.coord.clone().requires_grad_(True)
+        ret_pt = md_pt(coord, self.atype, self.cell.reshape(1, 9))
+
+        np.testing.assert_allclose(
+            ret_dp["global_polar"],
+            ret_pt["global_polar"].detach().cpu().numpy(),
+            rtol=1e-10,
+            atol=1e-10,
+        )
+        np.testing.assert_allclose(
+            ret_dp["polar"],
+            ret_pt["polar"].detach().cpu().numpy(),
+            rtol=1e-10,
+            atol=1e-10,
+        )
+
+    def test_output_keys(self) -> None:
+        md_dp = self._make_dp_model()
+        md_pt = PolarModel.deserialize(md_dp.serialize()).to(self.device)
+        md_pt.eval()
+        coord = self.coord.clone().requires_grad_(True)
+        ret = md_pt(coord, self.atype, self.cell.reshape(1, 9))
+        self.assertIn("polar", ret)
+        self.assertIn("global_polar", ret)
+
+    def test_forward_lower_exportable(self) -> None:
+        md_dp = self._make_dp_model()
+        md_pt = PolarModel.deserialize(md_dp.serialize()).to(self.device)
+        md_pt.eval()
+
+        ext_coord, ext_atype, nlist_t, mapping_t = self._prepare_lower_inputs()
+        fparam = None
+        aparam = None
+
+        ret_eager = md_pt._forward_lower(
+            ext_coord.requires_grad_(True),
+            ext_atype,
+            nlist_t,
+            mapping_t,
+            fparam=fparam,
+            aparam=aparam,
+        )
+
+        traced = md_pt.forward_lower_exportable(
+            ext_coord,
+            ext_atype,
+            nlist_t,
+            mapping_t,
+            fparam=fparam,
+            aparam=aparam,
+        )
+        self.assertIsInstance(traced, torch.nn.Module)
+
+        exported = torch.export.export(
+            traced,
+            (ext_coord, ext_atype, nlist_t, mapping_t, fparam, aparam),
+            strict=False,
+        )
+        self.assertIsNotNone(exported)
+
+        ret_traced = traced(ext_coord, ext_atype, nlist_t, mapping_t, fparam, aparam)
+        ret_exported = exported.module()(
+            ext_coord, ext_atype, nlist_t, mapping_t, fparam, aparam
+        )
+
+        for key in ("polar", "global_polar"):
+            np.testing.assert_allclose(
+                ret_eager[key].detach().cpu().numpy(),
+                ret_traced[key].detach().cpu().numpy(),
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"traced vs eager: {key}",
+            )
+            np.testing.assert_allclose(
+                ret_eager[key].detach().cpu().numpy(),
+                ret_exported[key].detach().cpu().numpy(),
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"exported vs eager: {key}",
+            )
+
+
+if __name__ == "__main__":
+    unittest.main()
diff --git a/source/tests/pt_expt/model/test_property_model.py b/source/tests/pt_expt/model/test_property_model.py
new file mode 100644
index 0000000000..27c144ef7a
--- /dev/null
+++ b/source/tests/pt_expt/model/test_property_model.py
@@ -0,0 +1,190 @@
+# SPDX-License-Identifier: LGPL-3.0-or-later
+import unittest
+
+import numpy as np
+import torch
+
+from deepmd.dpmodel.descriptor import DescrptSeA as DPDescrptSeA
+from deepmd.dpmodel.fitting import PropertyFittingNet as DPPropertyFittingNet
+from deepmd.dpmodel.model.property_model import PropertyModel as DPPropertyModel
+from deepmd.dpmodel.utils.nlist import (
+    build_neighbor_list,
+    extend_coord_with_ghosts,
+)
+from deepmd.dpmodel.utils.region import (
+    normalize_coord,
+)
+from deepmd.pt_expt.model import (
+    PropertyModel,
+)
+from deepmd.pt_expt.utils import (
+    env,
+)
+
+from ...seed import (
+    GLOBAL_SEED,
+)
+
+
+class TestPropertyModel(unittest.TestCase):
+    def setUp(self) -> None:
+        self.device = env.DEVICE
+        self.natoms = 5
+        self.rcut = 4.0
+        self.rcut_smth = 0.5
+        self.sel = [8, 6]
+        self.nt = 2
+        self.type_map = ["foo", "bar"]
+
+        generator = torch.Generator(device=self.device).manual_seed(GLOBAL_SEED)
+        cell = torch.rand(
+            [3, 3], dtype=torch.float64, device=self.device, generator=generator
+        )
+        cell = (cell + cell.T) + 5.0 * torch.eye(3, device=self.device)
+        self.cell = cell.unsqueeze(0)
+        coord = torch.rand(
+            [self.natoms, 3],
+            dtype=torch.float64,
+            device=self.device,
+            generator=generator,
+        )
+        coord = torch.matmul(coord, cell)
+        self.coord = coord.unsqueeze(0).to(self.device)
+        self.atype = torch.tensor(
+            [[0, 0, 0, 1, 1]], dtype=torch.int64, device=self.device
+        )
+
+    def _make_dp_model(self):
+        ds = DPDescrptSeA(self.rcut, self.rcut_smth, self.sel)
+        ft = DPPropertyFittingNet(
+            self.nt,
+            ds.get_dim_out(),
+            task_dim=3,
+            seed=GLOBAL_SEED,
+        )
+        return DPPropertyModel(ds, ft, type_map=self.type_map)
+
+    def _prepare_lower_inputs(self):
+        coord_np = self.coord.detach().cpu().numpy()
+        atype_np = self.atype.detach().cpu().numpy()
+        cell_np = self.cell.reshape(1, 9).detach().cpu().numpy()
+        coord_normalized = normalize_coord(
+            coord_np.reshape(1, self.natoms, 3),
+            cell_np.reshape(1, 3, 3),
+        )
+        extended_coord, extended_atype, mapping = extend_coord_with_ghosts(
+            coord_normalized, atype_np, cell_np, self.rcut
+        )
+        nlist = build_neighbor_list(
+            extended_coord,
+            extended_atype,
+            self.natoms,
+            self.rcut,
+            self.sel,
+            distinguish_types=True,
+        )
+        extended_coord = extended_coord.reshape(1, -1, 3)
+        return (
+            torch.tensor(extended_coord, dtype=torch.float64, device=self.device),
+            torch.tensor(extended_atype, dtype=torch.int64, device=self.device),
+            torch.tensor(nlist, dtype=torch.int64, device=self.device),
+            torch.tensor(mapping, dtype=torch.int64, device=self.device),
+        )
+
+    def test_dp_consistency(self) -> None:
+        md_dp = self._make_dp_model()
+        md_pt = PropertyModel.deserialize(md_dp.serialize()).to(self.device)
+        md_pt.eval()
+
+        coord_np = self.coord.detach().cpu().numpy()
+        atype_np = self.atype.detach().cpu().numpy()
+        cell_np = self.cell.reshape(1, 9).detach().cpu().numpy()
+        ret_dp = md_dp(coord_np.reshape(1, -1), atype_np, cell_np)
+
+        coord = self.coord.clone().requires_grad_(True)
+        ret_pt = md_pt(coord, self.atype, self.cell.reshape(1, 9))
+
+        var_name = md_pt.get_var_name()
+        np.testing.assert_allclose(
+            ret_dp[var_name],
+            ret_pt[var_name].detach().cpu().numpy(),
+            rtol=1e-10,
+            atol=1e-10,
+        )
+        np.testing.assert_allclose(
+            ret_dp[f"atom_{var_name}"],
+            ret_pt[f"atom_{var_name}"].detach().cpu().numpy(),
+            rtol=1e-10,
+            atol=1e-10,
+        )
+
+    def test_output_keys(self) -> None:
+        md_dp = self._make_dp_model()
+        md_pt = PropertyModel.deserialize(md_dp.serialize()).to(self.device)
+        md_pt.eval()
+        coord = self.coord.clone().requires_grad_(True)
+        ret = md_pt(coord, self.atype, self.cell.reshape(1, 9))
+        var_name = md_pt.get_var_name()
+        self.assertIn(var_name, ret)
+        self.assertIn(f"atom_{var_name}", ret)
+
+    def test_forward_lower_exportable(self) -> None:
+        md_dp = self._make_dp_model()
+        md_pt = PropertyModel.deserialize(md_dp.serialize()).to(self.device)
+        md_pt.eval()
+
+        ext_coord, ext_atype, nlist_t, mapping_t = self._prepare_lower_inputs()
+        fparam = None
+        aparam = None
+
+        ret_eager = md_pt._forward_lower(
+            ext_coord.requires_grad_(True),
+            ext_atype,
+            nlist_t,
+            mapping_t,
+            fparam=fparam,
+            aparam=aparam,
+        )
+
+        traced = md_pt.forward_lower_exportable(
+            ext_coord,
+            ext_atype,
+            nlist_t,
+            mapping_t,
+            fparam=fparam,
+            aparam=aparam,
+        )
+        self.assertIsInstance(traced, torch.nn.Module)
+
+        exported = torch.export.export(
+            traced,
+            (ext_coord, ext_atype, nlist_t, mapping_t, fparam, aparam),
+            strict=False,
+        )
+        self.assertIsNotNone(exported)
+
+        ret_traced = traced(ext_coord, ext_atype, nlist_t, mapping_t, fparam, aparam)
+        ret_exported = exported.module()(
+            ext_coord, ext_atype, nlist_t, mapping_t, fparam, aparam
+        )
+
+        var_name = md_pt.get_var_name()
+        for key in (f"atom_{var_name}", var_name):
+            np.testing.assert_allclose(
+                ret_eager[key].detach().cpu().numpy(),
+                ret_traced[key].detach().cpu().numpy(),
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"traced vs eager: {key}",
+            )
+            np.testing.assert_allclose(
+                ret_eager[key].detach().cpu().numpy(),
+                ret_exported[key].detach().cpu().numpy(),
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"exported vs eager: {key}",
+            )
+
+
+if __name__ == "__main__":
+    unittest.main()

From 553b91d56cb47c1b77a13f368cd8d6109644c7d0 Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Sun, 22 Feb 2026 21:45:07 +0800
Subject: [PATCH 04/63] rm _forward_lower

---
 deepmd/pt_expt/model/dipole_model.py          | 24 ++---------------
 deepmd/pt_expt/model/dos_model.py             | 24 ++---------------
 deepmd/pt_expt/model/dp_zbl_model.py          | 24 ++---------------
 deepmd/pt_expt/model/ener_model.py            | 26 +++----------------
 deepmd/pt_expt/model/polar_model.py           | 24 ++---------------
 deepmd/pt_expt/model/property_model.py        | 24 ++---------------
 .../tests/pt_expt/model/test_dipole_model.py  |  2 +-
 source/tests/pt_expt/model/test_dos_model.py  |  2 +-
 .../tests/pt_expt/model/test_dp_zbl_model.py  |  2 +-
 source/tests/pt_expt/model/test_ener_model.py |  4 +--
 .../tests/pt_expt/model/test_polar_model.py   |  2 +-
 .../pt_expt/model/test_property_model.py      |  2 +-
 12 files changed, 20 insertions(+), 140 deletions(-)

diff --git a/deepmd/pt_expt/model/dipole_model.py b/deepmd/pt_expt/model/dipole_model.py
index 5839120c72..a2830be7a3 100644
--- a/deepmd/pt_expt/model/dipole_model.py
+++ b/deepmd/pt_expt/model/dipole_model.py
@@ -63,7 +63,7 @@ def forward(
             model_predict["mask"] = model_ret["mask"]
         return model_predict
 
-    def _forward_lower(
+    def forward_lower(
         self,
         extended_coord: torch.Tensor,
         extended_atype: torch.Tensor,
@@ -95,26 +95,6 @@ def _forward_lower(
             model_predict["mask"] = model_ret["mask"]
         return model_predict
 
-    def forward_lower(
-        self,
-        extended_coord: torch.Tensor,
-        extended_atype: torch.Tensor,
-        nlist: torch.Tensor,
-        mapping: torch.Tensor | None = None,
-        fparam: torch.Tensor | None = None,
-        aparam: torch.Tensor | None = None,
-        do_atomic_virial: bool = False,
-    ) -> dict[str, torch.Tensor]:
-        return self._forward_lower(
-            extended_coord,
-            extended_atype,
-            nlist,
-            mapping,
-            fparam=fparam,
-            aparam=aparam,
-            do_atomic_virial=do_atomic_virial,
-        )
-
     def forward_lower_exportable(
         self,
         extended_coord: torch.Tensor,
@@ -136,7 +116,7 @@ def fn(
             aparam: torch.Tensor | None,
         ) -> dict[str, torch.Tensor]:
             extended_coord = extended_coord.detach().requires_grad_(True)
-            return model._forward_lower(
+            return model.forward_lower(
                 extended_coord,
                 extended_atype,
                 nlist,
diff --git a/deepmd/pt_expt/model/dos_model.py b/deepmd/pt_expt/model/dos_model.py
index ac4b76f51d..82991cdb59 100644
--- a/deepmd/pt_expt/model/dos_model.py
+++ b/deepmd/pt_expt/model/dos_model.py
@@ -57,7 +57,7 @@ def forward(
             model_predict["mask"] = model_ret["mask"]
         return model_predict
 
-    def _forward_lower(
+    def forward_lower(
         self,
         extended_coord: torch.Tensor,
         extended_atype: torch.Tensor,
@@ -83,26 +83,6 @@ def _forward_lower(
             model_predict["mask"] = model_ret["mask"]
         return model_predict
 
-    def forward_lower(
-        self,
-        extended_coord: torch.Tensor,
-        extended_atype: torch.Tensor,
-        nlist: torch.Tensor,
-        mapping: torch.Tensor | None = None,
-        fparam: torch.Tensor | None = None,
-        aparam: torch.Tensor | None = None,
-        do_atomic_virial: bool = False,
-    ) -> dict[str, torch.Tensor]:
-        return self._forward_lower(
-            extended_coord,
-            extended_atype,
-            nlist,
-            mapping,
-            fparam=fparam,
-            aparam=aparam,
-            do_atomic_virial=do_atomic_virial,
-        )
-
     def forward_lower_exportable(
         self,
         extended_coord: torch.Tensor,
@@ -124,7 +104,7 @@ def fn(
             aparam: torch.Tensor | None,
         ) -> dict[str, torch.Tensor]:
             extended_coord = extended_coord.detach().requires_grad_(True)
-            return model._forward_lower(
+            return model.forward_lower(
                 extended_coord,
                 extended_atype,
                 nlist,
diff --git a/deepmd/pt_expt/model/dp_zbl_model.py b/deepmd/pt_expt/model/dp_zbl_model.py
index 857498aab9..83dbd900e3 100644
--- a/deepmd/pt_expt/model/dp_zbl_model.py
+++ b/deepmd/pt_expt/model/dp_zbl_model.py
@@ -63,7 +63,7 @@ def forward(
             model_predict["mask"] = model_ret["mask"]
         return model_predict
 
-    def _forward_lower(
+    def forward_lower(
         self,
         extended_coord: torch.Tensor,
         extended_atype: torch.Tensor,
@@ -97,26 +97,6 @@ def _forward_lower(
             model_predict["mask"] = model_ret["mask"]
         return model_predict
 
-    def forward_lower(
-        self,
-        extended_coord: torch.Tensor,
-        extended_atype: torch.Tensor,
-        nlist: torch.Tensor,
-        mapping: torch.Tensor | None = None,
-        fparam: torch.Tensor | None = None,
-        aparam: torch.Tensor | None = None,
-        do_atomic_virial: bool = False,
-    ) -> dict[str, torch.Tensor]:
-        return self._forward_lower(
-            extended_coord,
-            extended_atype,
-            nlist,
-            mapping,
-            fparam=fparam,
-            aparam=aparam,
-            do_atomic_virial=do_atomic_virial,
-        )
-
     def forward_lower_exportable(
         self,
         extended_coord: torch.Tensor,
@@ -138,7 +118,7 @@ def fn(
             aparam: torch.Tensor | None,
         ) -> dict[str, torch.Tensor]:
             extended_coord = extended_coord.detach().requires_grad_(True)
-            return model._forward_lower(
+            return model.forward_lower(
                 extended_coord,
                 extended_atype,
                 nlist,
diff --git a/deepmd/pt_expt/model/ener_model.py b/deepmd/pt_expt/model/ener_model.py
index 5f30f3a227..fa07f3e3b2 100644
--- a/deepmd/pt_expt/model/ener_model.py
+++ b/deepmd/pt_expt/model/ener_model.py
@@ -63,7 +63,7 @@ def forward(
             model_predict["mask"] = model_ret["mask"]
         return model_predict
 
-    def _forward_lower(
+    def forward_lower(
         self,
         extended_coord: torch.Tensor,
         extended_atype: torch.Tensor,
@@ -97,26 +97,6 @@ def _forward_lower(
             model_predict["mask"] = model_ret["mask"]
         return model_predict
 
-    def forward_lower(
-        self,
-        extended_coord: torch.Tensor,
-        extended_atype: torch.Tensor,
-        nlist: torch.Tensor,
-        mapping: torch.Tensor | None = None,
-        fparam: torch.Tensor | None = None,
-        aparam: torch.Tensor | None = None,
-        do_atomic_virial: bool = False,
-    ) -> dict[str, torch.Tensor]:
-        return self._forward_lower(
-            extended_coord,
-            extended_atype,
-            nlist,
-            mapping,
-            fparam=fparam,
-            aparam=aparam,
-            do_atomic_virial=do_atomic_virial,
-        )
-
     def forward_lower_exportable(
         self,
         extended_coord: torch.Tensor,
@@ -127,7 +107,7 @@ def forward_lower_exportable(
         aparam: torch.Tensor | None = None,
         do_atomic_virial: bool = False,
     ) -> torch.nn.Module:
-        """Trace ``_forward_lower`` into an exportable module.
+        """Trace ``forward_lower`` into an exportable module.
 
         Uses ``make_fx`` to trace through ``torch.autograd.grad``,
         decomposing the backward pass into primitive ops.  The returned
@@ -156,7 +136,7 @@ def fn(
             aparam: torch.Tensor | None,
         ) -> dict[str, torch.Tensor]:
             extended_coord = extended_coord.detach().requires_grad_(True)
-            return model._forward_lower(
+            return model.forward_lower(
                 extended_coord,
                 extended_atype,
                 nlist,
diff --git a/deepmd/pt_expt/model/polar_model.py b/deepmd/pt_expt/model/polar_model.py
index 8644940458..337c4771cd 100644
--- a/deepmd/pt_expt/model/polar_model.py
+++ b/deepmd/pt_expt/model/polar_model.py
@@ -57,7 +57,7 @@ def forward(
             model_predict["mask"] = model_ret["mask"]
         return model_predict
 
-    def _forward_lower(
+    def forward_lower(
         self,
         extended_coord: torch.Tensor,
         extended_atype: torch.Tensor,
@@ -83,26 +83,6 @@ def _forward_lower(
             model_predict["mask"] = model_ret["mask"]
         return model_predict
 
-    def forward_lower(
-        self,
-        extended_coord: torch.Tensor,
-        extended_atype: torch.Tensor,
-        nlist: torch.Tensor,
-        mapping: torch.Tensor | None = None,
-        fparam: torch.Tensor | None = None,
-        aparam: torch.Tensor | None = None,
-        do_atomic_virial: bool = False,
-    ) -> dict[str, torch.Tensor]:
-        return self._forward_lower(
-            extended_coord,
-            extended_atype,
-            nlist,
-            mapping,
-            fparam=fparam,
-            aparam=aparam,
-            do_atomic_virial=do_atomic_virial,
-        )
-
     def forward_lower_exportable(
         self,
         extended_coord: torch.Tensor,
@@ -124,7 +104,7 @@ def fn(
             aparam: torch.Tensor | None,
         ) -> dict[str, torch.Tensor]:
             extended_coord = extended_coord.detach().requires_grad_(True)
-            return model._forward_lower(
+            return model.forward_lower(
                 extended_coord,
                 extended_atype,
                 nlist,
diff --git a/deepmd/pt_expt/model/property_model.py b/deepmd/pt_expt/model/property_model.py
index 1f78de4fdc..61d99b3840 100644
--- a/deepmd/pt_expt/model/property_model.py
+++ b/deepmd/pt_expt/model/property_model.py
@@ -62,7 +62,7 @@ def forward(
             model_predict["mask"] = model_ret["mask"]
         return model_predict
 
-    def _forward_lower(
+    def forward_lower(
         self,
         extended_coord: torch.Tensor,
         extended_atype: torch.Tensor,
@@ -89,26 +89,6 @@ def _forward_lower(
             model_predict["mask"] = model_ret["mask"]
         return model_predict
 
-    def forward_lower(
-        self,
-        extended_coord: torch.Tensor,
-        extended_atype: torch.Tensor,
-        nlist: torch.Tensor,
-        mapping: torch.Tensor | None = None,
-        fparam: torch.Tensor | None = None,
-        aparam: torch.Tensor | None = None,
-        do_atomic_virial: bool = False,
-    ) -> dict[str, torch.Tensor]:
-        return self._forward_lower(
-            extended_coord,
-            extended_atype,
-            nlist,
-            mapping,
-            fparam=fparam,
-            aparam=aparam,
-            do_atomic_virial=do_atomic_virial,
-        )
-
     def forward_lower_exportable(
         self,
         extended_coord: torch.Tensor,
@@ -130,7 +110,7 @@ def fn(
             aparam: torch.Tensor | None,
         ) -> dict[str, torch.Tensor]:
             extended_coord = extended_coord.detach().requires_grad_(True)
-            return model._forward_lower(
+            return model.forward_lower(
                 extended_coord,
                 extended_atype,
                 nlist,
diff --git a/source/tests/pt_expt/model/test_dipole_model.py b/source/tests/pt_expt/model/test_dipole_model.py
index 74752af535..4dafd9d0ae 100644
--- a/source/tests/pt_expt/model/test_dipole_model.py
+++ b/source/tests/pt_expt/model/test_dipole_model.py
@@ -135,7 +135,7 @@ def test_forward_lower_exportable(self) -> None:
         fparam = None
         aparam = None
 
-        ret_eager = md_pt._forward_lower(
+        ret_eager = md_pt.forward_lower(
             ext_coord.requires_grad_(True),
             ext_atype,
             nlist_t,
diff --git a/source/tests/pt_expt/model/test_dos_model.py b/source/tests/pt_expt/model/test_dos_model.py
index 37c8262fda..993c55972b 100644
--- a/source/tests/pt_expt/model/test_dos_model.py
+++ b/source/tests/pt_expt/model/test_dos_model.py
@@ -135,7 +135,7 @@ def test_forward_lower_exportable(self) -> None:
         fparam = None
         aparam = None
 
-        ret_eager = md_pt._forward_lower(
+        ret_eager = md_pt.forward_lower(
             ext_coord.requires_grad_(True),
             ext_atype,
             nlist_t,
diff --git a/source/tests/pt_expt/model/test_dp_zbl_model.py b/source/tests/pt_expt/model/test_dp_zbl_model.py
index 534fc01d78..1fa1d332e5 100644
--- a/source/tests/pt_expt/model/test_dp_zbl_model.py
+++ b/source/tests/pt_expt/model/test_dp_zbl_model.py
@@ -185,7 +185,7 @@ def test_forward_lower_exportable(self) -> None:
         fparam = None
         aparam = None
 
-        ret_eager = md_pt._forward_lower(
+        ret_eager = md_pt.forward_lower(
             ext_coord.requires_grad_(True),
             ext_atype,
             nlist_t,
diff --git a/source/tests/pt_expt/model/test_ener_model.py b/source/tests/pt_expt/model/test_ener_model.py
index 588b0ec2a9..f4fd9106e8 100644
--- a/source/tests/pt_expt/model/test_ener_model.py
+++ b/source/tests/pt_expt/model/test_ener_model.py
@@ -184,7 +184,7 @@ def test_forward_lower_exportable(self) -> None:
         )
 
         # --- eager reference with zero params ---
-        ret_eager_zero = md._forward_lower(
+        ret_eager_zero = md.forward_lower(
             ext_coord.requires_grad_(True),
             ext_atype,
             nlist_t,
@@ -262,7 +262,7 @@ def test_forward_lower_exportable(self) -> None:
             dtype=torch.float64,
             device=self.device,
         )
-        ret_eager_nz = md._forward_lower(
+        ret_eager_nz = md.forward_lower(
             ext_coord.requires_grad_(True),
             ext_atype,
             nlist_t,
diff --git a/source/tests/pt_expt/model/test_polar_model.py b/source/tests/pt_expt/model/test_polar_model.py
index f18b831d44..acfa929db2 100644
--- a/source/tests/pt_expt/model/test_polar_model.py
+++ b/source/tests/pt_expt/model/test_polar_model.py
@@ -135,7 +135,7 @@ def test_forward_lower_exportable(self) -> None:
         fparam = None
         aparam = None
 
-        ret_eager = md_pt._forward_lower(
+        ret_eager = md_pt.forward_lower(
             ext_coord.requires_grad_(True),
             ext_atype,
             nlist_t,
diff --git a/source/tests/pt_expt/model/test_property_model.py b/source/tests/pt_expt/model/test_property_model.py
index 27c144ef7a..12b12afea1 100644
--- a/source/tests/pt_expt/model/test_property_model.py
+++ b/source/tests/pt_expt/model/test_property_model.py
@@ -137,7 +137,7 @@ def test_forward_lower_exportable(self) -> None:
         fparam = None
         aparam = None
 
-        ret_eager = md_pt._forward_lower(
+        ret_eager = md_pt.forward_lower(
             ext_coord.requires_grad_(True),
             ext_atype,
             nlist_t,

From 0753cd715756b33925cb1207db2e002dab5e61f4 Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Sun, 22 Feb 2026 22:31:46 +0800
Subject: [PATCH 05/63] rm register_dpmodel_mapping from fitting

---
 deepmd/pt_expt/fitting/dipole_fitting.py         |  7 -------
 deepmd/pt_expt/fitting/dos_fitting.py            |  7 -------
 deepmd/pt_expt/fitting/ener_fitting.py           | 12 ------------
 deepmd/pt_expt/fitting/invar_fitting.py          |  7 -------
 deepmd/pt_expt/fitting/polarizability_fitting.py |  7 -------
 deepmd/pt_expt/fitting/property_fitting.py       |  7 -------
 6 files changed, 47 deletions(-)

diff --git a/deepmd/pt_expt/fitting/dipole_fitting.py b/deepmd/pt_expt/fitting/dipole_fitting.py
index a16a96fe72..23a10432da 100644
--- a/deepmd/pt_expt/fitting/dipole_fitting.py
+++ b/deepmd/pt_expt/fitting/dipole_fitting.py
@@ -2,7 +2,6 @@
 
 from deepmd.dpmodel.fitting.dipole_fitting import DipoleFitting as DipoleFittingDP
 from deepmd.pt_expt.common import (
-    register_dpmodel_mapping,
     torch_module,
 )
 
@@ -15,9 +14,3 @@
 @torch_module
 class DipoleFitting(DipoleFittingDP):
     pass
-
-
-register_dpmodel_mapping(
-    DipoleFittingDP,
-    lambda v: DipoleFitting.deserialize(v.serialize()),
-)
diff --git a/deepmd/pt_expt/fitting/dos_fitting.py b/deepmd/pt_expt/fitting/dos_fitting.py
index 8c51fcc0eb..c42511bfe6 100644
--- a/deepmd/pt_expt/fitting/dos_fitting.py
+++ b/deepmd/pt_expt/fitting/dos_fitting.py
@@ -2,7 +2,6 @@
 
 from deepmd.dpmodel.fitting.dos_fitting import DOSFittingNet as DOSFittingNetDP
 from deepmd.pt_expt.common import (
-    register_dpmodel_mapping,
     torch_module,
 )
 
@@ -15,9 +14,3 @@
 @torch_module
 class DOSFittingNet(DOSFittingNetDP):
     pass
-
-
-register_dpmodel_mapping(
-    DOSFittingNetDP,
-    lambda v: DOSFittingNet.deserialize(v.serialize()),
-)
diff --git a/deepmd/pt_expt/fitting/ener_fitting.py b/deepmd/pt_expt/fitting/ener_fitting.py
index f9779e44af..f778af8fec 100644
--- a/deepmd/pt_expt/fitting/ener_fitting.py
+++ b/deepmd/pt_expt/fitting/ener_fitting.py
@@ -2,7 +2,6 @@
 
 from deepmd.dpmodel.fitting.ener_fitting import EnergyFittingNet as EnergyFittingNetDP
 from deepmd.pt_expt.common import (
-    register_dpmodel_mapping,
     torch_module,
 )
 
@@ -14,15 +13,4 @@
 @BaseFitting.register("ener")
 @torch_module
 class EnergyFittingNet(EnergyFittingNetDP):
-    """Energy fitting net for pt_expt backend.
-
-    This inherits from dpmodel EnergyFittingNet to get the correct serialize() method.
-    """
-
     pass
-
-
-register_dpmodel_mapping(
-    EnergyFittingNetDP,
-    lambda v: EnergyFittingNet.deserialize(v.serialize()),
-)
diff --git a/deepmd/pt_expt/fitting/invar_fitting.py b/deepmd/pt_expt/fitting/invar_fitting.py
index ab908ebe0d..f13fe2afbb 100644
--- a/deepmd/pt_expt/fitting/invar_fitting.py
+++ b/deepmd/pt_expt/fitting/invar_fitting.py
@@ -2,7 +2,6 @@
 
 from deepmd.dpmodel.fitting.invar_fitting import InvarFitting as InvarFittingDP
 from deepmd.pt_expt.common import (
-    register_dpmodel_mapping,
     torch_module,
 )
 from deepmd.pt_expt.fitting.base_fitting import (
@@ -14,9 +13,3 @@
 @torch_module
 class InvarFitting(InvarFittingDP):
     pass
-
-
-register_dpmodel_mapping(
-    InvarFittingDP,
-    lambda v: InvarFitting.deserialize(v.serialize()),
-)
diff --git a/deepmd/pt_expt/fitting/polarizability_fitting.py b/deepmd/pt_expt/fitting/polarizability_fitting.py
index 564df7e0d7..e86b1224ef 100644
--- a/deepmd/pt_expt/fitting/polarizability_fitting.py
+++ b/deepmd/pt_expt/fitting/polarizability_fitting.py
@@ -2,7 +2,6 @@
 
 from deepmd.dpmodel.fitting.polarizability_fitting import PolarFitting as PolarFittingDP
 from deepmd.pt_expt.common import (
-    register_dpmodel_mapping,
     torch_module,
 )
 
@@ -15,9 +14,3 @@
 @torch_module
 class PolarFitting(PolarFittingDP):
     pass
-
-
-register_dpmodel_mapping(
-    PolarFittingDP,
-    lambda v: PolarFitting.deserialize(v.serialize()),
-)
diff --git a/deepmd/pt_expt/fitting/property_fitting.py b/deepmd/pt_expt/fitting/property_fitting.py
index 318e30fad6..f1bd9becbf 100644
--- a/deepmd/pt_expt/fitting/property_fitting.py
+++ b/deepmd/pt_expt/fitting/property_fitting.py
@@ -4,7 +4,6 @@
     PropertyFittingNet as PropertyFittingNetDP,
 )
 from deepmd.pt_expt.common import (
-    register_dpmodel_mapping,
     torch_module,
 )
 
@@ -17,9 +16,3 @@
 @torch_module
 class PropertyFittingNet(PropertyFittingNetDP):
     pass
-
-
-register_dpmodel_mapping(
-    PropertyFittingNetDP,
-    lambda v: PropertyFittingNet.deserialize(v.serialize()),
-)

From 6d6adfe413931294e8064b7cc4bd39e19806fd65 Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Sun, 22 Feb 2026 23:17:22 +0800
Subject: [PATCH 06/63] remove the atomic model in pt_expt. mv atomic model's
 output stat tests to dpmodel's folder.

---
 deepmd/pt_expt/atomic_model/__init__.py       |   11 -
 .../pt_expt/atomic_model/dp_atomic_model.py   |   45 -
 .../atomic_model/energy_atomic_model.py       |   27 -
 deepmd/pt_expt/model/ener_model.py            |    6 +-
 .../dpmodel}/test_atomic_model_atomic_stat.py |  852 +++++-----
 .../dpmodel}/test_atomic_model_global_stat.py | 1388 ++++++++---------
 .../atomic_model/test_dp_atomic_model.py      |  288 ----
 7 files changed, 1013 insertions(+), 1604 deletions(-)
 delete mode 100644 deepmd/pt_expt/atomic_model/dp_atomic_model.py
 delete mode 100644 deepmd/pt_expt/atomic_model/energy_atomic_model.py
 rename source/tests/{pt_expt/atomic_model => common/dpmodel}/test_atomic_model_atomic_stat.py (56%)
 rename source/tests/{pt_expt/atomic_model => common/dpmodel}/test_atomic_model_global_stat.py (64%)
 delete mode 100644 source/tests/pt_expt/atomic_model/test_dp_atomic_model.py

diff --git a/deepmd/pt_expt/atomic_model/__init__.py b/deepmd/pt_expt/atomic_model/__init__.py
index 51ee9f4186..6ceb116d85 100644
--- a/deepmd/pt_expt/atomic_model/__init__.py
+++ b/deepmd/pt_expt/atomic_model/__init__.py
@@ -1,12 +1 @@
 # SPDX-License-Identifier: LGPL-3.0-or-later
-from .dp_atomic_model import (
-    DPAtomicModel,
-)
-from .energy_atomic_model import (
-    DPEnergyAtomicModel,
-)
-
-__all__ = [
-    "DPAtomicModel",
-    "DPEnergyAtomicModel",
-]
diff --git a/deepmd/pt_expt/atomic_model/dp_atomic_model.py b/deepmd/pt_expt/atomic_model/dp_atomic_model.py
deleted file mode 100644
index b87935bd09..0000000000
--- a/deepmd/pt_expt/atomic_model/dp_atomic_model.py
+++ /dev/null
@@ -1,45 +0,0 @@
-# SPDX-License-Identifier: LGPL-3.0-or-later
-
-import torch
-
-from deepmd.dpmodel.atomic_model.dp_atomic_model import DPAtomicModel as DPAtomicModelDP
-from deepmd.pt_expt.common import (
-    register_dpmodel_mapping,
-    torch_module,
-)
-from deepmd.pt_expt.descriptor.base_descriptor import (
-    BaseDescriptor,
-)
-from deepmd.pt_expt.fitting.base_fitting import (
-    BaseFitting,
-)
-
-
-@torch_module
-class DPAtomicModel(DPAtomicModelDP):
-    base_descriptor_cls = BaseDescriptor
-    base_fitting_cls = BaseFitting
-
-    def forward(
-        self,
-        extended_coord: torch.Tensor,
-        extended_atype: torch.Tensor,
-        nlist: torch.Tensor,
-        mapping: torch.Tensor | None = None,
-        fparam: torch.Tensor | None = None,
-        aparam: torch.Tensor | None = None,
-    ) -> dict[str, torch.Tensor]:
-        return self.forward_atomic(
-            extended_coord,
-            extended_atype,
-            nlist,
-            mapping=mapping,
-            fparam=fparam,
-            aparam=aparam,
-        )
-
-
-register_dpmodel_mapping(
-    DPAtomicModelDP,
-    lambda v: DPAtomicModel.deserialize(v.serialize()),
-)
diff --git a/deepmd/pt_expt/atomic_model/energy_atomic_model.py b/deepmd/pt_expt/atomic_model/energy_atomic_model.py
deleted file mode 100644
index 5f34d215cf..0000000000
--- a/deepmd/pt_expt/atomic_model/energy_atomic_model.py
+++ /dev/null
@@ -1,27 +0,0 @@
-# SPDX-License-Identifier: LGPL-3.0-or-later
-from deepmd.dpmodel.atomic_model.energy_atomic_model import (
-    DPEnergyAtomicModel as DPEnergyAtomicModelDP,
-)
-from deepmd.pt_expt.common import (
-    register_dpmodel_mapping,
-)
-
-from .dp_atomic_model import (
-    DPAtomicModel,
-)
-
-
-class DPEnergyAtomicModel(DPAtomicModel):
-    """Energy atomic model for pt_expt backend.
-
-    This is a thin wrapper around DPAtomicModel that validates
-    the fitting is an EnergyFittingNet or InvarFitting.
-    """
-
-    pass
-
-
-register_dpmodel_mapping(
-    DPEnergyAtomicModelDP,
-    lambda v: DPEnergyAtomicModel.deserialize(v.serialize()),
-)
diff --git a/deepmd/pt_expt/model/ener_model.py b/deepmd/pt_expt/model/ener_model.py
index fa07f3e3b2..0e5e81aebb 100644
--- a/deepmd/pt_expt/model/ener_model.py
+++ b/deepmd/pt_expt/model/ener_model.py
@@ -8,12 +8,12 @@
     make_fx,
 )
 
+from deepmd.dpmodel.atomic_model import (
+    DPEnergyAtomicModel,
+)
 from deepmd.dpmodel.model.dp_model import (
     DPModelCommon,
 )
-from deepmd.pt_expt.atomic_model import (
-    DPEnergyAtomicModel,
-)
 
 from .make_model import (
     make_model,
diff --git a/source/tests/pt_expt/atomic_model/test_atomic_model_atomic_stat.py b/source/tests/common/dpmodel/test_atomic_model_atomic_stat.py
similarity index 56%
rename from source/tests/pt_expt/atomic_model/test_atomic_model_atomic_stat.py
rename to source/tests/common/dpmodel/test_atomic_model_atomic_stat.py
index c393ad4b3b..572c4aa696 100644
--- a/source/tests/pt_expt/atomic_model/test_atomic_model_atomic_stat.py
+++ b/source/tests/common/dpmodel/test_atomic_model_atomic_stat.py
@@ -1,471 +1,381 @@
-# SPDX-License-Identifier: LGPL-3.0-or-later
-import tempfile
-import unittest
-from pathlib import (
-    Path,
-)
-from typing import (
-    NoReturn,
-)
-
-import h5py
-import numpy as np
-import torch
-
-from deepmd.dpmodel.output_def import (
-    FittingOutputDef,
-    OutputVariableDef,
-)
-from deepmd.pt_expt.atomic_model import (
-    DPAtomicModel,
-)
-from deepmd.pt_expt.descriptor.se_e2_a import (
-    DescrptSeA,
-)
-from deepmd.pt_expt.fitting.base_fitting import (
-    BaseFitting,
-)
-from deepmd.pt_expt.utils import (
-    env,
-)
-from deepmd.utils.path import (
-    DPPath,
-)
-
-from ...pt.model.test_env_mat import (
-    TestCaseSingleFrameWithNlist,
-)
-
-
-class FooFitting(BaseFitting, torch.nn.Module):
-    """Test fitting that returns fixed values for testing bias computation."""
-
-    def __init__(self):
-        torch.nn.Module.__init__(self)
-        BaseFitting.__init__(self)
-
-    def output_def(self):
-        return FittingOutputDef(
-            [
-                OutputVariableDef(
-                    "foo",
-                    [1],
-                    reducible=True,
-                    r_differentiable=True,
-                    c_differentiable=True,
-                ),
-                OutputVariableDef(
-                    "bar",
-                    [1, 2],
-                    reducible=True,
-                    r_differentiable=True,
-                    c_differentiable=True,
-                ),
-            ]
-        )
-
-    def serialize(self) -> dict:
-        return {
-            "@class": "Fitting",
-            "type": "foo",
-            "@version": 1,
-        }
-
-    @classmethod
-    def deserialize(cls, data: dict):
-        return cls()
-
-    def get_dim_fparam(self) -> int:
-        return 0
-
-    def get_dim_aparam(self) -> int:
-        return 0
-
-    def get_sel_type(self) -> list[int]:
-        return []
-
-    def change_type_map(
-        self, type_map: list[str], model_with_new_type_stat=None
-    ) -> None:
-        pass
-
-    def get_type_map(self) -> list[str]:
-        return []
-
-    def forward(
-        self,
-        descriptor: torch.Tensor,
-        atype: torch.Tensor,
-        gr: torch.Tensor | None = None,
-        g2: torch.Tensor | None = None,
-        h2: torch.Tensor | None = None,
-        fparam: torch.Tensor | None = None,
-        aparam: torch.Tensor | None = None,
-    ):
-        nf, nloc, _ = descriptor.shape
-        ret = {}
-        ret["foo"] = (
-            torch.Tensor(
-                [
-                    [1.0, 2.0, 3.0],
-                    [4.0, 5.0, 6.0],
-                ]
-            )
-            .view([nf, nloc, *self.output_def()["foo"].shape])
-            .to(dtype=torch.float64, device=env.DEVICE)
-        )
-        ret["bar"] = (
-            torch.Tensor(
-                [
-                    [1.0, 2.0, 3.0, 7.0, 8.0, 9.0],
-                    [4.0, 5.0, 6.0, 10.0, 11.0, 12.0],
-                ]
-            )
-            .view([nf, nloc, *self.output_def()["bar"].shape])
-            .to(dtype=torch.float64, device=env.DEVICE)
-        )
-        return ret
-
-
-class TestAtomicModelStat(unittest.TestCase, TestCaseSingleFrameWithNlist):
-    def tearDown(self) -> None:
-        self.tempdir.cleanup()
-
-    def setUp(self) -> None:
-        TestCaseSingleFrameWithNlist.setUp(self)
-        self.device = env.DEVICE
-        self.merged_output_stat = [
-            {
-                "coord": torch.tensor(np.zeros([2, 3, 3]), device=self.device),
-                "atype": torch.tensor(
-                    np.array([[0, 0, 1], [0, 1, 1]], dtype=np.int32), device=self.device
-                ),
-                "atype_ext": torch.tensor(
-                    np.array([[0, 0, 1, 0], [0, 1, 1, 0]], dtype=np.int32),
-                    device=self.device,
-                ),
-                "box": torch.tensor(np.zeros([2, 3, 3]), device=self.device),
-                "natoms": torch.tensor(
-                    np.array([[3, 3, 2, 1], [3, 3, 1, 2]], dtype=np.int32),
-                    device=self.device,
-                ),
-                # bias of foo: 5, 6
-                "atom_foo": torch.tensor(
-                    np.array([[5.0, 5.0, 5.0], [5.0, 6.0, 7.0]]).reshape(2, 3, 1),
-                    device=self.device,
-                ),
-                # bias of bar: [1, 5], [3, 2]
-                "bar": torch.tensor(
-                    np.array([5.0, 12.0, 7.0, 9.0]).reshape(2, 1, 2), device=self.device
-                ),
-                "find_atom_foo": np.float32(1.0),
-                "find_bar": np.float32(1.0),
-            },
-            {
-                "coord": torch.tensor(np.zeros([2, 3, 3]), device=self.device),
-                "atype": torch.tensor(
-                    np.array([[0, 0, 1], [0, 1, 1]], dtype=np.int32), device=self.device
-                ),
-                "atype_ext": torch.tensor(
-                    np.array([[0, 0, 1, 0], [0, 1, 1, 0]], dtype=np.int32),
-                    device=self.device,
-                ),
-                "box": torch.tensor(np.zeros([2, 3, 3]), device=self.device),
-                "natoms": torch.tensor(
-                    np.array([[3, 3, 2, 1], [3, 3, 1, 2]], dtype=np.int32),
-                    device=self.device,
-                ),
-                # bias of foo: 5, 6 from atomic label.
-                "foo": torch.tensor(
-                    np.array([5.0, 7.0]).reshape(2, 1), device=self.device
-                ),
-                # bias of bar: [1, 5], [3, 2]
-                "bar": torch.tensor(
-                    np.array([5.0, 12.0, 7.0, 9.0]).reshape(2, 1, 2), device=self.device
-                ),
-                "find_foo": np.float32(1.0),
-                "find_bar": np.float32(1.0),
-            },
-        ]
-        self.tempdir = tempfile.TemporaryDirectory()
-        h5file = str((Path(self.tempdir.name) / "testcase.h5").resolve())
-        with h5py.File(h5file, "w") as f:
-            pass
-        self.stat_file_path = DPPath(h5file, "a")
-
-    def test_output_stat(self) -> None:
-        """Test output statistics computation for pt_expt atomic model."""
-        nf, nloc, nnei = self.nlist.shape
-        ds = DescrptSeA(
-            self.rcut,
-            self.rcut_smth,
-            self.sel,
-        ).to(self.device)
-        ft = FooFitting().to(self.device)
-        type_map = ["foo", "bar"]
-        md0 = DPAtomicModel(
-            ds,
-            ft,
-            type_map=type_map,
-        ).to(self.device)
-        args = [
-            torch.tensor(self.coord_ext, dtype=torch.float64, device=self.device),
-            torch.tensor(self.atype_ext, dtype=torch.int64, device=self.device),
-            torch.tensor(self.nlist, dtype=torch.int64, device=self.device),
-        ]
-        # nf x nloc
-        at = self.atype_ext[:, :nloc]
-
-        def cvt_ret(x):
-            return {kk: vv.detach().cpu().numpy() for kk, vv in x.items()}
-
-        # 1. test run without bias
-        # nf x na x odim
-        ret0 = md0.forward_common_atomic(*args)
-        ret0 = cvt_ret(ret0)
-        expected_ret0 = {}
-        expected_ret0["foo"] = np.array(
-            [
-                [1.0, 2.0, 3.0],
-                [4.0, 5.0, 6.0],
-            ]
-        ).reshape([nf, nloc, *md0.fitting_output_def()["foo"].shape])
-        expected_ret0["bar"] = np.array(
-            [
-                [1.0, 2.0, 3.0, 7.0, 8.0, 9.0],
-                [4.0, 5.0, 6.0, 10.0, 11.0, 12.0],
-            ]
-        ).reshape([nf, nloc, *md0.fitting_output_def()["bar"].shape])
-        for kk in ["foo", "bar"]:
-            np.testing.assert_almost_equal(ret0[kk], expected_ret0[kk])
-
-        # 2. test bias is applied
-        md0.compute_or_load_out_stat(
-            self.merged_output_stat, stat_file_path=self.stat_file_path
-        )
-        ret1 = md0.forward_common_atomic(*args)
-        expected_std = np.ones(
-            (2, 2, 2), dtype=np.float64
-        )  # 2 keys, 2 atypes, 2 max dims.
-        expected_std[0, :, :1] = np.array([0.0, 0.816496]).reshape(
-            2, 1
-        )  # updating std for foo based on [5.0, 5.0, 5.0], [5.0, 6.0, 7.0]]
-        np.testing.assert_almost_equal(
-            md0.out_std.detach().cpu().numpy(), expected_std, decimal=4
-        )
-        ret1 = cvt_ret(ret1)
-        # nt x odim
-        foo_bias = np.array([5.0, 6.0]).reshape(2, 1)
-        bar_bias = np.array([1.0, 5.0, 3.0, 2.0]).reshape(2, 1, 2)
-        expected_ret1 = {}
-        expected_ret1["foo"] = ret0["foo"] + foo_bias[at]
-        expected_ret1["bar"] = ret0["bar"] + bar_bias[at]
-        for kk in ["foo", "bar"]:
-            np.testing.assert_almost_equal(ret1[kk], expected_ret1[kk])
-
-        # 3. test bias load from file
-        def raise_error() -> NoReturn:
-            raise RuntimeError
-
-        md0.compute_or_load_out_stat(raise_error, stat_file_path=self.stat_file_path)
-        ret2 = md0.forward_common_atomic(*args)
-        ret2 = cvt_ret(ret2)
-        for kk in ["foo", "bar"]:
-            np.testing.assert_almost_equal(ret1[kk], ret2[kk])
-        np.testing.assert_almost_equal(
-            md0.out_std.detach().cpu().numpy(), expected_std, decimal=4
-        )
-
-        # 4. test change bias
-        md0.change_out_bias(
-            self.merged_output_stat, bias_adjust_mode="change-by-statistic"
-        )
-        # use atype_ext from merged_output_stat for inference (matching pt backend test)
-        args = [
-            torch.tensor(self.coord_ext, dtype=torch.float64, device=self.device),
-            self.merged_output_stat[0]["atype_ext"].to(
-                dtype=torch.int64, device=self.device
-            ),
-            torch.tensor(self.nlist, dtype=torch.int64, device=self.device),
-        ]
-        ret3 = md0.forward_common_atomic(*args)
-        ret3 = cvt_ret(ret3)
-        expected_std[0, :, :1] = np.array([1.24722, 0.47140]).reshape(
-            2, 1
-        )  # updating std for foo based on [4.0, 3.0, 2.0], [1.0, 1.0, 1.0]]
-        expected_ret3 = {}
-        # new bias [2.666, 1.333]
-        expected_ret3["foo"] = np.array(
-            [[3.6667, 4.6667, 4.3333], [6.6667, 6.3333, 7.3333]]
-        ).reshape(2, 3, 1)
-        for kk in ["foo"]:
-            np.testing.assert_almost_equal(ret3[kk], expected_ret3[kk], decimal=4)
-        np.testing.assert_almost_equal(
-            md0.out_std.detach().cpu().numpy(), expected_std, decimal=4
-        )
-
-
-class TestAtomicModelStatMergeGlobalAtomic(
-    unittest.TestCase, TestCaseSingleFrameWithNlist
-):
-    """Test merging atomic and global stat when atomic label only covers some types."""
-
-    def tearDown(self) -> None:
-        self.tempdir.cleanup()
-
-    def setUp(self) -> None:
-        TestCaseSingleFrameWithNlist.setUp(self)
-        self.device = env.DEVICE
-        self.merged_output_stat = [
-            {
-                "coord": torch.tensor(np.zeros([2, 3, 3]), device=self.device),
-                "atype": torch.tensor(
-                    np.array([[0, 0, 0], [0, 0, 0]], dtype=np.int32),
-                    device=self.device,
-                ),
-                "atype_ext": torch.tensor(
-                    np.array([[0, 0, 1, 0], [0, 1, 1, 0]], dtype=np.int32),
-                    device=self.device,
-                ),
-                "box": torch.tensor(np.zeros([2, 3, 3]), device=self.device),
-                "natoms": torch.tensor(
-                    np.array([[3, 3, 2, 1], [3, 3, 1, 2]], dtype=np.int32),
-                    device=self.device,
-                ),
-                # bias of foo: 5.5, nan (only type 0 atoms)
-                "atom_foo": torch.tensor(
-                    np.array([[5.0, 5.0, 5.0], [5.0, 6.0, 7.0]]).reshape(2, 3, 1),
-                    device=self.device,
-                ),
-                # bias of bar: [1, 5], [3, 2]
-                "bar": torch.tensor(
-                    np.array([5.0, 12.0, 7.0, 9.0]).reshape(2, 1, 2),
-                    device=self.device,
-                ),
-                "find_atom_foo": np.float32(1.0),
-                "find_bar": np.float32(1.0),
-            },
-            {
-                "coord": torch.tensor(np.zeros([2, 3, 3]), device=self.device),
-                "atype": torch.tensor(
-                    np.array([[0, 0, 1], [0, 1, 1]], dtype=np.int32),
-                    device=self.device,
-                ),
-                "atype_ext": torch.tensor(
-                    np.array([[0, 0, 1, 0], [0, 1, 1, 0]], dtype=np.int32),
-                    device=self.device,
-                ),
-                "box": torch.tensor(np.zeros([2, 3, 3]), device=self.device),
-                "natoms": torch.tensor(
-                    np.array([[3, 3, 2, 1], [3, 3, 1, 2]], dtype=np.int32),
-                    device=self.device,
-                ),
-                # bias of foo: 5.5, 3 from global label.
-                "foo": torch.tensor(
-                    np.array([5.0, 7.0]).reshape(2, 1), device=self.device
-                ),
-                # bias of bar: [1, 5], [3, 2]
-                "bar": torch.tensor(
-                    np.array([5.0, 12.0, 7.0, 9.0]).reshape(2, 1, 2),
-                    device=self.device,
-                ),
-                "find_foo": np.float32(1.0),
-                "find_bar": np.float32(1.0),
-            },
-        ]
-        self.tempdir = tempfile.TemporaryDirectory()
-        h5file = str((Path(self.tempdir.name) / "testcase.h5").resolve())
-        with h5py.File(h5file, "w") as f:
-            pass
-        self.stat_file_path = DPPath(h5file, "a")
-
-    def test_output_stat(self) -> None:
-        """Test merging atomic (type 0 only) and global stat for type 1."""
-        nf, nloc, nnei = self.nlist.shape
-        ds = DescrptSeA(
-            self.rcut,
-            self.rcut_smth,
-            self.sel,
-        ).to(self.device)
-        ft = FooFitting().to(self.device)
-        type_map = ["foo", "bar"]
-        md0 = DPAtomicModel(
-            ds,
-            ft,
-            type_map=type_map,
-        ).to(self.device)
-        args = [
-            torch.tensor(self.coord_ext, dtype=torch.float64, device=self.device),
-            torch.tensor(self.atype_ext, dtype=torch.int64, device=self.device),
-            torch.tensor(self.nlist, dtype=torch.int64, device=self.device),
-        ]
-        # nf x nloc
-        at = self.atype_ext[:, :nloc]
-
-        def cvt_ret(x):
-            return {kk: vv.detach().cpu().numpy() for kk, vv in x.items()}
-
-        # 1. test run without bias
-        ret0 = md0.forward_common_atomic(*args)
-        ret0 = cvt_ret(ret0)
-        expected_ret0 = {}
-        expected_ret0["foo"] = np.array(
-            [
-                [1.0, 2.0, 3.0],
-                [4.0, 5.0, 6.0],
-            ]
-        ).reshape([nf, nloc, *md0.fitting_output_def()["foo"].shape])
-        expected_ret0["bar"] = np.array(
-            [
-                [1.0, 2.0, 3.0, 7.0, 8.0, 9.0],
-                [4.0, 5.0, 6.0, 10.0, 11.0, 12.0],
-            ]
-        ).reshape([nf, nloc, *md0.fitting_output_def()["bar"].shape])
-        for kk in ["foo", "bar"]:
-            np.testing.assert_almost_equal(ret0[kk], expected_ret0[kk])
-
-        # 2. test bias is applied
-        # foo: type 0 from atomic (mean=5.5), type 1 from global (lstsq=3.0)
-        md0.compute_or_load_out_stat(
-            self.merged_output_stat, stat_file_path=self.stat_file_path
-        )
-        ret1 = md0.forward_common_atomic(*args)
-        ret1 = cvt_ret(ret1)
-        # nt x odim
-        foo_bias = np.array([5.5, 3.0]).reshape(2, 1)
-        bar_bias = np.array([1.0, 5.0, 3.0, 2.0]).reshape(2, 1, 2)
-        expected_ret1 = {}
-        expected_ret1["foo"] = ret0["foo"] + foo_bias[at]
-        expected_ret1["bar"] = ret0["bar"] + bar_bias[at]
-        for kk in ["foo", "bar"]:
-            np.testing.assert_almost_equal(ret1[kk], expected_ret1[kk])
-
-        # 3. test bias load from file
-        def raise_error() -> NoReturn:
-            raise RuntimeError
-
-        md0.compute_or_load_out_stat(raise_error, stat_file_path=self.stat_file_path)
-        ret2 = md0.forward_common_atomic(*args)
-        ret2 = cvt_ret(ret2)
-        for kk in ["foo", "bar"]:
-            np.testing.assert_almost_equal(ret1[kk], ret2[kk])
-
-        # 4. test change bias
-        md0.change_out_bias(
-            self.merged_output_stat, bias_adjust_mode="change-by-statistic"
-        )
-        # use atype_ext from merged_output_stat for inference
-        args = [
-            torch.tensor(self.coord_ext, dtype=torch.float64, device=self.device),
-            self.merged_output_stat[0]["atype_ext"].to(
-                dtype=torch.int64, device=self.device
-            ),
-            torch.tensor(self.nlist, dtype=torch.int64, device=self.device),
-        ]
-        ret3 = md0.forward_common_atomic(*args)
-        ret3 = cvt_ret(ret3)
-        expected_ret3 = {}
-        # new bias [2, -5]
-        expected_ret3["foo"] = np.array([[3, 4, -2], [6, 0, 1]]).reshape(2, 3, 1)
-        for kk in ["foo"]:
-            np.testing.assert_almost_equal(ret3[kk], expected_ret3[kk], decimal=4)
+# SPDX-License-Identifier: LGPL-3.0-or-later
+import tempfile
+import unittest
+from pathlib import (
+    Path,
+)
+from typing import (
+    NoReturn,
+)
+
+import h5py
+import numpy as np
+
+from deepmd.dpmodel.atomic_model import (
+    DPAtomicModel,
+)
+from deepmd.dpmodel.common import (
+    NativeOP,
+)
+from deepmd.dpmodel.descriptor import (
+    DescrptSeA,
+)
+from deepmd.dpmodel.fitting.base_fitting import (
+    BaseFitting,
+)
+from deepmd.dpmodel.output_def import (
+    FittingOutputDef,
+    OutputVariableDef,
+)
+from deepmd.utils.path import (
+    DPPath,
+)
+
+from .case_single_frame_with_nlist import (
+    TestCaseSingleFrameWithNlist,
+)
+
+
+class FooFitting(NativeOP, BaseFitting):
+    """Test fitting that returns fixed values for testing bias computation."""
+
+    def __init__(self):
+        pass
+
+    def output_def(self):
+        return FittingOutputDef(
+            [
+                OutputVariableDef(
+                    "foo",
+                    [1],
+                    reducible=True,
+                    r_differentiable=True,
+                    c_differentiable=True,
+                ),
+                OutputVariableDef(
+                    "bar",
+                    [1, 2],
+                    reducible=True,
+                    r_differentiable=True,
+                    c_differentiable=True,
+                ),
+            ]
+        )
+
+    def serialize(self) -> dict:
+        return {
+            "@class": "Fitting",
+            "type": "foo",
+            "@version": 1,
+        }
+
+    @classmethod
+    def deserialize(cls, data: dict):
+        return cls()
+
+    def get_dim_fparam(self) -> int:
+        return 0
+
+    def get_dim_aparam(self) -> int:
+        return 0
+
+    def get_sel_type(self) -> list[int]:
+        return []
+
+    def change_type_map(
+        self, type_map: list[str], model_with_new_type_stat=None
+    ) -> None:
+        pass
+
+    def get_type_map(self) -> list[str]:
+        return []
+
+    def call(
+        self,
+        descriptor,
+        atype,
+        gr=None,
+        g2=None,
+        h2=None,
+        fparam=None,
+        aparam=None,
+    ):
+        nf, nloc, _ = descriptor.shape
+        ret = {}
+        ret["foo"] = np.array(
+            [
+                [1.0, 2.0, 3.0],
+                [4.0, 5.0, 6.0],
+            ]
+        ).reshape([nf, nloc, *self.output_def()["foo"].shape])
+        ret["bar"] = np.array(
+            [
+                [1.0, 2.0, 3.0, 7.0, 8.0, 9.0],
+                [4.0, 5.0, 6.0, 10.0, 11.0, 12.0],
+            ]
+        ).reshape([nf, nloc, *self.output_def()["bar"].shape])
+        return ret
+
+
+class TestAtomicModelStat(unittest.TestCase, TestCaseSingleFrameWithNlist):
+    def tearDown(self) -> None:
+        self.tempdir.cleanup()
+
+    def setUp(self) -> None:
+        TestCaseSingleFrameWithNlist.setUp(self)
+        self.merged_output_stat = [
+            {
+                "coord": np.zeros([2, 3, 3]),
+                "atype": np.array([[0, 0, 1], [0, 1, 1]], dtype=np.int32),
+                "atype_ext": np.array([[0, 0, 1, 0], [0, 1, 1, 0]], dtype=np.int32),
+                "box": np.zeros([2, 3, 3]),
+                "natoms": np.array([[3, 3, 2, 1], [3, 3, 1, 2]], dtype=np.int32),
+                # bias of foo: 5, 6
+                "atom_foo": np.array([[5.0, 5.0, 5.0], [5.0, 6.0, 7.0]]).reshape(
+                    2, 3, 1
+                ),
+                # bias of bar: [1, 5], [3, 2]
+                "bar": np.array([5.0, 12.0, 7.0, 9.0]).reshape(2, 1, 2),
+                "find_atom_foo": np.float32(1.0),
+                "find_bar": np.float32(1.0),
+            },
+            {
+                "coord": np.zeros([2, 3, 3]),
+                "atype": np.array([[0, 0, 1], [0, 1, 1]], dtype=np.int32),
+                "atype_ext": np.array([[0, 0, 1, 0], [0, 1, 1, 0]], dtype=np.int32),
+                "box": np.zeros([2, 3, 3]),
+                "natoms": np.array([[3, 3, 2, 1], [3, 3, 1, 2]], dtype=np.int32),
+                # bias of foo: 5.5, 3 from global label.
+                "foo": np.array([5.0, 7.0]).reshape(2, 1),
+                # bias of bar: [1, 5], [3, 2]
+                "bar": np.array([5.0, 12.0, 7.0, 9.0]).reshape(2, 1, 2),
+                "find_foo": np.float32(1.0),
+                "find_bar": np.float32(1.0),
+            },
+        ]
+        self.tempdir = tempfile.TemporaryDirectory()
+        h5file = str((Path(self.tempdir.name) / "testcase.h5").resolve())
+        with h5py.File(h5file, "w") as f:
+            pass
+        self.stat_file_path = DPPath(h5file, "a")
+
+    def test_output_stat(self) -> None:
+        """Test output statistics computation for dpmodel atomic model."""
+        nf, nloc, nnei = self.nlist.shape
+        ds = DescrptSeA(
+            self.rcut,
+            self.rcut_smth,
+            self.sel,
+        )
+        ft = FooFitting()
+        type_map = ["foo", "bar"]
+        md0 = DPAtomicModel(
+            ds,
+            ft,
+            type_map=type_map,
+        )
+        args = [self.coord_ext, self.atype_ext, self.nlist]
+        # nf x nloc
+        at = self.atype_ext[:, :nloc]
+
+        # 1. test run without bias
+        # nf x na x odim
+        ret0 = md0.forward_common_atomic(*args)
+        expected_ret0 = {}
+        expected_ret0["foo"] = np.array(
+            [
+                [1.0, 2.0, 3.0],
+                [4.0, 5.0, 6.0],
+            ]
+        ).reshape([nf, nloc, *md0.fitting_output_def()["foo"].shape])
+        expected_ret0["bar"] = np.array(
+            [
+                [1.0, 2.0, 3.0, 7.0, 8.0, 9.0],
+                [4.0, 5.0, 6.0, 10.0, 11.0, 12.0],
+            ]
+        ).reshape([nf, nloc, *md0.fitting_output_def()["bar"].shape])
+        for kk in ["foo", "bar"]:
+            np.testing.assert_almost_equal(ret0[kk], expected_ret0[kk])
+
+        # 2. test bias is applied
+        md0.compute_or_load_out_stat(
+            self.merged_output_stat, stat_file_path=self.stat_file_path
+        )
+        ret1 = md0.forward_common_atomic(*args)
+        expected_std = np.ones(
+            (2, 2, 2), dtype=np.float64
+        )  # 2 keys, 2 atypes, 2 max dims.
+        expected_std[0, :, :1] = np.array([0.0, 0.816496]).reshape(
+            2, 1
+        )  # updating std for foo based on [5.0, 5.0, 5.0], [5.0, 6.0, 7.0]]
+        np.testing.assert_almost_equal(md0.out_std, expected_std, decimal=4)
+        # nt x odim
+        foo_bias = np.array([5.0, 6.0]).reshape(2, 1)
+        bar_bias = np.array([1.0, 5.0, 3.0, 2.0]).reshape(2, 1, 2)
+        expected_ret1 = {}
+        expected_ret1["foo"] = ret0["foo"] + foo_bias[at]
+        expected_ret1["bar"] = ret0["bar"] + bar_bias[at]
+        for kk in ["foo", "bar"]:
+            np.testing.assert_almost_equal(ret1[kk], expected_ret1[kk])
+
+        # 3. test bias load from file
+        def raise_error() -> NoReturn:
+            raise RuntimeError
+
+        md0.compute_or_load_out_stat(raise_error, stat_file_path=self.stat_file_path)
+        ret2 = md0.forward_common_atomic(*args)
+        for kk in ["foo", "bar"]:
+            np.testing.assert_almost_equal(ret1[kk], ret2[kk])
+        np.testing.assert_almost_equal(md0.out_std, expected_std, decimal=4)
+
+        # 4. test change bias
+        md0.change_out_bias(
+            self.merged_output_stat, bias_adjust_mode="change-by-statistic"
+        )
+        # use atype_ext from merged_output_stat for inference (matching pt backend test)
+        args = [
+            self.coord_ext,
+            np.array(self.merged_output_stat[0]["atype_ext"], dtype=np.int64),
+            self.nlist,
+        ]
+        ret3 = md0.forward_common_atomic(*args)
+        expected_std[0, :, :1] = np.array([1.24722, 0.47140]).reshape(
+            2, 1
+        )  # updating std for foo based on [4.0, 3.0, 2.0], [1.0, 1.0, 1.0]]
+        expected_ret3 = {}
+        # new bias [2.666, 1.333]
+        expected_ret3["foo"] = np.array(
+            [[3.6667, 4.6667, 4.3333], [6.6667, 6.3333, 7.3333]]
+        ).reshape(2, 3, 1)
+        for kk in ["foo"]:
+            np.testing.assert_almost_equal(ret3[kk], expected_ret3[kk], decimal=4)
+        np.testing.assert_almost_equal(md0.out_std, expected_std, decimal=4)
+
+
+class TestAtomicModelStatMergeGlobalAtomic(
+    unittest.TestCase, TestCaseSingleFrameWithNlist
+):
+    """Test merging atomic and global stat when atomic label only covers some types."""
+
+    def tearDown(self) -> None:
+        self.tempdir.cleanup()
+
+    def setUp(self) -> None:
+        TestCaseSingleFrameWithNlist.setUp(self)
+        self.merged_output_stat = [
+            {
+                "coord": np.zeros([2, 3, 3]),
+                "atype": np.array([[0, 0, 0], [0, 0, 0]], dtype=np.int32),
+                "atype_ext": np.array([[0, 0, 1, 0], [0, 1, 1, 0]], dtype=np.int32),
+                "box": np.zeros([2, 3, 3]),
+                "natoms": np.array([[3, 3, 2, 1], [3, 3, 1, 2]], dtype=np.int32),
+                # bias of foo: 5.5, nan (only type 0 atoms)
+                "atom_foo": np.array([[5.0, 5.0, 5.0], [5.0, 6.0, 7.0]]).reshape(
+                    2, 3, 1
+                ),
+                # bias of bar: [1, 5], [3, 2]
+                "bar": np.array([5.0, 12.0, 7.0, 9.0]).reshape(2, 1, 2),
+                "find_atom_foo": np.float32(1.0),
+                "find_bar": np.float32(1.0),
+            },
+            {
+                "coord": np.zeros([2, 3, 3]),
+                "atype": np.array([[0, 0, 1], [0, 1, 1]], dtype=np.int32),
+                "atype_ext": np.array([[0, 0, 1, 0], [0, 1, 1, 0]], dtype=np.int32),
+                "box": np.zeros([2, 3, 3]),
+                "natoms": np.array([[3, 3, 2, 1], [3, 3, 1, 2]], dtype=np.int32),
+                # bias of foo: 5.5, 3 from global label.
+                "foo": np.array([5.0, 7.0]).reshape(2, 1),
+                # bias of bar: [1, 5], [3, 2]
+                "bar": np.array([5.0, 12.0, 7.0, 9.0]).reshape(2, 1, 2),
+                "find_foo": np.float32(1.0),
+                "find_bar": np.float32(1.0),
+            },
+        ]
+        self.tempdir = tempfile.TemporaryDirectory()
+        h5file = str((Path(self.tempdir.name) / "testcase.h5").resolve())
+        with h5py.File(h5file, "w") as f:
+            pass
+        self.stat_file_path = DPPath(h5file, "a")
+
+    def test_output_stat(self) -> None:
+        """Test merging atomic (type 0 only) and global stat for type 1."""
+        nf, nloc, nnei = self.nlist.shape
+        ds = DescrptSeA(
+            self.rcut,
+            self.rcut_smth,
+            self.sel,
+        )
+        ft = FooFitting()
+        type_map = ["foo", "bar"]
+        md0 = DPAtomicModel(
+            ds,
+            ft,
+            type_map=type_map,
+        )
+        args = [self.coord_ext, self.atype_ext, self.nlist]
+        # nf x nloc
+        at = self.atype_ext[:, :nloc]
+
+        # 1. test run without bias
+        ret0 = md0.forward_common_atomic(*args)
+        expected_ret0 = {}
+        expected_ret0["foo"] = np.array(
+            [
+                [1.0, 2.0, 3.0],
+                [4.0, 5.0, 6.0],
+            ]
+        ).reshape([nf, nloc, *md0.fitting_output_def()["foo"].shape])
+        expected_ret0["bar"] = np.array(
+            [
+                [1.0, 2.0, 3.0, 7.0, 8.0, 9.0],
+                [4.0, 5.0, 6.0, 10.0, 11.0, 12.0],
+            ]
+        ).reshape([nf, nloc, *md0.fitting_output_def()["bar"].shape])
+        for kk in ["foo", "bar"]:
+            np.testing.assert_almost_equal(ret0[kk], expected_ret0[kk])
+
+        # 2. test bias is applied
+        # foo: type 0 from atomic (mean=5.5), type 1 from global (lstsq=3.0)
+        md0.compute_or_load_out_stat(
+            self.merged_output_stat, stat_file_path=self.stat_file_path
+        )
+        ret1 = md0.forward_common_atomic(*args)
+        # nt x odim
+        foo_bias = np.array([5.5, 3.0]).reshape(2, 1)
+        bar_bias = np.array([1.0, 5.0, 3.0, 2.0]).reshape(2, 1, 2)
+        expected_ret1 = {}
+        expected_ret1["foo"] = ret0["foo"] + foo_bias[at]
+        expected_ret1["bar"] = ret0["bar"] + bar_bias[at]
+        for kk in ["foo", "bar"]:
+            np.testing.assert_almost_equal(ret1[kk], expected_ret1[kk])
+
+        # 3. test bias load from file
+        def raise_error() -> NoReturn:
+            raise RuntimeError
+
+        md0.compute_or_load_out_stat(raise_error, stat_file_path=self.stat_file_path)
+        ret2 = md0.forward_common_atomic(*args)
+        for kk in ["foo", "bar"]:
+            np.testing.assert_almost_equal(ret1[kk], ret2[kk])
+
+        # 4. test change bias
+        md0.change_out_bias(
+            self.merged_output_stat, bias_adjust_mode="change-by-statistic"
+        )
+        # use atype_ext from merged_output_stat for inference
+        args = [
+            self.coord_ext,
+            np.array(self.merged_output_stat[0]["atype_ext"], dtype=np.int64),
+            self.nlist,
+        ]
+        ret3 = md0.forward_common_atomic(*args)
+        expected_ret3 = {}
+        # new bias [2, -5]
+        expected_ret3["foo"] = np.array([[3, 4, -2], [6, 0, 1]]).reshape(2, 3, 1)
+        for kk in ["foo"]:
+            np.testing.assert_almost_equal(ret3[kk], expected_ret3[kk], decimal=4)
+
+
+if __name__ == "__main__":
+    unittest.main()
diff --git a/source/tests/pt_expt/atomic_model/test_atomic_model_global_stat.py b/source/tests/common/dpmodel/test_atomic_model_global_stat.py
similarity index 64%
rename from source/tests/pt_expt/atomic_model/test_atomic_model_global_stat.py
rename to source/tests/common/dpmodel/test_atomic_model_global_stat.py
index e09e7c0c91..88470a57c9 100644
--- a/source/tests/pt_expt/atomic_model/test_atomic_model_global_stat.py
+++ b/source/tests/common/dpmodel/test_atomic_model_global_stat.py
@@ -1,759 +1,629 @@
-# SPDX-License-Identifier: LGPL-3.0-or-later
-import tempfile
-import unittest
-from pathlib import (
-    Path,
-)
-from typing import (
-    NoReturn,
-)
-
-import h5py
-import numpy as np
-import torch
-
-from deepmd.dpmodel.atomic_model import DPAtomicModel as DPDPAtomicModel
-from deepmd.dpmodel.output_def import (
-    FittingOutputDef,
-    OutputVariableDef,
-)
-from deepmd.pt_expt.atomic_model import (
-    DPAtomicModel,
-)
-from deepmd.pt_expt.descriptor.se_e2_a import (
-    DescrptSeA,
-)
-from deepmd.pt_expt.fitting import (
-    InvarFitting,
-)
-from deepmd.pt_expt.fitting.base_fitting import (
-    BaseFitting,
-)
-from deepmd.pt_expt.utils import (
-    env,
-)
-from deepmd.utils.path import (
-    DPPath,
-)
-
-from ...pt.model.test_env_mat import (
-    TestCaseSingleFrameWithNlist,
-)
-from ...seed import (
-    GLOBAL_SEED,
-)
-
-
-class FooFitting(BaseFitting, torch.nn.Module):
-    """Test fitting with multiple outputs for testing global statistics."""
-
-    def __init__(self):
-        torch.nn.Module.__init__(self)
-        BaseFitting.__init__(self)
-
-    def output_def(self):
-        return FittingOutputDef(
-            [
-                OutputVariableDef(
-                    "foo",
-                    [1],
-                    reducible=True,
-                    r_differentiable=True,
-                    c_differentiable=True,
-                ),
-                OutputVariableDef(
-                    "pix",
-                    [1],
-                    reducible=True,
-                    r_differentiable=True,
-                    c_differentiable=True,
-                ),
-                OutputVariableDef(
-                    "bar",
-                    [1, 2],
-                    reducible=True,
-                    r_differentiable=True,
-                    c_differentiable=True,
-                ),
-            ]
-        )
-
-    def serialize(self) -> dict:
-        return {
-            "@class": "Fitting",
-            "type": "foo",
-            "@version": 1,
-        }
-
-    @classmethod
-    def deserialize(cls, data: dict):
-        return cls()
-
-    def get_dim_fparam(self) -> int:
-        return 0
-
-    def get_dim_aparam(self) -> int:
-        return 0
-
-    def get_sel_type(self) -> list[int]:
-        return []
-
-    def change_type_map(
-        self, type_map: list[str], model_with_new_type_stat=None
-    ) -> None:
-        pass
-
-    def get_type_map(self) -> list[str]:
-        return []
-
-    def forward(
-        self,
-        descriptor: torch.Tensor,
-        atype: torch.Tensor,
-        gr: torch.Tensor | None = None,
-        g2: torch.Tensor | None = None,
-        h2: torch.Tensor | None = None,
-        fparam: torch.Tensor | None = None,
-        aparam: torch.Tensor | None = None,
-    ):
-        nf, nloc, _ = descriptor.shape
-        ret = {}
-        ret["foo"] = (
-            torch.Tensor(
-                [
-                    [1.0, 2.0, 3.0],
-                    [4.0, 5.0, 6.0],
-                ]
-            )
-            .view([nf, nloc, *self.output_def()["foo"].shape])
-            .to(dtype=torch.float64, device=env.DEVICE)
-        )
-        ret["pix"] = (
-            torch.Tensor(
-                [
-                    [3.0, 2.0, 1.0],
-                    [6.0, 5.0, 4.0],
-                ]
-            )
-            .view([nf, nloc, *self.output_def()["pix"].shape])
-            .to(dtype=torch.float64, device=env.DEVICE)
-        )
-        ret["bar"] = (
-            torch.Tensor(
-                [
-                    [1.0, 2.0, 3.0, 7.0, 8.0, 9.0],
-                    [4.0, 5.0, 6.0, 10.0, 11.0, 12.0],
-                ]
-            )
-            .view([nf, nloc, *self.output_def()["bar"].shape])
-            .to(dtype=torch.float64, device=env.DEVICE)
-        )
-        return ret
-
-
-def _to_numpy(x):
-    return x.detach().cpu().numpy()
-
-
-class TestAtomicModelStat(unittest.TestCase, TestCaseSingleFrameWithNlist):
-    def tearDown(self) -> None:
-        self.tempdir.cleanup()
-
-    def setUp(self) -> None:
-        TestCaseSingleFrameWithNlist.setUp(self)
-        self.device = env.DEVICE
-        self.merged_output_stat = [
-            {
-                "coord": torch.tensor(np.zeros([2, 3, 3]), device=self.device),
-                "atype": torch.tensor(
-                    np.array([[0, 0, 1], [0, 1, 1]], dtype=np.int32),
-                    device=self.device,
-                ),
-                "atype_ext": torch.tensor(
-                    np.array([[0, 0, 1, 0], [0, 1, 1, 0]], dtype=np.int32),
-                    device=self.device,
-                ),
-                "box": torch.tensor(np.zeros([2, 3, 3]), device=self.device),
-                "natoms": torch.tensor(
-                    np.array([[3, 3, 2, 1], [3, 3, 1, 2]], dtype=np.int32),
-                    device=self.device,
-                ),
-                # bias of foo: 1, 3
-                "foo": torch.tensor(
-                    np.array([5.0, 7.0]).reshape(2, 1), device=self.device
-                ),
-                # no bias of pix
-                # bias of bar: [1, 5], [3, 2]
-                "bar": torch.tensor(
-                    np.array([5.0, 12.0, 7.0, 9.0]).reshape(2, 1, 2),
-                    device=self.device,
-                ),
-                "find_foo": np.float32(1.0),
-                "find_bar": np.float32(1.0),
-            }
-        ]
-        self.tempdir = tempfile.TemporaryDirectory()
-        h5file = str((Path(self.tempdir.name) / "testcase.h5").resolve())
-        with h5py.File(h5file, "w") as f:
-            pass
-        self.stat_file_path = DPPath(h5file, "a")
-
-    def test_output_stat(self) -> None:
-        nf, nloc, nnei = self.nlist.shape
-        ds = DescrptSeA(
-            self.rcut,
-            self.rcut_smth,
-            self.sel,
-        ).to(self.device)
-        ft = FooFitting().to(self.device)
-        type_map = ["foo", "bar"]
-        md0 = DPAtomicModel(
-            ds,
-            ft,
-            type_map=type_map,
-        ).to(self.device)
-        args = [
-            torch.tensor(self.coord_ext, dtype=torch.float64, device=self.device),
-            torch.tensor(self.atype_ext, dtype=torch.int64, device=self.device),
-            torch.tensor(self.nlist, dtype=torch.int64, device=self.device),
-        ]
-        # nf x nloc
-        at = self.atype_ext[:, :nloc]
-
-        def cvt_ret(x):
-            return {kk: _to_numpy(vv) for kk, vv in x.items()}
-
-        # 1. test run without bias
-        # nf x na x odim
-        ret0 = md0.forward_common_atomic(*args)
-        ret0 = cvt_ret(ret0)
-
-        expected_ret0 = {}
-        expected_ret0["foo"] = np.array(
-            [
-                [1.0, 2.0, 3.0],
-                [4.0, 5.0, 6.0],
-            ]
-        ).reshape([nf, nloc, *md0.fitting_output_def()["foo"].shape])
-        expected_ret0["pix"] = np.array(
-            [
-                [3.0, 2.0, 1.0],
-                [6.0, 5.0, 4.0],
-            ]
-        ).reshape([nf, nloc, *md0.fitting_output_def()["pix"].shape])
-        expected_ret0["bar"] = np.array(
-            [
-                [1.0, 2.0, 3.0, 7.0, 8.0, 9.0],
-                [4.0, 5.0, 6.0, 10.0, 11.0, 12.0],
-            ]
-        ).reshape([nf, nloc, *md0.fitting_output_def()["bar"].shape])
-        for kk in ["foo", "pix", "bar"]:
-            np.testing.assert_almost_equal(ret0[kk], expected_ret0[kk])
-
-        # 2. test bias is applied
-        md0.compute_or_load_out_stat(
-            self.merged_output_stat, stat_file_path=self.stat_file_path
-        )
-        ret1 = md0.forward_common_atomic(*args)
-        ret1 = cvt_ret(ret1)
-        expected_std = np.ones((3, 2, 2))  # 3 keys, 2 atypes, 2 max dims.
-        # nt x odim
-        foo_bias = np.array([1.0, 3.0]).reshape(2, 1)
-        bar_bias = np.array([1.0, 5.0, 3.0, 2.0]).reshape(2, 1, 2)
-        expected_ret1 = {}
-        expected_ret1["foo"] = ret0["foo"] + foo_bias[at]
-        expected_ret1["pix"] = ret0["pix"]
-        expected_ret1["bar"] = ret0["bar"] + bar_bias[at]
-        for kk in ["foo", "pix", "bar"]:
-            np.testing.assert_almost_equal(ret1[kk], expected_ret1[kk])
-        np.testing.assert_almost_equal(_to_numpy(md0.out_std), expected_std)
-
-        # 3. test bias load from file
-        def raise_error() -> NoReturn:
-            raise RuntimeError
-
-        md0.compute_or_load_out_stat(raise_error, stat_file_path=self.stat_file_path)
-        ret2 = md0.forward_common_atomic(*args)
-        ret2 = cvt_ret(ret2)
-        for kk in ["foo", "pix", "bar"]:
-            np.testing.assert_almost_equal(ret1[kk], ret2[kk])
-        np.testing.assert_almost_equal(_to_numpy(md0.out_std), expected_std)
-
-        # 4. test change bias
-        md0.change_out_bias(
-            self.merged_output_stat, bias_adjust_mode="change-by-statistic"
-        )
-        # use atype_ext from merged_output_stat for inference (matching pt backend test)
-        args = [
-            torch.tensor(self.coord_ext, dtype=torch.float64, device=self.device),
-            self.merged_output_stat[0]["atype_ext"].to(
-                dtype=torch.int64, device=self.device
-            ),
-            torch.tensor(self.nlist, dtype=torch.int64, device=self.device),
-        ]
-        ret3 = md0.forward_common_atomic(*args)
-        ret3 = cvt_ret(ret3)
-        ## model output on foo: [[2, 3, 6], [5, 8, 9]] given bias [1, 3]
-        ## foo sumed: [11, 22] compared with [5, 7], fit target is [-6, -15]
-        ## fit bias is [1, -8]
-        ## old bias + fit bias [2, -5]
-        ## new model output is [[3, 4, -2], [6, 0, 1]], which sumed to [5, 7]
-        expected_ret3 = {}
-        expected_ret3["foo"] = np.array([[3, 4, -2], [6, 0, 1]]).reshape(2, 3, 1)
-        expected_ret3["pix"] = ret0["pix"]
-        for kk in ["foo", "pix"]:
-            np.testing.assert_almost_equal(ret3[kk], expected_ret3[kk])
-        # bar is too complicated to be manually computed.
-        np.testing.assert_almost_equal(_to_numpy(md0.out_std), expected_std)
-
-    def test_preset_bias(self) -> None:
-        nf, nloc, nnei = self.nlist.shape
-        ds = DescrptSeA(
-            self.rcut,
-            self.rcut_smth,
-            self.sel,
-        ).to(self.device)
-        ft = FooFitting().to(self.device)
-        type_map = ["foo", "bar"]
-        preset_out_bias = {
-            "foo": [None, 2],
-            "bar": np.array([7.0, 5.0, 13.0, 11.0]).reshape(2, 1, 2),
-        }
-        md0 = DPAtomicModel(
-            ds,
-            ft,
-            type_map=type_map,
-            preset_out_bias=preset_out_bias,
-        ).to(self.device)
-        args = [
-            torch.tensor(self.coord_ext, dtype=torch.float64, device=self.device),
-            torch.tensor(self.atype_ext, dtype=torch.int64, device=self.device),
-            torch.tensor(self.nlist, dtype=torch.int64, device=self.device),
-        ]
-        # nf x nloc
-        at = self.atype_ext[:, :nloc]
-
-        def cvt_ret(x):
-            return {kk: _to_numpy(vv) for kk, vv in x.items()}
-
-        # 1. test run without bias
-        # nf x na x odim
-        ret0 = md0.forward_common_atomic(*args)
-        ret0 = cvt_ret(ret0)
-        expected_ret0 = {}
-        expected_ret0["foo"] = np.array(
-            [
-                [1.0, 2.0, 3.0],
-                [4.0, 5.0, 6.0],
-            ]
-        ).reshape([nf, nloc, *md0.fitting_output_def()["foo"].shape])
-        expected_ret0["pix"] = np.array(
-            [
-                [3.0, 2.0, 1.0],
-                [6.0, 5.0, 4.0],
-            ]
-        ).reshape([nf, nloc, *md0.fitting_output_def()["pix"].shape])
-        expected_ret0["bar"] = np.array(
-            [
-                [1.0, 2.0, 3.0, 7.0, 8.0, 9.0],
-                [4.0, 5.0, 6.0, 10.0, 11.0, 12.0],
-            ]
-        ).reshape([nf, nloc, *md0.fitting_output_def()["bar"].shape])
-        for kk in ["foo", "pix", "bar"]:
-            np.testing.assert_almost_equal(ret0[kk], expected_ret0[kk])
-
-        # 2. test bias is applied
-        md0.compute_or_load_out_stat(
-            self.merged_output_stat, stat_file_path=self.stat_file_path
-        )
-        ret1 = md0.forward_common_atomic(*args)
-        ret1 = cvt_ret(ret1)
-        # foo sums: [5, 7],
-        # given bias of type 1 being 2, the bias left for type 0 is [5-2*1, 7-2*2] = [3,3]
-        # the solution of type 0 is 1.8
-        foo_bias = np.array([1.8, preset_out_bias["foo"][1]]).reshape(2, 1)
-        bar_bias = preset_out_bias["bar"]
-        expected_ret1 = {}
-        expected_ret1["foo"] = ret0["foo"] + foo_bias[at]
-        expected_ret1["pix"] = ret0["pix"]
-        expected_ret1["bar"] = ret0["bar"] + bar_bias[at]
-        for kk in ["foo", "pix", "bar"]:
-            np.testing.assert_almost_equal(ret1[kk], expected_ret1[kk])
-
-        # 3. test bias load from file
-        def raise_error() -> NoReturn:
-            raise RuntimeError
-
-        md0.compute_or_load_out_stat(raise_error, stat_file_path=self.stat_file_path)
-        ret2 = md0.forward_common_atomic(*args)
-        ret2 = cvt_ret(ret2)
-        for kk in ["foo", "pix", "bar"]:
-            np.testing.assert_almost_equal(ret1[kk], ret2[kk])
-
-        # 4. test change bias
-        md0.change_out_bias(
-            self.merged_output_stat, bias_adjust_mode="change-by-statistic"
-        )
-        # use atype_ext from merged_output_stat for inference
-        args = [
-            torch.tensor(self.coord_ext, dtype=torch.float64, device=self.device),
-            self.merged_output_stat[0]["atype_ext"].to(
-                dtype=torch.int64, device=self.device
-            ),
-            torch.tensor(self.nlist, dtype=torch.int64, device=self.device),
-        ]
-        ret3 = md0.forward_common_atomic(*args)
-        ret3 = cvt_ret(ret3)
-        ## model output on foo: [[2.8, 3.8, 5], [5.8, 7., 8.]] given bias [1.8, 2]
-        ## foo sumed: [11.6, 20.8] compared with [5, 7], fit target is [-6.6, -13.8]
-        ## fit bias is [-7, 2] (2 is assigned. -7 is fit to [-8.6, -17.8])
-        ## old bias[1.8,2] + fit bias[-7, 2] = [-5.2, 4]
-        ## new model output is [[-4.2, -3.2, 7], [-1.2, 9, 10]]
-        expected_ret3 = {}
-        expected_ret3["foo"] = np.array([[-4.2, -3.2, 7.0], [-1.2, 9.0, 10.0]]).reshape(
-            2, 3, 1
-        )
-        expected_ret3["pix"] = ret0["pix"]
-        for kk in ["foo", "pix"]:
-            np.testing.assert_almost_equal(ret3[kk], expected_ret3[kk])
-        # bar is too complicated to be manually computed.
-
-    def test_preset_bias_all_none(self) -> None:
-        nf, nloc, nnei = self.nlist.shape
-        ds = DescrptSeA(
-            self.rcut,
-            self.rcut_smth,
-            self.sel,
-        ).to(self.device)
-        ft = FooFitting().to(self.device)
-        type_map = ["foo", "bar"]
-        preset_out_bias = {
-            "foo": [None, None],
-        }
-        md0 = DPAtomicModel(
-            ds,
-            ft,
-            type_map=type_map,
-            preset_out_bias=preset_out_bias,
-        ).to(self.device)
-        args = [
-            torch.tensor(self.coord_ext, dtype=torch.float64, device=self.device),
-            torch.tensor(self.atype_ext, dtype=torch.int64, device=self.device),
-            torch.tensor(self.nlist, dtype=torch.int64, device=self.device),
-        ]
-        # nf x nloc
-        at = self.atype_ext[:, :nloc]
-
-        def cvt_ret(x):
-            return {kk: _to_numpy(vv) for kk, vv in x.items()}
-
-        # 1. test run without bias
-        # nf x na x odim
-        ret0 = md0.forward_common_atomic(*args)
-        ret0 = cvt_ret(ret0)
-        expected_ret0 = {}
-        expected_ret0["foo"] = np.array(
-            [
-                [1.0, 2.0, 3.0],
-                [4.0, 5.0, 6.0],
-            ]
-        ).reshape([nf, nloc, *md0.fitting_output_def()["foo"].shape])
-        expected_ret0["pix"] = np.array(
-            [
-                [3.0, 2.0, 1.0],
-                [6.0, 5.0, 4.0],
-            ]
-        ).reshape([nf, nloc, *md0.fitting_output_def()["pix"].shape])
-        expected_ret0["bar"] = np.array(
-            [
-                [1.0, 2.0, 3.0, 7.0, 8.0, 9.0],
-                [4.0, 5.0, 6.0, 10.0, 11.0, 12.0],
-            ]
-        ).reshape([nf, nloc, *md0.fitting_output_def()["bar"].shape])
-        for kk in ["foo", "pix", "bar"]:
-            np.testing.assert_almost_equal(ret0[kk], expected_ret0[kk])
-
-        # 2. test bias is applied (all None preset = same as no preset)
-        md0.compute_or_load_out_stat(
-            self.merged_output_stat, stat_file_path=self.stat_file_path
-        )
-        ret1 = md0.forward_common_atomic(*args)
-        ret1 = cvt_ret(ret1)
-        # nt x odim
-        foo_bias = np.array([1.0, 3.0]).reshape(2, 1)
-        bar_bias = np.array([1.0, 5.0, 3.0, 2.0]).reshape(2, 1, 2)
-        expected_ret1 = {}
-        expected_ret1["foo"] = ret0["foo"] + foo_bias[at]
-        expected_ret1["pix"] = ret0["pix"]
-        expected_ret1["bar"] = ret0["bar"] + bar_bias[at]
-        for kk in ["foo", "pix", "bar"]:
-            np.testing.assert_almost_equal(ret1[kk], expected_ret1[kk])
-
-    def test_serialize(self) -> None:
-        nf, nloc, nnei = self.nlist.shape
-        ds = DescrptSeA(
-            self.rcut,
-            self.rcut_smth,
-            self.sel,
-        ).to(self.device)
-        ft = InvarFitting(
-            "foo",
-            self.nt,
-            ds.get_dim_out(),
-            1,
-            mixed_types=ds.mixed_types(),
-            seed=GLOBAL_SEED,
-        ).to(self.device)
-        type_map = ["A", "B"]
-        md0 = DPAtomicModel(
-            ds,
-            ft,
-            type_map=type_map,
-        ).to(self.device)
-        args = [
-            torch.tensor(self.coord_ext, dtype=torch.float64, device=self.device),
-            torch.tensor(self.atype_ext, dtype=torch.int64, device=self.device),
-            torch.tensor(self.nlist, dtype=torch.int64, device=self.device),
-        ]
-
-        def cvt_ret(x):
-            return {kk: _to_numpy(vv) for kk, vv in x.items()}
-
-        md0.compute_or_load_out_stat(
-            self.merged_output_stat, stat_file_path=self.stat_file_path
-        )
-        ret0 = md0.forward_common_atomic(*args)
-        ret0 = cvt_ret(ret0)
-        md1 = DPAtomicModel.deserialize(md0.serialize())
-        ret1 = md1.forward_common_atomic(*args)
-        ret1 = cvt_ret(ret1)
-
-        for kk in ["foo"]:
-            np.testing.assert_almost_equal(ret0[kk], ret1[kk])
-
-        md2 = DPDPAtomicModel.deserialize(md0.serialize())
-        args_np = [self.coord_ext, self.atype_ext, self.nlist]
-        ret2 = md2.forward_common_atomic(*args_np)
-        for kk in ["foo"]:
-            np.testing.assert_almost_equal(ret0[kk], ret2[kk])
-
-
-class TestChangeByStatMixedLabels(unittest.TestCase, TestCaseSingleFrameWithNlist):
-    """Test change-by-statistic with mixed atomic and global labels."""
-
-    def tearDown(self) -> None:
-        self.tempdir.cleanup()
-
-    def setUp(self) -> None:
-        TestCaseSingleFrameWithNlist.setUp(self)
-        self.device = env.DEVICE
-        self.merged_output_stat = [
-            {
-                "coord": torch.tensor(np.zeros([2, 3, 3]), device=self.device),
-                "atype": torch.tensor(
-                    np.array([[0, 0, 1], [0, 1, 1]], dtype=np.int32),
-                    device=self.device,
-                ),
-                "atype_ext": torch.tensor(
-                    np.array([[0, 0, 1, 0], [0, 1, 1, 0]], dtype=np.int32),
-                    device=self.device,
-                ),
-                "box": torch.tensor(np.zeros([2, 3, 3]), device=self.device),
-                "natoms": torch.tensor(
-                    np.array([[3, 3, 2, 1], [3, 3, 1, 2]], dtype=np.int32),
-                    device=self.device,
-                ),
-                # foo: atomic label
-                "atom_foo": torch.tensor(
-                    np.array([[5.0, 5.0, 5.0], [5.0, 6.0, 7.0]]).reshape(2, 3, 1),
-                    device=self.device,
-                ),
-                # pix: global label
-                "pix": torch.tensor(
-                    np.array([5.0, 12.0]).reshape(2, 1), device=self.device
-                ),
-                # bar: global label
-                "bar": torch.tensor(
-                    np.array([5.0, 12.0, 7.0, 9.0]).reshape(2, 1, 2),
-                    device=self.device,
-                ),
-                "find_atom_foo": np.float32(1.0),
-                "find_pix": np.float32(1.0),
-                "find_bar": np.float32(1.0),
-            },
-        ]
-        self.tempdir = tempfile.TemporaryDirectory()
-        h5file = str((Path(self.tempdir.name) / "testcase.h5").resolve())
-        with h5py.File(h5file, "w") as f:
-            pass
-        self.stat_file_path = DPPath(h5file, "a")
-
-    def test_change_by_statistic(self) -> None:
-        """Test change-by-statistic with atomic foo + global pix + global bar."""
-        nf, nloc, nnei = self.nlist.shape
-        ds = DescrptSeA(
-            self.rcut,
-            self.rcut_smth,
-            self.sel,
-        ).to(self.device)
-        ft = FooFitting().to(self.device)
-        type_map = ["foo", "bar"]
-        md0 = DPAtomicModel(
-            ds,
-            ft,
-            type_map=type_map,
-        ).to(self.device)
-        args = [
-            torch.tensor(self.coord_ext, dtype=torch.float64, device=self.device),
-            torch.tensor(self.atype_ext, dtype=torch.int64, device=self.device),
-            torch.tensor(self.nlist, dtype=torch.int64, device=self.device),
-        ]
-
-        def cvt_ret(x):
-            return {kk: _to_numpy(vv) for kk, vv in x.items()}
-
-        ret0 = md0.forward_common_atomic(*args)
-        ret0 = cvt_ret(ret0)
-
-        # set initial bias
-        md0.compute_or_load_out_stat(
-            self.merged_output_stat, stat_file_path=self.stat_file_path
-        )
-
-        # change bias
-        md0.change_out_bias(
-            self.merged_output_stat, bias_adjust_mode="change-by-statistic"
-        )
-        # use atype_ext from merged_output_stat for inference
-        args = [
-            torch.tensor(self.coord_ext, dtype=torch.float64, device=self.device),
-            self.merged_output_stat[0]["atype_ext"].to(
-                dtype=torch.int64, device=self.device
-            ),
-            torch.tensor(self.nlist, dtype=torch.int64, device=self.device),
-        ]
-        ret3 = md0.forward_common_atomic(*args)
-        ret3 = cvt_ret(ret3)
-        # foo: atomic label, bias after set-by-stat: [5, 6]
-        # model output with bias [5,6], atype [[0,0,1],[0,1,1]]:
-        #   [[6, 7, 9], [9, 11, 12]]
-        # atom_foo labels: [[5, 5, 5], [5, 6, 7]]
-        # per-atom delta: [[-1, -2, -4], [-4, -5, -5]]
-        # delta bias (mean per type): type0=-7/3, type1=-14/3
-        # new bias = [5-7/3, 6-14/3] = [8/3, 4/3]
-        # new output: [[11/3, 14/3, 13/3], [20/3, 19/3, 22/3]]
-        expected_ret3 = {}
-        expected_ret3["foo"] = np.array(
-            [[3.6667, 4.6667, 4.3333], [6.6667, 6.3333, 7.3333]]
-        ).reshape(2, 3, 1)
-        # pix: global label, bias after set-by-stat: [-2/3, 19/3]
-        # model pix with bias, atype [[0,0,1],[0,1,1]]:
-        #   [[7/3, 4/3, 22/3], [16/3, 34/3, 31/3]], sums [11, 27]
-        # labels [5, 12], delta [-6, -15]
-        # lstsq: delta bias [1, -8], new bias [1/3, -5/3]
-        # new output: [[10/3, 7/3, -2/3], [19/3, 10/3, 7/3]]
-        expected_ret3["pix"] = np.array(
-            [[3.3333, 2.3333, -0.6667], [6.3333, 3.3333, 2.3333]]
-        ).reshape(2, 3, 1)
-        for kk in ["foo", "pix"]:
-            np.testing.assert_almost_equal(ret3[kk], expected_ret3[kk], decimal=4)
-        # bar is too complicated to be manually computed.
-
-
-class TestEnergyModelStat(unittest.TestCase, TestCaseSingleFrameWithNlist):
-    """Test statistics computation with real energy fitting net."""
-
-    def tearDown(self) -> None:
-        self.tempdir.cleanup()
-
-    def setUp(self) -> None:
-        TestCaseSingleFrameWithNlist.setUp(self)
-        self.device = env.DEVICE
-        self.merged_output_stat = [
-            {
-                "coord": torch.tensor(np.zeros([2, 3, 3]), device=self.device),
-                "atype": torch.tensor(
-                    np.array([[0, 0, 1], [0, 1, 1]], dtype=np.int32),
-                    device=self.device,
-                ),
-                "atype_ext": torch.tensor(
-                    np.array([[0, 0, 1, 0], [0, 1, 1, 0]], dtype=np.int32),
-                    device=self.device,
-                ),
-                "box": torch.tensor(np.zeros([2, 3, 3]), device=self.device),
-                "natoms": torch.tensor(
-                    np.array([[3, 3, 2, 1], [3, 3, 1, 2]], dtype=np.int32),
-                    device=self.device,
-                ),
-                # energy data
-                "energy": torch.tensor(
-                    np.array([10.0, 20.0]).reshape(2, 1), device=self.device
-                ),
-                "find_energy": np.float32(1.0),
-            },
-        ]
-        self.tempdir = tempfile.TemporaryDirectory()
-        h5file = str((Path(self.tempdir.name) / "testcase.h5").resolve())
-        with h5py.File(h5file, "w") as f:
-            pass
-        self.stat_file_path = DPPath(h5file, "a")
-
-    def test_energy_stat(self) -> None:
-        """Test energy statistics computation with real energy fitting net."""
-        nf, nloc, nnei = self.nlist.shape
-        ds = DescrptSeA(
-            self.rcut,
-            self.rcut_smth,
-            self.sel,
-        ).to(self.device)
-        ft = InvarFitting(
-            "energy",
-            self.nt,
-            ds.get_dim_out(),
-            1,
-            mixed_types=ds.mixed_types(),
-            seed=GLOBAL_SEED,
-        ).to(self.device)
-        type_map = ["foo", "bar"]
-        md0 = DPAtomicModel(
-            ds,
-            ft,
-            type_map=type_map,
-        ).to(self.device)
-        args = [
-            torch.tensor(self.coord_ext, dtype=torch.float64, device=self.device),
-            torch.tensor(self.atype_ext, dtype=torch.int64, device=self.device),
-            torch.tensor(self.nlist, dtype=torch.int64, device=self.device),
-        ]
-
-        # test run without bias
-        ret0 = md0.forward_common_atomic(*args)
-        self.assertIn("energy", ret0)
-
-        # compute statistics
-        md0.compute_or_load_out_stat(
-            self.merged_output_stat, stat_file_path=self.stat_file_path
-        )
-        ret1 = md0.forward_common_atomic(*args)
-        self.assertIn("energy", ret1)
-
-        # Check that bias was computed (out_bias should be non-zero)
-        self.assertFalse(torch.all(md0.out_bias == 0))
-
-        # test bias load from file
-        def raise_error() -> NoReturn:
-            raise RuntimeError
-
-        md0.compute_or_load_out_stat(raise_error, stat_file_path=self.stat_file_path)
-        ret2 = md0.forward_common_atomic(*args)
-        np.testing.assert_allclose(
-            ret1["energy"].detach().cpu().numpy(),
-            ret2["energy"].detach().cpu().numpy(),
-        )
-
-        # test change bias
-        md0.change_out_bias(
-            self.merged_output_stat, bias_adjust_mode="change-by-statistic"
-        )
-        ret3 = md0.forward_common_atomic(*args)
-        self.assertIn("energy", ret3)
+# SPDX-License-Identifier: LGPL-3.0-or-later
+import tempfile
+import unittest
+from pathlib import (
+    Path,
+)
+from typing import (
+    NoReturn,
+)
+
+import h5py
+import numpy as np
+
+from deepmd.dpmodel.atomic_model import DPAtomicModel as DPDPAtomicModel
+from deepmd.dpmodel.common import (
+    NativeOP,
+)
+from deepmd.dpmodel.descriptor import (
+    DescrptSeA,
+)
+from deepmd.dpmodel.fitting import (
+    InvarFitting,
+)
+from deepmd.dpmodel.fitting.base_fitting import (
+    BaseFitting,
+)
+from deepmd.dpmodel.output_def import (
+    FittingOutputDef,
+    OutputVariableDef,
+)
+from deepmd.utils.path import (
+    DPPath,
+)
+
+from .case_single_frame_with_nlist import (
+    TestCaseSingleFrameWithNlist,
+)
+
+
+class FooFitting(NativeOP, BaseFitting):
+    """Test fitting with multiple outputs for testing global statistics."""
+
+    def __init__(self):
+        pass
+
+    def output_def(self):
+        return FittingOutputDef(
+            [
+                OutputVariableDef(
+                    "foo",
+                    [1],
+                    reducible=True,
+                    r_differentiable=True,
+                    c_differentiable=True,
+                ),
+                OutputVariableDef(
+                    "pix",
+                    [1],
+                    reducible=True,
+                    r_differentiable=True,
+                    c_differentiable=True,
+                ),
+                OutputVariableDef(
+                    "bar",
+                    [1, 2],
+                    reducible=True,
+                    r_differentiable=True,
+                    c_differentiable=True,
+                ),
+            ]
+        )
+
+    def serialize(self) -> dict:
+        return {
+            "@class": "Fitting",
+            "type": "foo",
+            "@version": 1,
+        }
+
+    @classmethod
+    def deserialize(cls, data: dict):
+        return cls()
+
+    def get_dim_fparam(self) -> int:
+        return 0
+
+    def get_dim_aparam(self) -> int:
+        return 0
+
+    def get_sel_type(self) -> list[int]:
+        return []
+
+    def change_type_map(
+        self, type_map: list[str], model_with_new_type_stat=None
+    ) -> None:
+        pass
+
+    def get_type_map(self) -> list[str]:
+        return []
+
+    def call(
+        self,
+        descriptor,
+        atype,
+        gr=None,
+        g2=None,
+        h2=None,
+        fparam=None,
+        aparam=None,
+    ):
+        nf, nloc, _ = descriptor.shape
+        ret = {}
+        ret["foo"] = np.array(
+            [
+                [1.0, 2.0, 3.0],
+                [4.0, 5.0, 6.0],
+            ]
+        ).reshape([nf, nloc, *self.output_def()["foo"].shape])
+        ret["pix"] = np.array(
+            [
+                [3.0, 2.0, 1.0],
+                [6.0, 5.0, 4.0],
+            ]
+        ).reshape([nf, nloc, *self.output_def()["pix"].shape])
+        ret["bar"] = np.array(
+            [
+                [1.0, 2.0, 3.0, 7.0, 8.0, 9.0],
+                [4.0, 5.0, 6.0, 10.0, 11.0, 12.0],
+            ]
+        ).reshape([nf, nloc, *self.output_def()["bar"].shape])
+        return ret
+
+
+class TestAtomicModelStat(unittest.TestCase, TestCaseSingleFrameWithNlist):
+    def tearDown(self) -> None:
+        self.tempdir.cleanup()
+
+    def setUp(self) -> None:
+        TestCaseSingleFrameWithNlist.setUp(self)
+        self.merged_output_stat = [
+            {
+                "coord": np.zeros([2, 3, 3]),
+                "atype": np.array([[0, 0, 1], [0, 1, 1]], dtype=np.int32),
+                "atype_ext": np.array([[0, 0, 1, 0], [0, 1, 1, 0]], dtype=np.int32),
+                "box": np.zeros([2, 3, 3]),
+                "natoms": np.array([[3, 3, 2, 1], [3, 3, 1, 2]], dtype=np.int32),
+                # bias of foo: 1, 3
+                "foo": np.array([5.0, 7.0]).reshape(2, 1),
+                # no bias of pix
+                # bias of bar: [1, 5], [3, 2]
+                "bar": np.array([5.0, 12.0, 7.0, 9.0]).reshape(2, 1, 2),
+                "find_foo": np.float32(1.0),
+                "find_bar": np.float32(1.0),
+            }
+        ]
+        self.tempdir = tempfile.TemporaryDirectory()
+        h5file = str((Path(self.tempdir.name) / "testcase.h5").resolve())
+        with h5py.File(h5file, "w") as f:
+            pass
+        self.stat_file_path = DPPath(h5file, "a")
+
+    def test_output_stat(self) -> None:
+        nf, nloc, nnei = self.nlist.shape
+        ds = DescrptSeA(
+            self.rcut,
+            self.rcut_smth,
+            self.sel,
+        )
+        ft = FooFitting()
+        type_map = ["foo", "bar"]
+        md0 = DPDPAtomicModel(
+            ds,
+            ft,
+            type_map=type_map,
+        )
+        args = [self.coord_ext, self.atype_ext, self.nlist]
+        # nf x nloc
+        at = self.atype_ext[:, :nloc]
+
+        # 1. test run without bias
+        # nf x na x odim
+        ret0 = md0.forward_common_atomic(*args)
+
+        expected_ret0 = {}
+        expected_ret0["foo"] = np.array(
+            [
+                [1.0, 2.0, 3.0],
+                [4.0, 5.0, 6.0],
+            ]
+        ).reshape([nf, nloc, *md0.fitting_output_def()["foo"].shape])
+        expected_ret0["pix"] = np.array(
+            [
+                [3.0, 2.0, 1.0],
+                [6.0, 5.0, 4.0],
+            ]
+        ).reshape([nf, nloc, *md0.fitting_output_def()["pix"].shape])
+        expected_ret0["bar"] = np.array(
+            [
+                [1.0, 2.0, 3.0, 7.0, 8.0, 9.0],
+                [4.0, 5.0, 6.0, 10.0, 11.0, 12.0],
+            ]
+        ).reshape([nf, nloc, *md0.fitting_output_def()["bar"].shape])
+        for kk in ["foo", "pix", "bar"]:
+            np.testing.assert_almost_equal(ret0[kk], expected_ret0[kk])
+
+        # 2. test bias is applied
+        md0.compute_or_load_out_stat(
+            self.merged_output_stat, stat_file_path=self.stat_file_path
+        )
+        ret1 = md0.forward_common_atomic(*args)
+        expected_std = np.ones((3, 2, 2))  # 3 keys, 2 atypes, 2 max dims.
+        # nt x odim
+        foo_bias = np.array([1.0, 3.0]).reshape(2, 1)
+        bar_bias = np.array([1.0, 5.0, 3.0, 2.0]).reshape(2, 1, 2)
+        expected_ret1 = {}
+        expected_ret1["foo"] = ret0["foo"] + foo_bias[at]
+        expected_ret1["pix"] = ret0["pix"]
+        expected_ret1["bar"] = ret0["bar"] + bar_bias[at]
+        for kk in ["foo", "pix", "bar"]:
+            np.testing.assert_almost_equal(ret1[kk], expected_ret1[kk])
+        np.testing.assert_almost_equal(md0.out_std, expected_std)
+
+        # 3. test bias load from file
+        def raise_error() -> NoReturn:
+            raise RuntimeError
+
+        md0.compute_or_load_out_stat(raise_error, stat_file_path=self.stat_file_path)
+        ret2 = md0.forward_common_atomic(*args)
+        for kk in ["foo", "pix", "bar"]:
+            np.testing.assert_almost_equal(ret1[kk], ret2[kk])
+        np.testing.assert_almost_equal(md0.out_std, expected_std)
+
+        # 4. test change bias
+        md0.change_out_bias(
+            self.merged_output_stat, bias_adjust_mode="change-by-statistic"
+        )
+        # use atype_ext from merged_output_stat for inference
+        args = [
+            self.coord_ext,
+            np.array(self.merged_output_stat[0]["atype_ext"], dtype=np.int64),
+            self.nlist,
+        ]
+        ret3 = md0.forward_common_atomic(*args)
+        ## model output on foo: [[2, 3, 6], [5, 8, 9]] given bias [1, 3]
+        ## foo sumed: [11, 22] compared with [5, 7], fit target is [-6, -15]
+        ## fit bias is [1, -8]
+        ## old bias + fit bias [2, -5]
+        ## new model output is [[3, 4, -2], [6, 0, 1]], which sumed to [5, 7]
+        expected_ret3 = {}
+        expected_ret3["foo"] = np.array([[3, 4, -2], [6, 0, 1]]).reshape(2, 3, 1)
+        expected_ret3["pix"] = ret0["pix"]
+        for kk in ["foo", "pix"]:
+            np.testing.assert_almost_equal(ret3[kk], expected_ret3[kk])
+        # bar is too complicated to be manually computed.
+        np.testing.assert_almost_equal(md0.out_std, expected_std)
+
+    def test_preset_bias(self) -> None:
+        nf, nloc, nnei = self.nlist.shape
+        ds = DescrptSeA(
+            self.rcut,
+            self.rcut_smth,
+            self.sel,
+        )
+        ft = FooFitting()
+        type_map = ["foo", "bar"]
+        preset_out_bias = {
+            "foo": [None, 2],
+            "bar": np.array([7.0, 5.0, 13.0, 11.0]).reshape(2, 1, 2),
+        }
+        md0 = DPDPAtomicModel(
+            ds,
+            ft,
+            type_map=type_map,
+            preset_out_bias=preset_out_bias,
+        )
+        args = [self.coord_ext, self.atype_ext, self.nlist]
+        # nf x nloc
+        at = self.atype_ext[:, :nloc]
+
+        # 1. test run without bias
+        # nf x na x odim
+        ret0 = md0.forward_common_atomic(*args)
+        expected_ret0 = {}
+        expected_ret0["foo"] = np.array(
+            [
+                [1.0, 2.0, 3.0],
+                [4.0, 5.0, 6.0],
+            ]
+        ).reshape([nf, nloc, *md0.fitting_output_def()["foo"].shape])
+        expected_ret0["pix"] = np.array(
+            [
+                [3.0, 2.0, 1.0],
+                [6.0, 5.0, 4.0],
+            ]
+        ).reshape([nf, nloc, *md0.fitting_output_def()["pix"].shape])
+        expected_ret0["bar"] = np.array(
+            [
+                [1.0, 2.0, 3.0, 7.0, 8.0, 9.0],
+                [4.0, 5.0, 6.0, 10.0, 11.0, 12.0],
+            ]
+        ).reshape([nf, nloc, *md0.fitting_output_def()["bar"].shape])
+        for kk in ["foo", "pix", "bar"]:
+            np.testing.assert_almost_equal(ret0[kk], expected_ret0[kk])
+
+        # 2. test bias is applied
+        md0.compute_or_load_out_stat(
+            self.merged_output_stat, stat_file_path=self.stat_file_path
+        )
+        ret1 = md0.forward_common_atomic(*args)
+        # foo sums: [5, 7],
+        # given bias of type 1 being 2, the bias left for type 0 is [5-2*1, 7-2*2] = [3,3]
+        # the solution of type 0 is 1.8
+        foo_bias = np.array([1.8, preset_out_bias["foo"][1]]).reshape(2, 1)
+        bar_bias = preset_out_bias["bar"]
+        expected_ret1 = {}
+        expected_ret1["foo"] = ret0["foo"] + foo_bias[at]
+        expected_ret1["pix"] = ret0["pix"]
+        expected_ret1["bar"] = ret0["bar"] + bar_bias[at]
+        for kk in ["foo", "pix", "bar"]:
+            np.testing.assert_almost_equal(ret1[kk], expected_ret1[kk])
+
+        # 3. test bias load from file
+        def raise_error() -> NoReturn:
+            raise RuntimeError
+
+        md0.compute_or_load_out_stat(raise_error, stat_file_path=self.stat_file_path)
+        ret2 = md0.forward_common_atomic(*args)
+        for kk in ["foo", "pix", "bar"]:
+            np.testing.assert_almost_equal(ret1[kk], ret2[kk])
+
+        # 4. test change bias
+        md0.change_out_bias(
+            self.merged_output_stat, bias_adjust_mode="change-by-statistic"
+        )
+        # use atype_ext from merged_output_stat for inference
+        args = [
+            self.coord_ext,
+            np.array(self.merged_output_stat[0]["atype_ext"], dtype=np.int64),
+            self.nlist,
+        ]
+        ret3 = md0.forward_common_atomic(*args)
+        ## model output on foo: [[2.8, 3.8, 5], [5.8, 7., 8.]] given bias [1.8, 2]
+        ## foo sumed: [11.6, 20.8] compared with [5, 7], fit target is [-6.6, -13.8]
+        ## fit bias is [-7, 2] (2 is assigned. -7 is fit to [-8.6, -17.8])
+        ## old bias[1.8,2] + fit bias[-7, 2] = [-5.2, 4]
+        ## new model output is [[-4.2, -3.2, 7], [-1.2, 9, 10]]
+        expected_ret3 = {}
+        expected_ret3["foo"] = np.array([[-4.2, -3.2, 7.0], [-1.2, 9.0, 10.0]]).reshape(
+            2, 3, 1
+        )
+        expected_ret3["pix"] = ret0["pix"]
+        for kk in ["foo", "pix"]:
+            np.testing.assert_almost_equal(ret3[kk], expected_ret3[kk])
+        # bar is too complicated to be manually computed.
+
+    def test_preset_bias_all_none(self) -> None:
+        nf, nloc, nnei = self.nlist.shape
+        ds = DescrptSeA(
+            self.rcut,
+            self.rcut_smth,
+            self.sel,
+        )
+        ft = FooFitting()
+        type_map = ["foo", "bar"]
+        preset_out_bias = {
+            "foo": [None, None],
+        }
+        md0 = DPDPAtomicModel(
+            ds,
+            ft,
+            type_map=type_map,
+            preset_out_bias=preset_out_bias,
+        )
+        args = [self.coord_ext, self.atype_ext, self.nlist]
+        # nf x nloc
+        at = self.atype_ext[:, :nloc]
+
+        # 1. test run without bias
+        # nf x na x odim
+        ret0 = md0.forward_common_atomic(*args)
+        expected_ret0 = {}
+        expected_ret0["foo"] = np.array(
+            [
+                [1.0, 2.0, 3.0],
+                [4.0, 5.0, 6.0],
+            ]
+        ).reshape([nf, nloc, *md0.fitting_output_def()["foo"].shape])
+        expected_ret0["pix"] = np.array(
+            [
+                [3.0, 2.0, 1.0],
+                [6.0, 5.0, 4.0],
+            ]
+        ).reshape([nf, nloc, *md0.fitting_output_def()["pix"].shape])
+        expected_ret0["bar"] = np.array(
+            [
+                [1.0, 2.0, 3.0, 7.0, 8.0, 9.0],
+                [4.0, 5.0, 6.0, 10.0, 11.0, 12.0],
+            ]
+        ).reshape([nf, nloc, *md0.fitting_output_def()["bar"].shape])
+        for kk in ["foo", "pix", "bar"]:
+            np.testing.assert_almost_equal(ret0[kk], expected_ret0[kk])
+
+        # 2. test bias is applied (all None preset = same as no preset)
+        md0.compute_or_load_out_stat(
+            self.merged_output_stat, stat_file_path=self.stat_file_path
+        )
+        ret1 = md0.forward_common_atomic(*args)
+        # nt x odim
+        foo_bias = np.array([1.0, 3.0]).reshape(2, 1)
+        bar_bias = np.array([1.0, 5.0, 3.0, 2.0]).reshape(2, 1, 2)
+        expected_ret1 = {}
+        expected_ret1["foo"] = ret0["foo"] + foo_bias[at]
+        expected_ret1["pix"] = ret0["pix"]
+        expected_ret1["bar"] = ret0["bar"] + bar_bias[at]
+        for kk in ["foo", "pix", "bar"]:
+            np.testing.assert_almost_equal(ret1[kk], expected_ret1[kk])
+
+    def test_serialize(self) -> None:
+        nf, nloc, nnei = self.nlist.shape
+        ds = DescrptSeA(
+            self.rcut,
+            self.rcut_smth,
+            self.sel,
+        )
+        ft = InvarFitting(
+            "foo",
+            self.nt,
+            ds.get_dim_out(),
+            1,
+            mixed_types=ds.mixed_types(),
+        )
+        type_map = ["A", "B"]
+        md0 = DPDPAtomicModel(
+            ds,
+            ft,
+            type_map=type_map,
+        )
+        args = [self.coord_ext, self.atype_ext, self.nlist]
+
+        md0.compute_or_load_out_stat(
+            self.merged_output_stat, stat_file_path=self.stat_file_path
+        )
+        ret0 = md0.forward_common_atomic(*args)
+        md1 = DPDPAtomicModel.deserialize(md0.serialize())
+        ret1 = md1.forward_common_atomic(*args)
+
+        for kk in ["foo"]:
+            np.testing.assert_almost_equal(ret0[kk], ret1[kk])
+
+
+class TestChangeByStatMixedLabels(unittest.TestCase, TestCaseSingleFrameWithNlist):
+    """Test change-by-statistic with mixed atomic and global labels."""
+
+    def tearDown(self) -> None:
+        self.tempdir.cleanup()
+
+    def setUp(self) -> None:
+        TestCaseSingleFrameWithNlist.setUp(self)
+        self.merged_output_stat = [
+            {
+                "coord": np.zeros([2, 3, 3]),
+                "atype": np.array([[0, 0, 1], [0, 1, 1]], dtype=np.int32),
+                "atype_ext": np.array([[0, 0, 1, 0], [0, 1, 1, 0]], dtype=np.int32),
+                "box": np.zeros([2, 3, 3]),
+                "natoms": np.array([[3, 3, 2, 1], [3, 3, 1, 2]], dtype=np.int32),
+                # foo: atomic label
+                "atom_foo": np.array([[5.0, 5.0, 5.0], [5.0, 6.0, 7.0]]).reshape(
+                    2, 3, 1
+                ),
+                # pix: global label
+                "pix": np.array([5.0, 12.0]).reshape(2, 1),
+                # bar: global label
+                "bar": np.array([5.0, 12.0, 7.0, 9.0]).reshape(2, 1, 2),
+                "find_atom_foo": np.float32(1.0),
+                "find_pix": np.float32(1.0),
+                "find_bar": np.float32(1.0),
+            },
+        ]
+        self.tempdir = tempfile.TemporaryDirectory()
+        h5file = str((Path(self.tempdir.name) / "testcase.h5").resolve())
+        with h5py.File(h5file, "w") as f:
+            pass
+        self.stat_file_path = DPPath(h5file, "a")
+
+    def test_change_by_statistic(self) -> None:
+        """Test change-by-statistic with atomic foo + global pix + global bar."""
+        nf, nloc, nnei = self.nlist.shape
+        ds = DescrptSeA(
+            self.rcut,
+            self.rcut_smth,
+            self.sel,
+        )
+        ft = FooFitting()
+        type_map = ["foo", "bar"]
+        md0 = DPDPAtomicModel(
+            ds,
+            ft,
+            type_map=type_map,
+        )
+        args = [self.coord_ext, self.atype_ext, self.nlist]
+
+        ret0 = md0.forward_common_atomic(*args)
+
+        # set initial bias
+        md0.compute_or_load_out_stat(
+            self.merged_output_stat, stat_file_path=self.stat_file_path
+        )
+
+        # change bias
+        md0.change_out_bias(
+            self.merged_output_stat, bias_adjust_mode="change-by-statistic"
+        )
+        # use atype_ext from merged_output_stat for inference
+        args = [
+            self.coord_ext,
+            np.array(self.merged_output_stat[0]["atype_ext"], dtype=np.int64),
+            self.nlist,
+        ]
+        ret3 = md0.forward_common_atomic(*args)
+        # foo: atomic label, bias after set-by-stat: [5, 6]
+        # model output with bias [5,6], atype [[0,0,1],[0,1,1]]:
+        #   [[6, 7, 9], [9, 11, 12]]
+        # atom_foo labels: [[5, 5, 5], [5, 6, 7]]
+        # per-atom delta: [[-1, -2, -4], [-4, -5, -5]]
+        # delta bias (mean per type): type0=-7/3, type1=-14/3
+        # new bias = [5-7/3, 6-14/3] = [8/3, 4/3]
+        # new output: [[11/3, 14/3, 13/3], [20/3, 19/3, 22/3]]
+        expected_ret3 = {}
+        expected_ret3["foo"] = np.array(
+            [[3.6667, 4.6667, 4.3333], [6.6667, 6.3333, 7.3333]]
+        ).reshape(2, 3, 1)
+        # pix: global label, bias after set-by-stat: [-2/3, 19/3]
+        # model pix with bias, atype [[0,0,1],[0,1,1]]:
+        #   [[7/3, 4/3, 22/3], [16/3, 34/3, 31/3]], sums [11, 27]
+        # labels [5, 12], delta [-6, -15]
+        # lstsq: delta bias [1, -8], new bias [1/3, -5/3]
+        # new output: [[10/3, 7/3, -2/3], [19/3, 10/3, 7/3]]
+        expected_ret3["pix"] = np.array(
+            [[3.3333, 2.3333, -0.6667], [6.3333, 3.3333, 2.3333]]
+        ).reshape(2, 3, 1)
+        for kk in ["foo", "pix"]:
+            np.testing.assert_almost_equal(ret3[kk], expected_ret3[kk], decimal=4)
+        # bar is too complicated to be manually computed.
+
+
+class TestEnergyModelStat(unittest.TestCase, TestCaseSingleFrameWithNlist):
+    """Test statistics computation with real energy fitting net."""
+
+    def tearDown(self) -> None:
+        self.tempdir.cleanup()
+
+    def setUp(self) -> None:
+        TestCaseSingleFrameWithNlist.setUp(self)
+        self.merged_output_stat = [
+            {
+                "coord": np.zeros([2, 3, 3]),
+                "atype": np.array([[0, 0, 1], [0, 1, 1]], dtype=np.int32),
+                "atype_ext": np.array([[0, 0, 1, 0], [0, 1, 1, 0]], dtype=np.int32),
+                "box": np.zeros([2, 3, 3]),
+                "natoms": np.array([[3, 3, 2, 1], [3, 3, 1, 2]], dtype=np.int32),
+                # energy data
+                "energy": np.array([10.0, 20.0]).reshape(2, 1),
+                "find_energy": np.float32(1.0),
+            },
+        ]
+        self.tempdir = tempfile.TemporaryDirectory()
+        h5file = str((Path(self.tempdir.name) / "testcase.h5").resolve())
+        with h5py.File(h5file, "w") as f:
+            pass
+        self.stat_file_path = DPPath(h5file, "a")
+
+    def test_energy_stat(self) -> None:
+        """Test energy statistics computation with real energy fitting net."""
+        nf, nloc, nnei = self.nlist.shape
+        ds = DescrptSeA(
+            self.rcut,
+            self.rcut_smth,
+            self.sel,
+        )
+        ft = InvarFitting(
+            "energy",
+            self.nt,
+            ds.get_dim_out(),
+            1,
+            mixed_types=ds.mixed_types(),
+        )
+        type_map = ["foo", "bar"]
+        md0 = DPDPAtomicModel(
+            ds,
+            ft,
+            type_map=type_map,
+        )
+        args = [self.coord_ext, self.atype_ext, self.nlist]
+
+        # test run without bias
+        ret0 = md0.forward_common_atomic(*args)
+        self.assertIn("energy", ret0)
+
+        # compute statistics
+        md0.compute_or_load_out_stat(
+            self.merged_output_stat, stat_file_path=self.stat_file_path
+        )
+        ret1 = md0.forward_common_atomic(*args)
+        self.assertIn("energy", ret1)
+
+        # Check that bias was computed (out_bias should be non-zero)
+        self.assertFalse(np.all(md0.out_bias == 0))
+
+        # test bias load from file
+        def raise_error() -> NoReturn:
+            raise RuntimeError
+
+        md0.compute_or_load_out_stat(raise_error, stat_file_path=self.stat_file_path)
+        ret2 = md0.forward_common_atomic(*args)
+        np.testing.assert_allclose(
+            ret1["energy"],
+            ret2["energy"],
+        )
+
+        # test change bias
+        md0.change_out_bias(
+            self.merged_output_stat, bias_adjust_mode="change-by-statistic"
+        )
+        ret3 = md0.forward_common_atomic(*args)
+        self.assertIn("energy", ret3)
+
+
+if __name__ == "__main__":
+    unittest.main()
diff --git a/source/tests/pt_expt/atomic_model/test_dp_atomic_model.py b/source/tests/pt_expt/atomic_model/test_dp_atomic_model.py
deleted file mode 100644
index 0196170cd0..0000000000
--- a/source/tests/pt_expt/atomic_model/test_dp_atomic_model.py
+++ /dev/null
@@ -1,288 +0,0 @@
-# SPDX-License-Identifier: LGPL-3.0-or-later
-import itertools
-import unittest
-
-import numpy as np
-import torch
-
-from deepmd.dpmodel.atomic_model import DPAtomicModel as DPDPAtomicModel
-from deepmd.dpmodel.descriptor import DescrptSeA as DPDescrptSeA
-from deepmd.dpmodel.fitting import InvarFitting as DPInvarFitting
-from deepmd.pt_expt.atomic_model import (
-    DPAtomicModel,
-)
-from deepmd.pt_expt.descriptor.se_e2_a import (
-    DescrptSeA,
-)
-from deepmd.pt_expt.fitting import (
-    InvarFitting,
-)
-from deepmd.pt_expt.utils import (
-    env,
-)
-
-from ...pt.model.test_env_mat import (
-    TestCaseSingleFrameWithNlist,
-    TestCaseSingleFrameWithNlistWithVirtual,
-)
-from ...seed import (
-    GLOBAL_SEED,
-)
-
-
-class TestDPAtomicModel(unittest.TestCase, TestCaseSingleFrameWithNlist):
-    def setUp(self) -> None:
-        TestCaseSingleFrameWithNlist.setUp(self)
-        self.device = env.DEVICE
-
-    def test_self_consistency(self) -> None:
-        """Test that pt_expt atomic model serialize/deserialize preserves behavior."""
-        nf, nloc, nnei = self.nlist.shape
-        ds = DescrptSeA(
-            self.rcut,
-            self.rcut_smth,
-            self.sel,
-        ).to(self.device)
-        ft = InvarFitting(
-            "energy",
-            self.nt,
-            ds.get_dim_out(),
-            1,
-            mixed_types=ds.mixed_types(),
-            seed=GLOBAL_SEED,
-        ).to(self.device)
-        type_map = ["foo", "bar"]
-
-        # test the case of exclusion
-        for atom_excl, pair_excl in itertools.product([[], [1]], [[], [[0, 1]]]):
-            md0 = DPAtomicModel(
-                ds,
-                ft,
-                type_map=type_map,
-            ).to(self.device)
-            md0.reinit_atom_exclude(atom_excl)
-            md0.reinit_pair_exclude(pair_excl)
-            md1 = DPAtomicModel.deserialize(md0.serialize()).to(self.device)
-
-            # Test forward pass
-            args = [
-                torch.tensor(self.coord_ext, dtype=torch.float64, device=self.device),
-                torch.tensor(self.atype_ext, dtype=torch.int64, device=self.device),
-                torch.tensor(self.nlist, dtype=torch.int64, device=self.device),
-            ]
-            ret0 = md0.forward_common_atomic(*args)
-            ret1 = md1.forward_common_atomic(*args)
-            np.testing.assert_allclose(
-                ret0["energy"].detach().cpu().numpy(),
-                ret1["energy"].detach().cpu().numpy(),
-            )
-
-    def test_dp_consistency(self) -> None:
-        """Test numerical consistency between dpmodel and pt_expt atomic models."""
-        nf, nloc, nnei = self.nlist.shape
-        ds = DPDescrptSeA(
-            self.rcut,
-            self.rcut_smth,
-            self.sel,
-        )
-        ft = DPInvarFitting(
-            "energy",
-            self.nt,
-            ds.get_dim_out(),
-            1,
-            mixed_types=ds.mixed_types(),
-            seed=GLOBAL_SEED,
-        )
-        type_map = ["foo", "bar"]
-        md0 = DPDPAtomicModel(ds, ft, type_map=type_map)
-        md1 = DPAtomicModel.deserialize(md0.serialize()).to(self.device)
-
-        # dpmodel uses numpy arrays
-        args0 = [self.coord_ext, self.atype_ext, self.nlist]
-        # pt_expt uses torch tensors
-        args1 = [
-            torch.tensor(self.coord_ext, dtype=torch.float64, device=self.device),
-            torch.tensor(self.atype_ext, dtype=torch.int64, device=self.device),
-            torch.tensor(self.nlist, dtype=torch.int64, device=self.device),
-        ]
-        ret0 = md0.forward_common_atomic(*args0)
-        ret1 = md1.forward_common_atomic(*args1)
-        np.testing.assert_allclose(
-            ret0["energy"],
-            ret1["energy"].detach().cpu().numpy(),
-        )
-
-    def test_exportable(self) -> None:
-        """Test that pt_expt atomic model can be exported with torch.export."""
-        nf, nloc, nnei = self.nlist.shape
-        ds = DescrptSeA(
-            self.rcut,
-            self.rcut_smth,
-            self.sel,
-        ).to(self.device)
-        ft = InvarFitting(
-            "energy",
-            self.nt,
-            ds.get_dim_out(),
-            1,
-            mixed_types=ds.mixed_types(),
-            seed=GLOBAL_SEED,
-        ).to(self.device)
-        type_map = ["foo", "bar"]
-        md0 = DPAtomicModel(ds, ft, type_map=type_map).to(self.device)
-        md0 = md0.eval()
-
-        # Prepare inputs for export
-        coord = torch.tensor(self.coord_ext, dtype=torch.float64, device=self.device)
-        atype = torch.tensor(self.atype_ext, dtype=torch.int64, device=self.device)
-        nlist = torch.tensor(self.nlist, dtype=torch.int64, device=self.device)
-
-        # Test forward pass
-        ret0 = md0(coord, atype, nlist)
-        self.assertIn("energy", ret0)
-
-        # Test torch.export
-        # Use strict=False for now to handle dynamic shapes
-        exported = torch.export.export(
-            md0,
-            (coord, atype, nlist),
-            strict=False,
-        )
-        self.assertIsNotNone(exported)
-
-        # Test exported model produces same output
-        ret1 = exported.module()(coord, atype, nlist)
-        np.testing.assert_allclose(
-            ret0["energy"].detach().cpu().numpy(),
-            ret1["energy"].detach().cpu().numpy(),
-            rtol=1e-10,
-            atol=1e-10,
-        )
-
-    def test_excl_consistency(self) -> None:
-        """Test that exclusion masks work correctly after serialize/deserialize."""
-        type_map = ["foo", "bar"]
-
-        # test the case of exclusion
-        for atom_excl, pair_excl in itertools.product([[], [1]], [[], [[0, 1]]]):
-            ds = DescrptSeA(
-                self.rcut,
-                self.rcut_smth,
-                self.sel,
-            ).to(self.device)
-            ft = InvarFitting(
-                "energy",
-                self.nt,
-                ds.get_dim_out(),
-                1,
-                mixed_types=ds.mixed_types(),
-                seed=GLOBAL_SEED,
-            ).to(self.device)
-            md0 = DPAtomicModel(
-                ds,
-                ft,
-                type_map=type_map,
-            ).to(self.device)
-            md1 = DPAtomicModel.deserialize(md0.serialize()).to(self.device)
-
-            md0.reinit_atom_exclude(atom_excl)
-            md0.reinit_pair_exclude(pair_excl)
-            # hacking!
-            md1.descriptor.reinit_exclude(pair_excl)
-            md1.fitting.reinit_exclude(atom_excl)
-
-            # check energy consistency
-            args = [
-                torch.tensor(self.coord_ext, dtype=torch.float64, device=self.device),
-                torch.tensor(self.atype_ext, dtype=torch.int64, device=self.device),
-                torch.tensor(self.nlist, dtype=torch.int64, device=self.device),
-            ]
-            ret0 = md0.forward_common_atomic(*args)
-            ret1 = md1.forward_common_atomic(*args)
-            np.testing.assert_allclose(
-                ret0["energy"].detach().cpu().numpy(),
-                ret1["energy"].detach().cpu().numpy(),
-            )
-
-            # check output def
-            out_names = [vv.name for vv in md0.atomic_output_def().get_data().values()]
-            self.assertEqual(out_names, ["energy", "mask"])
-            if atom_excl != []:
-                for ii in md0.atomic_output_def().get_data().values():
-                    if ii.name == "mask":
-                        self.assertEqual(ii.shape, [1])
-                        self.assertFalse(ii.reducible)
-                        self.assertFalse(ii.r_differentiable)
-                        self.assertFalse(ii.c_differentiable)
-
-            # check mask
-            if atom_excl == []:
-                pass
-            elif atom_excl == [1]:
-                self.assertIn("mask", ret0.keys())
-                expected = np.array([1, 1, 0], dtype=int)
-                expected = np.concatenate(
-                    [expected, expected[self.perm[: self.nloc]]]
-                ).reshape(2, 3)
-                np.testing.assert_array_equal(
-                    ret0["mask"].detach().cpu().numpy(), expected
-                )
-            else:
-                raise ValueError(f"not expected atom_excl {atom_excl}")
-
-
-class TestDPAtomicModelVirtualConsistency(unittest.TestCase):
-    def setUp(self) -> None:
-        self.case0 = TestCaseSingleFrameWithNlist()
-        self.case1 = TestCaseSingleFrameWithNlistWithVirtual()
-        self.case0.setUp()
-        self.case1.setUp()
-        self.device = env.DEVICE
-
-    def test_virtual_consistency(self) -> None:
-        nf, _, _ = self.case0.nlist.shape
-        ds = DescrptSeA(
-            self.case0.rcut,
-            self.case0.rcut_smth,
-            self.case0.sel,
-        )
-        ft = InvarFitting(
-            "energy",
-            self.case0.nt,
-            ds.get_dim_out(),
-            1,
-            mixed_types=ds.mixed_types(),
-            seed=GLOBAL_SEED,
-        )
-        type_map = ["foo", "bar"]
-        md1 = DPAtomicModel(ds, ft, type_map=type_map).to(self.device)
-
-        args0 = [
-            torch.tensor(self.case0.coord_ext, dtype=torch.float64, device=self.device),
-            torch.tensor(self.case0.atype_ext, dtype=torch.int64, device=self.device),
-            torch.tensor(self.case0.nlist, dtype=torch.int64, device=self.device),
-        ]
-        args1 = [
-            torch.tensor(self.case1.coord_ext, dtype=torch.float64, device=self.device),
-            torch.tensor(self.case1.atype_ext, dtype=torch.int64, device=self.device),
-            torch.tensor(self.case1.nlist, dtype=torch.int64, device=self.device),
-        ]
-
-        ret0 = md1.forward_common_atomic(*args0)
-        ret1 = md1.forward_common_atomic(*args1)
-
-        for dd in range(self.case0.nf):
-            np.testing.assert_allclose(
-                ret0["energy"][dd].detach().cpu().numpy(),
-                ret1["energy"][dd, self.case1.get_real_mapping[dd], :]
-                .detach()
-                .cpu()
-                .numpy(),
-            )
-        expected_mask = np.array(
-            [
-                [1, 0, 1, 1],
-                [1, 1, 0, 1],
-            ]
-        )
-        np.testing.assert_equal(ret1["mask"].detach().cpu().numpy(), expected_mask)

From bf448acae4f3b03c27479c046b992f9406a077e3 Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Sun, 22 Feb 2026 23:55:33 +0800
Subject: [PATCH 07/63] add translated_output_def

---
 deepmd/pt_expt/model/dipole_model.py          | 18 ++++++
 deepmd/pt_expt/model/dos_model.py             | 10 ++++
 deepmd/pt_expt/model/dp_zbl_model.py          | 18 ++++++
 deepmd/pt_expt/model/ener_model.py            | 18 ++++++
 deepmd/pt_expt/model/polar_model.py           | 10 ++++
 deepmd/pt_expt/model/property_model.py        | 11 ++++
 source/tests/consistent/model/test_dipole.py  | 48 ++++++++++++++++
 source/tests/consistent/model/test_dos.py     | 49 ++++++++++++++++
 source/tests/consistent/model/test_dpa1.py    | 47 ++++++++++++++++
 source/tests/consistent/model/test_ener.py    | 10 +++-
 source/tests/consistent/model/test_polar.py   | 48 ++++++++++++++++
 .../tests/consistent/model/test_property.py   | 49 ++++++++++++++++
 .../tests/consistent/model/test_zbl_ener.py   | 56 +++++++++++++++++++
 13 files changed, 389 insertions(+), 3 deletions(-)

diff --git a/deepmd/pt_expt/model/dipole_model.py b/deepmd/pt_expt/model/dipole_model.py
index a2830be7a3..97a07e4968 100644
--- a/deepmd/pt_expt/model/dipole_model.py
+++ b/deepmd/pt_expt/model/dipole_model.py
@@ -95,6 +95,24 @@ def forward_lower(
             model_predict["mask"] = model_ret["mask"]
         return model_predict
 
+    def translated_output_def(self) -> dict[str, Any]:
+        out_def_data = self.model_output_def().get_data()
+        output_def = {
+            "dipole": out_def_data["dipole"],
+            "global_dipole": out_def_data["dipole_redu"],
+        }
+        if self.do_grad_r("dipole"):
+            output_def["force"] = out_def_data["dipole_derv_r"]
+            output_def["force"].squeeze(-2)
+        if self.do_grad_c("dipole"):
+            output_def["virial"] = out_def_data["dipole_derv_c_redu"]
+            output_def["virial"].squeeze(-2)
+            output_def["atom_virial"] = out_def_data["dipole_derv_c"]
+            output_def["atom_virial"].squeeze(-2)
+        if "mask" in out_def_data:
+            output_def["mask"] = out_def_data["mask"]
+        return output_def
+
     def forward_lower_exportable(
         self,
         extended_coord: torch.Tensor,
diff --git a/deepmd/pt_expt/model/dos_model.py b/deepmd/pt_expt/model/dos_model.py
index 82991cdb59..ebb35a7ebd 100644
--- a/deepmd/pt_expt/model/dos_model.py
+++ b/deepmd/pt_expt/model/dos_model.py
@@ -83,6 +83,16 @@ def forward_lower(
             model_predict["mask"] = model_ret["mask"]
         return model_predict
 
+    def translated_output_def(self) -> dict[str, Any]:
+        out_def_data = self.model_output_def().get_data()
+        output_def = {
+            "atom_dos": out_def_data["dos"],
+            "dos": out_def_data["dos_redu"],
+        }
+        if "mask" in out_def_data:
+            output_def["mask"] = out_def_data["mask"]
+        return output_def
+
     def forward_lower_exportable(
         self,
         extended_coord: torch.Tensor,
diff --git a/deepmd/pt_expt/model/dp_zbl_model.py b/deepmd/pt_expt/model/dp_zbl_model.py
index 83dbd900e3..7b86019345 100644
--- a/deepmd/pt_expt/model/dp_zbl_model.py
+++ b/deepmd/pt_expt/model/dp_zbl_model.py
@@ -97,6 +97,24 @@ def forward_lower(
             model_predict["mask"] = model_ret["mask"]
         return model_predict
 
+    def translated_output_def(self) -> dict[str, Any]:
+        out_def_data = self.model_output_def().get_data()
+        output_def = {
+            "atom_energy": out_def_data["energy"],
+            "energy": out_def_data["energy_redu"],
+        }
+        if self.do_grad_r("energy"):
+            output_def["force"] = out_def_data["energy_derv_r"]
+            output_def["force"].squeeze(-2)
+        if self.do_grad_c("energy"):
+            output_def["virial"] = out_def_data["energy_derv_c_redu"]
+            output_def["virial"].squeeze(-2)
+            output_def["atom_virial"] = out_def_data["energy_derv_c"]
+            output_def["atom_virial"].squeeze(-2)
+        if "mask" in out_def_data:
+            output_def["mask"] = out_def_data["mask"]
+        return output_def
+
     def forward_lower_exportable(
         self,
         extended_coord: torch.Tensor,
diff --git a/deepmd/pt_expt/model/ener_model.py b/deepmd/pt_expt/model/ener_model.py
index 0e5e81aebb..c0edb5ebfc 100644
--- a/deepmd/pt_expt/model/ener_model.py
+++ b/deepmd/pt_expt/model/ener_model.py
@@ -97,6 +97,24 @@ def forward_lower(
             model_predict["mask"] = model_ret["mask"]
         return model_predict
 
+    def translated_output_def(self) -> dict[str, Any]:
+        out_def_data = self.model_output_def().get_data()
+        output_def = {
+            "atom_energy": out_def_data["energy"],
+            "energy": out_def_data["energy_redu"],
+        }
+        if self.do_grad_r("energy"):
+            output_def["force"] = out_def_data["energy_derv_r"]
+            output_def["force"].squeeze(-2)
+        if self.do_grad_c("energy"):
+            output_def["virial"] = out_def_data["energy_derv_c_redu"]
+            output_def["virial"].squeeze(-2)
+            output_def["atom_virial"] = out_def_data["energy_derv_c"]
+            output_def["atom_virial"].squeeze(-2)
+        if "mask" in out_def_data:
+            output_def["mask"] = out_def_data["mask"]
+        return output_def
+
     def forward_lower_exportable(
         self,
         extended_coord: torch.Tensor,
diff --git a/deepmd/pt_expt/model/polar_model.py b/deepmd/pt_expt/model/polar_model.py
index 337c4771cd..72fa4bd209 100644
--- a/deepmd/pt_expt/model/polar_model.py
+++ b/deepmd/pt_expt/model/polar_model.py
@@ -83,6 +83,16 @@ def forward_lower(
             model_predict["mask"] = model_ret["mask"]
         return model_predict
 
+    def translated_output_def(self) -> dict[str, Any]:
+        out_def_data = self.model_output_def().get_data()
+        output_def = {
+            "polar": out_def_data["polarizability"],
+            "global_polar": out_def_data["polarizability_redu"],
+        }
+        if "mask" in out_def_data:
+            output_def["mask"] = out_def_data["mask"]
+        return output_def
+
     def forward_lower_exportable(
         self,
         extended_coord: torch.Tensor,
diff --git a/deepmd/pt_expt/model/property_model.py b/deepmd/pt_expt/model/property_model.py
index 61d99b3840..7a7077865e 100644
--- a/deepmd/pt_expt/model/property_model.py
+++ b/deepmd/pt_expt/model/property_model.py
@@ -89,6 +89,17 @@ def forward_lower(
             model_predict["mask"] = model_ret["mask"]
         return model_predict
 
+    def translated_output_def(self) -> dict[str, Any]:
+        out_def_data = self.model_output_def().get_data()
+        var_name = self.get_var_name()
+        output_def = {
+            f"atom_{var_name}": out_def_data[var_name],
+            var_name: out_def_data[f"{var_name}_redu"],
+        }
+        if "mask" in out_def_data:
+            output_def["mask"] = out_def_data["mask"]
+        return output_def
+
     def forward_lower_exportable(
         self,
         extended_coord: torch.Tensor,
diff --git a/source/tests/consistent/model/test_dipole.py b/source/tests/consistent/model/test_dipole.py
index e8de96a02d..7dd7f644cc 100644
--- a/source/tests/consistent/model/test_dipole.py
+++ b/source/tests/consistent/model/test_dipole.py
@@ -236,3 +236,51 @@ def test_atom_exclude_types(self):
         tf_obj = self.tf_class.deserialize(data, suffix=self.unique_id)
         pt_obj = self.pt_class.deserialize(data)
         self.assertEqual(tf_obj.get_sel_type(), pt_obj.get_sel_type())
+
+
+@unittest.skipUnless(INSTALLED_PT and INSTALLED_PT_EXPT, "PyTorch is not installed")
+class TestDipoleModelAPIs(unittest.TestCase):
+    """Test translated_output_def consistency across dp, pt, and pt_expt backends."""
+
+    def setUp(self) -> None:
+        data = model_args().normalize_value(
+            {
+                "type_map": ["O", "H"],
+                "descriptor": {
+                    "type": "se_e2_a",
+                    "sel": [20, 20],
+                    "rcut_smth": 1.8,
+                    "rcut": 6.0,
+                    "neuron": [2, 4, 8],
+                    "resnet_dt": False,
+                    "axis_neuron": 8,
+                    "precision": "float64",
+                    "type_one_side": True,
+                    "seed": 1,
+                },
+                "fitting_net": {
+                    "type": "dipole",
+                    "neuron": [4, 4, 4],
+                    "resnet_dt": True,
+                    "numb_fparam": 0,
+                    "precision": "float64",
+                    "seed": 1,
+                },
+            },
+            trim_pattern="_*",
+        )
+        self.dp_model = get_model_dp(data)
+        serialized = self.dp_model.serialize()
+        self.pt_model = DipoleModelPT.deserialize(serialized)
+        self.pt_expt_model = DipoleModelPTExpt.deserialize(serialized)
+
+    def test_translated_output_def(self) -> None:
+        """translated_output_def should return the same keys on dp, pt, and pt_expt."""
+        dp_def = self.dp_model.translated_output_def()
+        pt_def = self.pt_model.translated_output_def()
+        pt_expt_def = self.pt_expt_model.translated_output_def()
+        self.assertEqual(set(dp_def.keys()), set(pt_def.keys()))
+        self.assertEqual(set(dp_def.keys()), set(pt_expt_def.keys()))
+        for key in dp_def:
+            self.assertEqual(dp_def[key].shape, pt_def[key].shape)
+            self.assertEqual(dp_def[key].shape, pt_expt_def[key].shape)
diff --git a/source/tests/consistent/model/test_dos.py b/source/tests/consistent/model/test_dos.py
index 12472babb5..84437693d6 100644
--- a/source/tests/consistent/model/test_dos.py
+++ b/source/tests/consistent/model/test_dos.py
@@ -218,3 +218,52 @@ def extract_ret(self, ret: Any, backend) -> tuple[np.ndarray, ...]:
                 ret["atom_dos"].ravel(),
             )
         raise ValueError(f"Unknown backend: {backend}")
+
+
+@unittest.skipUnless(INSTALLED_PT and INSTALLED_PT_EXPT, "PyTorch is not installed")
+class TestDOSModelAPIs(unittest.TestCase):
+    """Test translated_output_def consistency across dp, pt, and pt_expt backends."""
+
+    def setUp(self) -> None:
+        data = model_args().normalize_value(
+            {
+                "type_map": ["O", "H"],
+                "descriptor": {
+                    "type": "se_e2_a",
+                    "sel": [20, 20],
+                    "rcut_smth": 1.8,
+                    "rcut": 6.0,
+                    "neuron": [2, 4, 8],
+                    "resnet_dt": False,
+                    "axis_neuron": 8,
+                    "precision": "float64",
+                    "type_one_side": True,
+                    "seed": 1,
+                },
+                "fitting_net": {
+                    "type": "dos",
+                    "numb_dos": 2,
+                    "neuron": [4, 4, 4],
+                    "resnet_dt": True,
+                    "numb_fparam": 0,
+                    "precision": "float64",
+                    "seed": 1,
+                },
+            },
+            trim_pattern="_*",
+        )
+        self.dp_model = get_model_dp(data)
+        serialized = self.dp_model.serialize()
+        self.pt_model = DOSModelPT.deserialize(serialized)
+        self.pt_expt_model = DOSModelPTExpt.deserialize(serialized)
+
+    def test_translated_output_def(self) -> None:
+        """translated_output_def should return the same keys on dp, pt, and pt_expt."""
+        dp_def = self.dp_model.translated_output_def()
+        pt_def = self.pt_model.translated_output_def()
+        pt_expt_def = self.pt_expt_model.translated_output_def()
+        self.assertEqual(set(dp_def.keys()), set(pt_def.keys()))
+        self.assertEqual(set(dp_def.keys()), set(pt_expt_def.keys()))
+        for key in dp_def:
+            self.assertEqual(dp_def[key].shape, pt_def[key].shape)
+            self.assertEqual(dp_def[key].shape, pt_expt_def[key].shape)
diff --git a/source/tests/consistent/model/test_dpa1.py b/source/tests/consistent/model/test_dpa1.py
index 1662da1ccd..b32570d024 100644
--- a/source/tests/consistent/model/test_dpa1.py
+++ b/source/tests/consistent/model/test_dpa1.py
@@ -271,3 +271,50 @@ def extract_ret(self, ret: Any, backend) -> tuple[np.ndarray, ...]:
                 ret["atom_virial"].ravel(),
             )
         raise ValueError(f"Unknown backend: {backend}")
+
+
+@unittest.skipUnless(INSTALLED_PT and INSTALLED_PT_EXPT, "PyTorch is not installed")
+class TestDPA1EnerModelAPIs(unittest.TestCase):
+    """Test translated_output_def consistency across dp, pt, and pt_expt backends."""
+
+    def setUp(self) -> None:
+        data = model_args().normalize_value(
+            {
+                "type_map": ["O", "H"],
+                "descriptor": {
+                    "type": "se_atten",
+                    "sel": 40,
+                    "rcut_smth": 0.50,
+                    "rcut": 6.00,
+                    "neuron": [3, 6],
+                    "resnet_dt": False,
+                    "axis_neuron": 2,
+                    "seed": 1,
+                    "attn": 128,
+                    "attn_layer": 0,
+                    "precision": "float64",
+                },
+                "fitting_net": {
+                    "neuron": [5, 5],
+                    "resnet_dt": True,
+                    "precision": "float64",
+                    "seed": 1,
+                },
+            },
+            trim_pattern="_*",
+        )
+        self.dp_model = get_model_dp(data)
+        serialized = self.dp_model.serialize()
+        self.pt_model = EnergyModelPT.deserialize(serialized)
+        self.pt_expt_model = EnergyModelPTExpt.deserialize(serialized)
+
+    def test_translated_output_def(self) -> None:
+        """translated_output_def should return the same keys on dp, pt, and pt_expt."""
+        dp_def = self.dp_model.translated_output_def()
+        pt_def = self.pt_model.translated_output_def()
+        pt_expt_def = self.pt_expt_model.translated_output_def()
+        self.assertEqual(set(dp_def.keys()), set(pt_def.keys()))
+        self.assertEqual(set(dp_def.keys()), set(pt_expt_def.keys()))
+        for key in dp_def:
+            self.assertEqual(dp_def[key].shape, pt_def[key].shape)
+            self.assertEqual(dp_def[key].shape, pt_expt_def[key].shape)
diff --git a/source/tests/consistent/model/test_ener.py b/source/tests/consistent/model/test_ener.py
index 0bb1c343bd..5eab6839ed 100644
--- a/source/tests/consistent/model/test_ener.py
+++ b/source/tests/consistent/model/test_ener.py
@@ -546,7 +546,7 @@ def extract_ret(self, ret: Any, backend) -> tuple[np.ndarray, ...]:
         raise ValueError(f"Unknown backend: {backend}")
 
 
-@unittest.skipUnless(INSTALLED_PT, "PyTorch is not installed")
+@unittest.skipUnless(INSTALLED_PT and INSTALLED_PT_EXPT, "PyTorch is not installed")
 class TestEnerModelAPIs(unittest.TestCase):
     """Test consistency of model-level APIs between pt and dpmodel backends.
 
@@ -584,10 +584,11 @@ def setUp(self) -> None:
             },
             trim_pattern="_*",
         )
-        # Build dpmodel first, then deserialize into pt to share weights
+        # Build dpmodel first, then deserialize into pt/pt_expt to share weights
         self.dp_model = get_model_dp(data)
         serialized = self.dp_model.serialize()
         self.pt_model = EnergyModelPT.deserialize(serialized)
+        self.pt_expt_model = EnergyModelPTExpt.deserialize(serialized)
 
         # Coords / atype / box
         self.coords = np.array(
@@ -643,12 +644,15 @@ def setUp(self) -> None:
         self.nlist = nlist
 
     def test_translated_output_def(self) -> None:
-        """translated_output_def should return the same keys on dp and pt."""
+        """translated_output_def should return the same keys on dp, pt, and pt_expt."""
         dp_def = self.dp_model.translated_output_def()
         pt_def = self.pt_model.translated_output_def()
+        pt_expt_def = self.pt_expt_model.translated_output_def()
         self.assertEqual(set(dp_def.keys()), set(pt_def.keys()))
+        self.assertEqual(set(dp_def.keys()), set(pt_expt_def.keys()))
         for key in dp_def:
             self.assertEqual(dp_def[key].shape, pt_def[key].shape)
+            self.assertEqual(dp_def[key].shape, pt_expt_def[key].shape)
 
     def test_get_descriptor(self) -> None:
         """get_descriptor should return a non-None object on both backends."""
diff --git a/source/tests/consistent/model/test_polar.py b/source/tests/consistent/model/test_polar.py
index 1389cb33d7..a8cd8c0ac6 100644
--- a/source/tests/consistent/model/test_polar.py
+++ b/source/tests/consistent/model/test_polar.py
@@ -230,3 +230,51 @@ def test_atom_exclude_types(self):
         tf_obj = self.tf_class.deserialize(data, suffix=self.unique_id)
         pt_obj = self.pt_class.deserialize(data)
         self.assertEqual(tf_obj.get_sel_type(), pt_obj.get_sel_type())
+
+
+@unittest.skipUnless(INSTALLED_PT and INSTALLED_PT_EXPT, "PyTorch is not installed")
+class TestPolarModelAPIs(unittest.TestCase):
+    """Test translated_output_def consistency across dp, pt, and pt_expt backends."""
+
+    def setUp(self) -> None:
+        data = model_args().normalize_value(
+            {
+                "type_map": ["O", "H"],
+                "descriptor": {
+                    "type": "se_e2_a",
+                    "sel": [20, 20],
+                    "rcut_smth": 1.8,
+                    "rcut": 6.0,
+                    "neuron": [2, 4, 8],
+                    "resnet_dt": False,
+                    "axis_neuron": 8,
+                    "precision": "float64",
+                    "type_one_side": True,
+                    "seed": 1,
+                },
+                "fitting_net": {
+                    "type": "polar",
+                    "neuron": [4, 4, 4],
+                    "resnet_dt": True,
+                    "numb_fparam": 0,
+                    "precision": "float64",
+                    "seed": 1,
+                },
+            },
+            trim_pattern="_*",
+        )
+        self.dp_model = get_model_dp(data)
+        serialized = self.dp_model.serialize()
+        self.pt_model = PolarModelPT.deserialize(serialized)
+        self.pt_expt_model = PolarModelPTExpt.deserialize(serialized)
+
+    def test_translated_output_def(self) -> None:
+        """translated_output_def should return the same keys on dp, pt, and pt_expt."""
+        dp_def = self.dp_model.translated_output_def()
+        pt_def = self.pt_model.translated_output_def()
+        pt_expt_def = self.pt_expt_model.translated_output_def()
+        self.assertEqual(set(dp_def.keys()), set(pt_def.keys()))
+        self.assertEqual(set(dp_def.keys()), set(pt_expt_def.keys()))
+        for key in dp_def:
+            self.assertEqual(dp_def[key].shape, pt_def[key].shape)
+            self.assertEqual(dp_def[key].shape, pt_expt_def[key].shape)
diff --git a/source/tests/consistent/model/test_property.py b/source/tests/consistent/model/test_property.py
index ca2507a980..2c4bf31114 100644
--- a/source/tests/consistent/model/test_property.py
+++ b/source/tests/consistent/model/test_property.py
@@ -215,3 +215,52 @@ def extract_ret(self, ret: Any, backend) -> tuple[np.ndarray, ...]:
                 ret[f"atom_{property_name}"].ravel(),
             )
         raise ValueError(f"Unknown backend: {backend}")
+
+
+@unittest.skipUnless(INSTALLED_PT and INSTALLED_PT_EXPT, "PyTorch is not installed")
+class TestPropertyModelAPIs(unittest.TestCase):
+    """Test translated_output_def consistency across dp, pt, and pt_expt backends."""
+
+    def setUp(self) -> None:
+        data = model_args().normalize_value(
+            {
+                "type_map": ["O", "H"],
+                "descriptor": {
+                    "type": "se_e2_a",
+                    "sel": [20, 20],
+                    "rcut_smth": 1.8,
+                    "rcut": 6.0,
+                    "neuron": [2, 4, 8],
+                    "resnet_dt": False,
+                    "axis_neuron": 8,
+                    "precision": "float64",
+                    "type_one_side": True,
+                    "seed": 1,
+                },
+                "fitting_net": {
+                    "type": "property",
+                    "neuron": [4, 4, 4],
+                    "property_name": "foo",
+                    "resnet_dt": True,
+                    "numb_fparam": 0,
+                    "precision": "float64",
+                    "seed": 1,
+                },
+            },
+            trim_pattern="_*",
+        )
+        self.dp_model = get_model_dp(data)
+        serialized = self.dp_model.serialize()
+        self.pt_model = PropertyModelPT.deserialize(serialized)
+        self.pt_expt_model = PropertyModelPTExpt.deserialize(serialized)
+
+    def test_translated_output_def(self) -> None:
+        """translated_output_def should return the same keys on dp, pt, and pt_expt."""
+        dp_def = self.dp_model.translated_output_def()
+        pt_def = self.pt_model.translated_output_def()
+        pt_expt_def = self.pt_expt_model.translated_output_def()
+        self.assertEqual(set(dp_def.keys()), set(pt_def.keys()))
+        self.assertEqual(set(dp_def.keys()), set(pt_expt_def.keys()))
+        for key in dp_def:
+            self.assertEqual(dp_def[key].shape, pt_def[key].shape)
+            self.assertEqual(dp_def[key].shape, pt_expt_def[key].shape)
diff --git a/source/tests/consistent/model/test_zbl_ener.py b/source/tests/consistent/model/test_zbl_ener.py
index d6ceba73d3..88bcd86b2e 100644
--- a/source/tests/consistent/model/test_zbl_ener.py
+++ b/source/tests/consistent/model/test_zbl_ener.py
@@ -248,3 +248,59 @@ def extract_ret(self, ret: Any, backend) -> tuple[np.ndarray, ...]:
                 ret["virial"].ravel(),
             )
         raise ValueError(f"Unknown backend: {backend}")
+
+
+@unittest.skipUnless(INSTALLED_PT and INSTALLED_PT_EXPT, "PyTorch is not installed")
+class TestZBLEnerModelAPIs(unittest.TestCase):
+    """Test translated_output_def consistency across dp, pt, and pt_expt backends."""
+
+    def setUp(self) -> None:
+        data = model_args().normalize_value(
+            {
+                "type_map": ["O", "H", "B"],
+                "use_srtab": f"{TESTS_DIR}/pt/water/data/zbl_tab_potential/H2O_tab_potential.txt",
+                "smin_alpha": 0.1,
+                "sw_rmin": 0.2,
+                "sw_rmax": 4.0,
+                "descriptor": {
+                    "type": "se_atten",
+                    "sel": 40,
+                    "rcut_smth": 0.5,
+                    "rcut": 4.0,
+                    "neuron": [3, 6],
+                    "axis_neuron": 2,
+                    "attn": 8,
+                    "attn_layer": 2,
+                    "attn_dotr": True,
+                    "attn_mask": False,
+                    "activation_function": "tanh",
+                    "scaling_factor": 1.0,
+                    "normalize": False,
+                    "temperature": 1.0,
+                    "set_davg_zero": True,
+                    "type_one_side": True,
+                    "seed": 1,
+                },
+                "fitting_net": {
+                    "neuron": [5, 5],
+                    "resnet_dt": True,
+                    "seed": 1,
+                },
+            },
+            trim_pattern="_*",
+        )
+        self.dp_model = get_model_dp(data)
+        serialized = self.dp_model.serialize()
+        self.pt_model = DPZBLModelPT.deserialize(serialized)
+        self.pt_expt_model = DPZBLModelPTExpt.deserialize(serialized)
+
+    def test_translated_output_def(self) -> None:
+        """translated_output_def should return the same keys on dp, pt, and pt_expt."""
+        dp_def = self.dp_model.translated_output_def()
+        pt_def = self.pt_model.translated_output_def()
+        pt_expt_def = self.pt_expt_model.translated_output_def()
+        self.assertEqual(set(dp_def.keys()), set(pt_def.keys()))
+        self.assertEqual(set(dp_def.keys()), set(pt_expt_def.keys()))
+        for key in dp_def:
+            self.assertEqual(dp_def[key].shape, pt_def[key].shape)
+            self.assertEqual(dp_def[key].shape, pt_expt_def[key].shape)

From 9572a041c4eb3807bcc35e570f507c0e04dd2ce8 Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Mon, 23 Feb 2026 00:08:34 +0800
Subject: [PATCH 08/63] base model registration

---
 deepmd/pt_expt/model/dipole_model.py   |  6 ++++--
 deepmd/pt_expt/model/dos_model.py      |  6 ++++--
 deepmd/pt_expt/model/dp_zbl_model.py   |  6 ++++--
 deepmd/pt_expt/model/ener_model.py     |  6 ++++--
 deepmd/pt_expt/model/model.py          | 24 ++++++++++++++++++++++++
 deepmd/pt_expt/model/polar_model.py    |  6 ++++--
 deepmd/pt_expt/model/property_model.py |  6 ++++--
 7 files changed, 48 insertions(+), 12 deletions(-)
 create mode 100644 deepmd/pt_expt/model/model.py

diff --git a/deepmd/pt_expt/model/dipole_model.py b/deepmd/pt_expt/model/dipole_model.py
index 97a07e4968..9341713fdc 100644
--- a/deepmd/pt_expt/model/dipole_model.py
+++ b/deepmd/pt_expt/model/dipole_model.py
@@ -18,13 +18,15 @@
 from .make_model import (
     make_model,
 )
+from .model import (
+    BaseModel,
+)
 
 DPDipoleModel_ = make_model(DPDipoleAtomicModel)
 
 
+@BaseModel.register("dipole")
 class DipoleModel(DPModelCommon, DPDipoleModel_):
-    model_type = "dipole"
-
     def __init__(
         self,
         *args: Any,
diff --git a/deepmd/pt_expt/model/dos_model.py b/deepmd/pt_expt/model/dos_model.py
index ebb35a7ebd..a34666ac2f 100644
--- a/deepmd/pt_expt/model/dos_model.py
+++ b/deepmd/pt_expt/model/dos_model.py
@@ -18,13 +18,15 @@
 from .make_model import (
     make_model,
 )
+from .model import (
+    BaseModel,
+)
 
 DPDOSModel_ = make_model(DPDOSAtomicModel)
 
 
+@BaseModel.register("dos")
 class DOSModel(DPModelCommon, DPDOSModel_):
-    model_type = "dos"
-
     def __init__(
         self,
         *args: Any,
diff --git a/deepmd/pt_expt/model/dp_zbl_model.py b/deepmd/pt_expt/model/dp_zbl_model.py
index 7b86019345..4d905d52de 100644
--- a/deepmd/pt_expt/model/dp_zbl_model.py
+++ b/deepmd/pt_expt/model/dp_zbl_model.py
@@ -18,13 +18,15 @@
 from .make_model import (
     make_model,
 )
+from .model import (
+    BaseModel,
+)
 
 DPZBLModel_ = make_model(DPZBLLinearEnergyAtomicModel)
 
 
+@BaseModel.register("zbl")
 class DPZBLModel(DPModelCommon, DPZBLModel_):
-    model_type = "zbl"
-
     def __init__(
         self,
         *args: Any,
diff --git a/deepmd/pt_expt/model/ener_model.py b/deepmd/pt_expt/model/ener_model.py
index c0edb5ebfc..78be0f7acd 100644
--- a/deepmd/pt_expt/model/ener_model.py
+++ b/deepmd/pt_expt/model/ener_model.py
@@ -18,13 +18,15 @@
 from .make_model import (
     make_model,
 )
+from .model import (
+    BaseModel,
+)
 
 DPEnergyModel_ = make_model(DPEnergyAtomicModel)
 
 
+@BaseModel.register("ener")
 class EnergyModel(DPModelCommon, DPEnergyModel_):
-    model_type = "ener"
-
     def __init__(
         self,
         *args: Any,
diff --git a/deepmd/pt_expt/model/model.py b/deepmd/pt_expt/model/model.py
new file mode 100644
index 0000000000..da3fc08418
--- /dev/null
+++ b/deepmd/pt_expt/model/model.py
@@ -0,0 +1,24 @@
+# SPDX-License-Identifier: LGPL-3.0-or-later
+from deepmd.dpmodel.model.base_model import (
+    make_base_model,
+)
+
+
+class BaseModel(make_base_model()):
+    """Base class for pt_expt models.
+
+    Provides the plugin registry so that model classes can be
+    registered with ``@BaseModel.register("ener")`` etc.
+
+    See Also
+    --------
+    deepmd.dpmodel.model.base_model.BaseBaseModel
+        Backend-independent BaseModel class.
+    """
+
+    def __init__(self) -> None:
+        self.model_def_script = ""
+
+    def get_model_def_script(self) -> str:
+        """Get the model definition script."""
+        return self.model_def_script
diff --git a/deepmd/pt_expt/model/polar_model.py b/deepmd/pt_expt/model/polar_model.py
index 72fa4bd209..68d247ff2b 100644
--- a/deepmd/pt_expt/model/polar_model.py
+++ b/deepmd/pt_expt/model/polar_model.py
@@ -18,13 +18,15 @@
 from .make_model import (
     make_model,
 )
+from .model import (
+    BaseModel,
+)
 
 DPPolarModel_ = make_model(DPPolarAtomicModel)
 
 
+@BaseModel.register("polar")
 class PolarModel(DPModelCommon, DPPolarModel_):
-    model_type = "polar"
-
     def __init__(
         self,
         *args: Any,
diff --git a/deepmd/pt_expt/model/property_model.py b/deepmd/pt_expt/model/property_model.py
index 7a7077865e..1813a11535 100644
--- a/deepmd/pt_expt/model/property_model.py
+++ b/deepmd/pt_expt/model/property_model.py
@@ -18,13 +18,15 @@
 from .make_model import (
     make_model,
 )
+from .model import (
+    BaseModel,
+)
 
 DPPropertyModel_ = make_model(DPPropertyAtomicModel)
 
 
+@BaseModel.register("property")
 class PropertyModel(DPModelCommon, DPPropertyModel_):
-    model_type = "property"
-
     def __init__(
         self,
         *args: Any,

From 0dcd03b6b4cc9908d7b89056d113dd7e264a4051 Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Mon, 23 Feb 2026 21:55:46 +0800
Subject: [PATCH 09/63] implement compute_or_load_stat

---
 .../dpmodel/atomic_model/base_atomic_model.py | 52 +++++++++++++++++++
 .../dpmodel/atomic_model/dp_atomic_model.py   | 35 +++++++++++++
 .../atomic_model/linear_atomic_model.py       | 38 ++++++++++++++
 .../atomic_model/pairtab_atomic_model.py      | 30 +++++++++++
 deepmd/dpmodel/model/make_model.py            | 20 +++++++
 5 files changed, 175 insertions(+)

diff --git a/deepmd/dpmodel/atomic_model/base_atomic_model.py b/deepmd/dpmodel/atomic_model/base_atomic_model.py
index 3c9c595221..748daad405 100644
--- a/deepmd/dpmodel/atomic_model/base_atomic_model.py
+++ b/deepmd/dpmodel/atomic_model/base_atomic_model.py
@@ -1,4 +1,5 @@
 # SPDX-License-Identifier: LGPL-3.0-or-later
+import functools
 import math
 from collections.abc import (
     Callable,
@@ -287,6 +288,57 @@ def compute_or_load_out_stat(
             bias_adjust_mode="set-by-statistic",
         )
 
+    def _make_wrapped_sampler(
+        self,
+        sampled_func: Callable[[], list[dict]],
+    ) -> Callable[[], list[dict]]:
+        """Wrap the sampled function with exclusion types and default fparam.
+
+        The returned callable is cached so that the sampling (which may be
+        expensive) is performed at most once.
+
+        Parameters
+        ----------
+        sampled_func
+            The lazy sampled function to get data frames from different data
+            systems.
+
+        Returns
+        -------
+        Callable[[], list[dict]]
+            A cached wrapper around *sampled_func* that additionally sets
+            ``pair_exclude_types``, ``atom_exclude_types`` and default
+            ``fparam`` on every sample dict when applicable.
+        """
+
+        @functools.lru_cache
+        def wrapped_sampler() -> list[dict]:
+            sampled = sampled_func()
+            if self.pair_excl is not None:
+                pair_exclude_types = self.pair_excl.get_exclude_types()
+                for sample in sampled:
+                    sample["pair_exclude_types"] = list(pair_exclude_types)
+            if self.atom_excl is not None:
+                atom_exclude_types = self.atom_excl.get_exclude_types()
+                for sample in sampled:
+                    sample["atom_exclude_types"] = list(atom_exclude_types)
+            if (
+                "find_fparam" not in sampled[0]
+                and "fparam" not in sampled[0]
+                and self.has_default_fparam()
+            ):
+                default_fparam = self.get_default_fparam()
+                if default_fparam is not None:
+                    default_fparam_np = np.array(default_fparam)
+                    for sample in sampled:
+                        nframe = sample["atype"].shape[0]
+                        sample["fparam"] = np.tile(
+                            default_fparam_np.reshape(1, -1), (nframe, 1)
+                        )
+            return sampled
+
+        return wrapped_sampler
+
     def change_out_bias(
         self,
         sample_merged: Callable[[], list[dict]] | list[dict],
diff --git a/deepmd/dpmodel/atomic_model/dp_atomic_model.py b/deepmd/dpmodel/atomic_model/dp_atomic_model.py
index 0f5b12bc9c..43dab66b7b 100644
--- a/deepmd/dpmodel/atomic_model/dp_atomic_model.py
+++ b/deepmd/dpmodel/atomic_model/dp_atomic_model.py
@@ -1,4 +1,7 @@
 # SPDX-License-Identifier: LGPL-3.0-or-later
+from collections.abc import (
+    Callable,
+)
 from typing import (
     Any,
 )
@@ -15,6 +18,9 @@
 from deepmd.dpmodel.output_def import (
     FittingOutputDef,
 )
+from deepmd.utils.path import (
+    DPPath,
+)
 from deepmd.utils.version import (
     check_version_compatibility,
 )
@@ -177,6 +183,35 @@ def forward_atomic(
         )
         return ret
 
+    def compute_or_load_stat(
+        self,
+        sampled_func: Callable[[], list[dict]],
+        stat_file_path: DPPath | None = None,
+        compute_or_load_out_stat: bool = True,
+    ) -> None:
+        """Compute or load the statistics parameters of the model,
+        such as mean and standard deviation of descriptors or the energy bias of the fitting net.
+
+        Parameters
+        ----------
+        sampled_func
+            The lazy sampled function to get data frames from different data systems.
+        stat_file_path
+            The path to the stat file.
+        compute_or_load_out_stat : bool
+            Whether to compute the output statistics.
+            If False, it will only compute the input statistics
+            (e.g. mean and standard deviation of descriptors).
+        """
+        if stat_file_path is not None and self.type_map is not None:
+            stat_file_path /= " ".join(self.type_map)
+
+        wrapped_sampler = self._make_wrapped_sampler(sampled_func)
+        self.descriptor.compute_input_stats(wrapped_sampler, stat_file_path)
+        self.fitting.compute_input_stats(wrapped_sampler)
+        if compute_or_load_out_stat:
+            self.compute_or_load_out_stat(wrapped_sampler, stat_file_path)
+
     def change_type_map(
         self, type_map: list[str], model_with_new_type_stat: Any | None = None
     ) -> None:
diff --git a/deepmd/dpmodel/atomic_model/linear_atomic_model.py b/deepmd/dpmodel/atomic_model/linear_atomic_model.py
index ce54a40333..cba3d923e5 100644
--- a/deepmd/dpmodel/atomic_model/linear_atomic_model.py
+++ b/deepmd/dpmodel/atomic_model/linear_atomic_model.py
@@ -1,4 +1,7 @@
 # SPDX-License-Identifier: LGPL-3.0-or-later
+from collections.abc import (
+    Callable,
+)
 from typing import (
     Any,
 )
@@ -17,6 +20,9 @@
 from deepmd.env import (
     GLOBAL_NP_FLOAT_PRECISION,
 )
+from deepmd.utils.path import (
+    DPPath,
+)
 from deepmd.utils.version import (
     check_version_compatibility,
 )
@@ -327,6 +333,38 @@ def deserialize(cls, data: dict) -> "LinearEnergyAtomicModel":
         data["models"] = models
         return super().deserialize(data)
 
+    def compute_or_load_stat(
+        self,
+        sampled_func: Callable[[], list[dict]],
+        stat_file_path: DPPath | None = None,
+        compute_or_load_out_stat: bool = True,
+    ) -> None:
+        """Compute or load the statistics parameters of the model.
+
+        For LinearEnergyAtomicModel, this first computes input stats for each
+        sub-model (without output stats), then computes its own output stats.
+
+        Parameters
+        ----------
+        sampled_func
+            The lazy sampled function to get data frames from different data systems.
+        stat_file_path
+            The path to the stat file.
+        compute_or_load_out_stat : bool
+            Whether to compute the output statistics.
+        """
+        for md in self.models:
+            md.compute_or_load_stat(
+                sampled_func, stat_file_path, compute_or_load_out_stat=False
+            )
+
+        if stat_file_path is not None and self.type_map is not None:
+            stat_file_path /= " ".join(self.type_map)
+
+        if compute_or_load_out_stat:
+            wrapped_sampler = self._make_wrapped_sampler(sampled_func)
+            self.compute_or_load_out_stat(wrapped_sampler, stat_file_path)
+
     def _compute_weight(
         self,
         extended_coord: Array,
diff --git a/deepmd/dpmodel/atomic_model/pairtab_atomic_model.py b/deepmd/dpmodel/atomic_model/pairtab_atomic_model.py
index ed063f4727..11156e9f93 100644
--- a/deepmd/dpmodel/atomic_model/pairtab_atomic_model.py
+++ b/deepmd/dpmodel/atomic_model/pairtab_atomic_model.py
@@ -1,4 +1,7 @@
 # SPDX-License-Identifier: LGPL-3.0-or-later
+from collections.abc import (
+    Callable,
+)
 from typing import (
     Any,
     NoReturn,
@@ -21,6 +24,9 @@
 from deepmd.utils.pair_tab import (
     PairTab,
 )
+from deepmd.utils.path import (
+    DPPath,
+)
 from deepmd.utils.version import (
     check_version_compatibility,
 )
@@ -199,6 +205,30 @@ def deserialize(cls, data: dict) -> "PairTabAtomicModel":
         tab_model.tab_data = tab.tab_data.reshape(ntypes, ntypes, nspline, 4)
         return tab_model
 
+    def compute_or_load_stat(
+        self,
+        sampled_func: Callable[[], list[dict]],
+        stat_file_path: DPPath | None = None,
+        compute_or_load_out_stat: bool = True,
+    ) -> None:
+        """Compute or load the statistics parameters of the model.
+
+        PairTabAtomicModel has no descriptor or fitting net input stats,
+        so this only computes output stats (energy bias) when requested.
+
+        Parameters
+        ----------
+        sampled_func
+            The lazy sampled function to get data frames from different data systems.
+        stat_file_path
+            The path to the stat file.
+        compute_or_load_out_stat : bool
+            Whether to compute the output statistics.
+        """
+        if compute_or_load_out_stat:
+            wrapped_sampler = self._make_wrapped_sampler(sampled_func)
+            self.compute_or_load_out_stat(wrapped_sampler, stat_file_path)
+
     def forward_atomic(
         self,
         extended_coord: Array,
diff --git a/deepmd/dpmodel/model/make_model.py b/deepmd/dpmodel/model/make_model.py
index 37da9cf056..1434ea5720 100644
--- a/deepmd/dpmodel/model/make_model.py
+++ b/deepmd/dpmodel/model/make_model.py
@@ -39,6 +39,9 @@
     nlist_distinguish_types,
     normalize_coord,
 )
+from deepmd.utils.path import (
+    DPPath,
+)
 
 from .transform_output import (
     communicate_extended_output,
@@ -684,6 +687,23 @@ def atomic_output_def(self) -> FittingOutputDef:
             """Get the output def of the atomic model."""
             return self.atomic_model.atomic_output_def()
 
+        def compute_or_load_stat(
+            self,
+            sampled_func: Callable[[], Any],
+            stat_file_path: DPPath | None = None,
+        ) -> None:
+            """Compute or load the statistics parameters of the model.
+
+            Parameters
+            ----------
+            sampled_func
+                The lazy sampled function to get data frames from different
+                data systems.
+            stat_file_path
+                The path to the stat file.
+            """
+            self.atomic_model.compute_or_load_stat(sampled_func, stat_file_path)
+
         def get_ntypes(self) -> int:
             """Get the number of types."""
             return len(self.get_type_map())

From 28fbd0887876f6827cbbc03d049b623cec1f0a44 Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Mon, 23 Feb 2026 22:20:28 +0800
Subject: [PATCH 10/63] fix bug in test_ener

---
 source/tests/consistent/model/test_ener.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/source/tests/consistent/model/test_ener.py b/source/tests/consistent/model/test_ener.py
index 5eab6839ed..faabb0fc1e 100644
--- a/source/tests/consistent/model/test_ener.py
+++ b/source/tests/consistent/model/test_ener.py
@@ -146,7 +146,7 @@ def get_reference_backend(self):
 
     @property
     def skip_tf(self):
-        return (
+        return not INSTALLED_TF or (
             self.data["pair_exclude_types"] != []
             or self.data["atom_exclude_types"] != []
         )

From 237e4a8afc7d6ad3ba425dbd429ac9c305b51a5e Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Mon, 23 Feb 2026 22:40:04 +0800
Subject: [PATCH 11/63] refact make_model, concrete models from different
 backends inherit from the base models of the corresponding backend

---
 deepmd/dpmodel/model/dipole_model.py   |  5 ++++-
 deepmd/dpmodel/model/dos_model.py      |  5 ++++-
 deepmd/dpmodel/model/dp_zbl_model.py   |  5 ++++-
 deepmd/dpmodel/model/ener_model.py     |  5 ++++-
 deepmd/dpmodel/model/make_model.py     | 17 ++++++++++-------
 deepmd/dpmodel/model/polar_model.py    |  5 ++++-
 deepmd/dpmodel/model/property_model.py |  5 ++++-
 deepmd/dpmodel/model/spin_model.py     |  2 +-
 deepmd/pt_expt/model/__init__.py       |  4 ++++
 deepmd/pt_expt/model/dipole_model.py   |  2 +-
 deepmd/pt_expt/model/dos_model.py      |  2 +-
 deepmd/pt_expt/model/dp_zbl_model.py   |  2 +-
 deepmd/pt_expt/model/ener_model.py     |  2 +-
 deepmd/pt_expt/model/make_model.py     | 11 +++++++++--
 deepmd/pt_expt/model/model.py          |  1 +
 deepmd/pt_expt/model/polar_model.py    |  2 +-
 deepmd/pt_expt/model/property_model.py |  2 +-
 17 files changed, 55 insertions(+), 22 deletions(-)

diff --git a/deepmd/dpmodel/model/dipole_model.py b/deepmd/dpmodel/model/dipole_model.py
index 421dd1b10f..9121321347 100644
--- a/deepmd/dpmodel/model/dipole_model.py
+++ b/deepmd/dpmodel/model/dipole_model.py
@@ -9,6 +9,9 @@
 from deepmd.dpmodel.atomic_model import (
     DPDipoleAtomicModel,
 )
+from deepmd.dpmodel.common import (
+    NativeOP,
+)
 from deepmd.dpmodel.model.base_model import (
     BaseModel,
 )
@@ -20,7 +23,7 @@
     make_model,
 )
 
-DPDipoleModel_ = make_model(DPDipoleAtomicModel)
+DPDipoleModel_ = make_model(DPDipoleAtomicModel, T_Bases=(NativeOP, BaseModel))
 
 
 @BaseModel.register("dipole")
diff --git a/deepmd/dpmodel/model/dos_model.py b/deepmd/dpmodel/model/dos_model.py
index dded7b076a..54a5ba0ed2 100644
--- a/deepmd/dpmodel/model/dos_model.py
+++ b/deepmd/dpmodel/model/dos_model.py
@@ -9,6 +9,9 @@
 from deepmd.dpmodel.atomic_model import (
     DPDOSAtomicModel,
 )
+from deepmd.dpmodel.common import (
+    NativeOP,
+)
 from deepmd.dpmodel.model.base_model import (
     BaseModel,
 )
@@ -20,7 +23,7 @@
     make_model,
 )
 
-DPDOSModel_ = make_model(DPDOSAtomicModel)
+DPDOSModel_ = make_model(DPDOSAtomicModel, T_Bases=(NativeOP, BaseModel))
 
 
 @BaseModel.register("dos")
diff --git a/deepmd/dpmodel/model/dp_zbl_model.py b/deepmd/dpmodel/model/dp_zbl_model.py
index 81c2476447..289d81473a 100644
--- a/deepmd/dpmodel/model/dp_zbl_model.py
+++ b/deepmd/dpmodel/model/dp_zbl_model.py
@@ -9,6 +9,9 @@
 from deepmd.dpmodel.atomic_model.linear_atomic_model import (
     DPZBLLinearEnergyAtomicModel,
 )
+from deepmd.dpmodel.common import (
+    NativeOP,
+)
 from deepmd.dpmodel.model.base_model import (
     BaseModel,
 )
@@ -23,7 +26,7 @@
     make_model,
 )
 
-DPZBLModel_ = make_model(DPZBLLinearEnergyAtomicModel)
+DPZBLModel_ = make_model(DPZBLLinearEnergyAtomicModel, T_Bases=(NativeOP, BaseModel))
 
 
 @BaseModel.register("zbl")
diff --git a/deepmd/dpmodel/model/ener_model.py b/deepmd/dpmodel/model/ener_model.py
index ac90d94fc5..ffeaf54779 100644
--- a/deepmd/dpmodel/model/ener_model.py
+++ b/deepmd/dpmodel/model/ener_model.py
@@ -12,6 +12,9 @@
 from deepmd.dpmodel.atomic_model import (
     DPEnergyAtomicModel,
 )
+from deepmd.dpmodel.common import (
+    NativeOP,
+)
 from deepmd.dpmodel.model.base_model import (
     BaseModel,
 )
@@ -26,7 +29,7 @@
     make_model,
 )
 
-DPEnergyModel_ = make_model(DPEnergyAtomicModel)
+DPEnergyModel_ = make_model(DPEnergyAtomicModel, T_Bases=(NativeOP, BaseModel))
 
 
 @BaseModel.register("ener")
diff --git a/deepmd/dpmodel/model/make_model.py b/deepmd/dpmodel/model/make_model.py
index 37da9cf056..3be4738fe6 100644
--- a/deepmd/dpmodel/model/make_model.py
+++ b/deepmd/dpmodel/model/make_model.py
@@ -20,12 +20,8 @@
     GLOBAL_NP_FLOAT_PRECISION,
     PRECISION_DICT,
     RESERVED_PRECISION_DICT,
-    NativeOP,
     get_xp_precision,
 )
-from deepmd.dpmodel.model.base_model import (
-    BaseModel,
-)
 from deepmd.dpmodel.output_def import (
     FittingOutputDef,
     ModelOutputDef,
@@ -138,7 +134,10 @@ def model_call_from_call_lower(
     return model_predict
 
 
-def make_model(T_AtomicModel: type[BaseAtomicModel]) -> type:
+def make_model(
+    T_AtomicModel: type[BaseAtomicModel],
+    T_Bases: tuple[type, ...] = (),
+) -> type:
     """Make a model as a derived class of an atomic model.
 
     The model provide two interfaces.
@@ -153,6 +152,9 @@ def make_model(T_AtomicModel: type[BaseAtomicModel]) -> type:
     ----------
     T_AtomicModel
         The atomic model.
+    T_Bases
+        Additional base classes for the returned model class.
+        Defaults to ``()``.  For example, dpmodel passes ``(NativeOP,)``.
 
     Returns
     -------
@@ -161,7 +163,7 @@ def make_model(T_AtomicModel: type[BaseAtomicModel]) -> type:
 
     """
 
-    class CM(NativeOP, BaseModel):
+    class CM(*T_Bases):
         def __init__(
             self,
             *args: Any,
@@ -169,7 +171,8 @@ def __init__(
             atomic_model_: T_AtomicModel | None = None,
             **kwargs: Any,
         ) -> None:
-            BaseModel.__init__(self)
+            self.model_def_script = ""
+            self.min_nbor_dist = None
             if atomic_model_ is not None:
                 self.atomic_model: T_AtomicModel = atomic_model_
             else:
diff --git a/deepmd/dpmodel/model/polar_model.py b/deepmd/dpmodel/model/polar_model.py
index 057410f280..ad5a47726e 100644
--- a/deepmd/dpmodel/model/polar_model.py
+++ b/deepmd/dpmodel/model/polar_model.py
@@ -9,6 +9,9 @@
 from deepmd.dpmodel.atomic_model import (
     DPPolarAtomicModel,
 )
+from deepmd.dpmodel.common import (
+    NativeOP,
+)
 from deepmd.dpmodel.model.base_model import (
     BaseModel,
 )
@@ -20,7 +23,7 @@
     make_model,
 )
 
-DPPolarModel_ = make_model(DPPolarAtomicModel)
+DPPolarModel_ = make_model(DPPolarAtomicModel, T_Bases=(NativeOP, BaseModel))
 
 
 @BaseModel.register("polar")
diff --git a/deepmd/dpmodel/model/property_model.py b/deepmd/dpmodel/model/property_model.py
index ea34609393..bc1657f0bd 100644
--- a/deepmd/dpmodel/model/property_model.py
+++ b/deepmd/dpmodel/model/property_model.py
@@ -9,6 +9,9 @@
 from deepmd.dpmodel.atomic_model import (
     DPPropertyAtomicModel,
 )
+from deepmd.dpmodel.common import (
+    NativeOP,
+)
 from deepmd.dpmodel.model.base_model import (
     BaseModel,
 )
@@ -23,7 +26,7 @@
     make_model,
 )
 
-DPPropertyModel_ = make_model(DPPropertyAtomicModel)
+DPPropertyModel_ = make_model(DPPropertyAtomicModel, T_Bases=(NativeOP, BaseModel))
 
 
 @BaseModel.register("property")
diff --git a/deepmd/dpmodel/model/spin_model.py b/deepmd/dpmodel/model/spin_model.py
index 85e23df3cc..482b61f7be 100644
--- a/deepmd/dpmodel/model/spin_model.py
+++ b/deepmd/dpmodel/model/spin_model.py
@@ -326,7 +326,7 @@ def serialize(self) -> dict:
 
     @classmethod
     def deserialize(cls, data: dict) -> "SpinModel":
-        backbone_model_obj = make_model(DPAtomicModel).deserialize(
+        backbone_model_obj = make_model(DPAtomicModel, T_Bases=(NativeOP,)).deserialize(
             data["backbone_model"]
         )
         spin = Spin.deserialize(data["spin"])
diff --git a/deepmd/pt_expt/model/__init__.py b/deepmd/pt_expt/model/__init__.py
index 858bdef6f7..da120091e0 100644
--- a/deepmd/pt_expt/model/__init__.py
+++ b/deepmd/pt_expt/model/__init__.py
@@ -11,6 +11,9 @@
 from .ener_model import (
     EnergyModel,
 )
+from .model import (
+    BaseModel,
+)
 from .polar_model import (
     PolarModel,
 )
@@ -19,6 +22,7 @@
 )
 
 __all__ = [
+    "BaseModel",
     "DOSModel",
     "DPZBLModel",
     "DipoleModel",
diff --git a/deepmd/pt_expt/model/dipole_model.py b/deepmd/pt_expt/model/dipole_model.py
index 9341713fdc..73ebba6bac 100644
--- a/deepmd/pt_expt/model/dipole_model.py
+++ b/deepmd/pt_expt/model/dipole_model.py
@@ -22,7 +22,7 @@
     BaseModel,
 )
 
-DPDipoleModel_ = make_model(DPDipoleAtomicModel)
+DPDipoleModel_ = make_model(DPDipoleAtomicModel, T_Bases=(BaseModel,))
 
 
 @BaseModel.register("dipole")
diff --git a/deepmd/pt_expt/model/dos_model.py b/deepmd/pt_expt/model/dos_model.py
index a34666ac2f..137c2b2901 100644
--- a/deepmd/pt_expt/model/dos_model.py
+++ b/deepmd/pt_expt/model/dos_model.py
@@ -22,7 +22,7 @@
     BaseModel,
 )
 
-DPDOSModel_ = make_model(DPDOSAtomicModel)
+DPDOSModel_ = make_model(DPDOSAtomicModel, T_Bases=(BaseModel,))
 
 
 @BaseModel.register("dos")
diff --git a/deepmd/pt_expt/model/dp_zbl_model.py b/deepmd/pt_expt/model/dp_zbl_model.py
index 4d905d52de..c4bb668353 100644
--- a/deepmd/pt_expt/model/dp_zbl_model.py
+++ b/deepmd/pt_expt/model/dp_zbl_model.py
@@ -22,7 +22,7 @@
     BaseModel,
 )
 
-DPZBLModel_ = make_model(DPZBLLinearEnergyAtomicModel)
+DPZBLModel_ = make_model(DPZBLLinearEnergyAtomicModel, T_Bases=(BaseModel,))
 
 
 @BaseModel.register("zbl")
diff --git a/deepmd/pt_expt/model/ener_model.py b/deepmd/pt_expt/model/ener_model.py
index 78be0f7acd..271028d2ff 100644
--- a/deepmd/pt_expt/model/ener_model.py
+++ b/deepmd/pt_expt/model/ener_model.py
@@ -22,7 +22,7 @@
     BaseModel,
 )
 
-DPEnergyModel_ = make_model(DPEnergyAtomicModel)
+DPEnergyModel_ = make_model(DPEnergyAtomicModel, T_Bases=(BaseModel,))
 
 
 @BaseModel.register("ener")
diff --git a/deepmd/pt_expt/model/make_model.py b/deepmd/pt_expt/model/make_model.py
index 2785fade14..56cabafe81 100644
--- a/deepmd/pt_expt/model/make_model.py
+++ b/deepmd/pt_expt/model/make_model.py
@@ -18,7 +18,10 @@
 )
 
 
-def make_model(T_AtomicModel: type[BaseAtomicModel]) -> type:
+def make_model(
+    T_AtomicModel: type[BaseAtomicModel],
+    T_Bases: tuple[type, ...] = (),
+) -> type:
     """Make a model as a derived class of an atomic model.
 
     Wraps dpmodel's make_model with torch.nn.Module and overrides
@@ -28,6 +31,10 @@ def make_model(T_AtomicModel: type[BaseAtomicModel]) -> type:
     ----------
     T_AtomicModel
         The atomic model.
+    T_Bases
+        Additional base classes for the returned model class.
+        For example, pass ``(BaseModel,)`` so that the concrete model
+        inherits the pt_expt ``BaseModel`` plugin registry.
 
     Returns
     -------
@@ -38,7 +45,7 @@ def make_model(T_AtomicModel: type[BaseAtomicModel]) -> type:
     DPModel = make_model_dp(T_AtomicModel)
 
     @torch_module
-    class CM(DPModel):
+    class CM(DPModel, *T_Bases):
         def forward(self, *args: Any, **kwargs: Any) -> dict[str, torch.Tensor]:
             """Default forward delegates to call().
 
diff --git a/deepmd/pt_expt/model/model.py b/deepmd/pt_expt/model/model.py
index da3fc08418..f7d8d86e14 100644
--- a/deepmd/pt_expt/model/model.py
+++ b/deepmd/pt_expt/model/model.py
@@ -18,6 +18,7 @@ class BaseModel(make_base_model()):
 
     def __init__(self) -> None:
         self.model_def_script = ""
+        self.min_nbor_dist = None
 
     def get_model_def_script(self) -> str:
         """Get the model definition script."""
diff --git a/deepmd/pt_expt/model/polar_model.py b/deepmd/pt_expt/model/polar_model.py
index 68d247ff2b..2bec72d4f7 100644
--- a/deepmd/pt_expt/model/polar_model.py
+++ b/deepmd/pt_expt/model/polar_model.py
@@ -22,7 +22,7 @@
     BaseModel,
 )
 
-DPPolarModel_ = make_model(DPPolarAtomicModel)
+DPPolarModel_ = make_model(DPPolarAtomicModel, T_Bases=(BaseModel,))
 
 
 @BaseModel.register("polar")
diff --git a/deepmd/pt_expt/model/property_model.py b/deepmd/pt_expt/model/property_model.py
index 1813a11535..50f8f0eeb4 100644
--- a/deepmd/pt_expt/model/property_model.py
+++ b/deepmd/pt_expt/model/property_model.py
@@ -22,7 +22,7 @@
     BaseModel,
 )
 
-DPPropertyModel_ = make_model(DPPropertyAtomicModel)
+DPPropertyModel_ = make_model(DPPropertyAtomicModel, T_Bases=(BaseModel,))
 
 
 @BaseModel.register("property")

From 2a958ec74c87c6c129a2b621e666a5b653df0898 Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Tue, 24 Feb 2026 00:38:32 +0800
Subject: [PATCH 12/63] Add compute_or_load_stat consistency tests and fix
 dpmodel backend bugs

  Add TestEnerComputeOrLoadStat to the consistency test framework, comparing
  dp, pt, and pt_expt backends after compute_or_load_stat. Tests cover
  descriptor stats, fparam/aparam fitting stats, output bias, and forward
  consistency, parameterized over exclusion types and fparam source
  (default injection vs explicit data). Both compute and load-from-file
  paths are tested.

  Three dpmodel bugs found and fixed:
  - repflows.py: compute_input_stats now respects set_stddev_constant,
    matching the pt backend behavior
  - stat.py: compute_output_stats_global now applies atom_exclude_types
    mask to natoms before computing output bias
  - general_fitting.py: compute_input_stats now supports save/load of
    fparam/aparam stats via stat_file_path, matching the pt backend
---
 .../dpmodel/atomic_model/dp_atomic_model.py   |   2 +-
 deepmd/dpmodel/descriptor/repflows.py         |   9 +-
 deepmd/dpmodel/fitting/general_fitting.py     | 136 +++++--
 deepmd/dpmodel/utils/stat.py                  |   9 +
 source/tests/consistent/model/test_ener.py    | 356 ++++++++++++++++++
 5 files changed, 477 insertions(+), 35 deletions(-)

diff --git a/deepmd/dpmodel/atomic_model/dp_atomic_model.py b/deepmd/dpmodel/atomic_model/dp_atomic_model.py
index 43dab66b7b..f110e58d2c 100644
--- a/deepmd/dpmodel/atomic_model/dp_atomic_model.py
+++ b/deepmd/dpmodel/atomic_model/dp_atomic_model.py
@@ -208,7 +208,7 @@ def compute_or_load_stat(
 
         wrapped_sampler = self._make_wrapped_sampler(sampled_func)
         self.descriptor.compute_input_stats(wrapped_sampler, stat_file_path)
-        self.fitting.compute_input_stats(wrapped_sampler)
+        self.fitting.compute_input_stats(wrapped_sampler, stat_file_path=stat_file_path)
         if compute_or_load_out_stat:
             self.compute_or_load_out_stat(wrapped_sampler, stat_file_path)
 
diff --git a/deepmd/dpmodel/descriptor/repflows.py b/deepmd/dpmodel/descriptor/repflows.py
index 3188bbfee5..d2fc06a478 100644
--- a/deepmd/dpmodel/descriptor/repflows.py
+++ b/deepmd/dpmodel/descriptor/repflows.py
@@ -438,6 +438,8 @@ def compute_input_stats(
             The path to the stat file.
 
         """
+        if self.set_stddev_constant and self.set_davg_zero:
+            return
         env_mat_stat = EnvMatStatSe(self)
         if path is not None:
             path = path / env_mat_stat.get_hash()
@@ -458,9 +460,10 @@ def compute_input_stats(
             self.mean = xp.asarray(
                 mean, dtype=self.mean.dtype, copy=True, device=device
             )
-        self.stddev = xp.asarray(
-            stddev, dtype=self.stddev.dtype, copy=True, device=device
-        )
+        if not self.set_stddev_constant:
+            self.stddev = xp.asarray(
+                stddev, dtype=self.stddev.dtype, copy=True, device=device
+            )
 
     def get_stats(self) -> dict[str, StatItem]:
         """Get the statistics of the descriptor."""
diff --git a/deepmd/dpmodel/fitting/general_fitting.py b/deepmd/dpmodel/fitting/general_fitting.py
index 260be619fd..d82421cc8d 100644
--- a/deepmd/dpmodel/fitting/general_fitting.py
+++ b/deepmd/dpmodel/fitting/general_fitting.py
@@ -35,10 +35,16 @@
 from deepmd.env import (
     GLOBAL_NP_FLOAT_PRECISION,
 )
+from deepmd.utils.env_mat_stat import (
+    StatItem,
+)
 from deepmd.utils.finetune import (
     get_index_between_two_maps,
     map_atom_exclude_types,
 )
+from deepmd.utils.path import (
+    DPPath,
+)
 
 from .base_fitting import (
     BaseFitting,
@@ -226,6 +232,7 @@ def compute_input_stats(
         self,
         merged: Callable[[], list[dict]] | list[dict],
         protection: float = 1e-2,
+        stat_file_path: DPPath | None = None,
     ) -> None:
         """
         Compute the input statistics (e.g. mean and stddev) for the fittings from packed data.
@@ -241,27 +248,48 @@ def compute_input_stats(
                 the lazy function helps by only sampling once.
         protection : float
             Divided-by-zero protection
+        stat_file_path : Optional[DPPath]
+            The path to the stat file.
         """
         if self.numb_fparam == 0 and self.numb_aparam == 0:
             # skip data statistics
             return
-        if callable(merged):
-            sampled = merged()
-        else:
-            sampled = merged
         # stat fparam
         if self.numb_fparam > 0:
-            cat_data = np.concatenate([frame["fparam"] for frame in sampled], axis=0)
-            cat_data = np.reshape(cat_data, [-1, self.numb_fparam])
-            fparam_avg = np.mean(cat_data, axis=0)
-            fparam_std = np.std(cat_data, axis=0, ddof=0)  # ddof=0 for population std
-            fparam_std = np.where(
-                fparam_std < protection,
-                np.array(protection, dtype=fparam_std.dtype),
-                fparam_std,
+            if (
+                stat_file_path is not None
+                and stat_file_path.is_dir()
+                and (stat_file_path / "fparam").is_file()
+            ):
+                fparam_stats = self._load_param_stats_from_file(
+                    stat_file_path, "fparam", self.numb_fparam
+                )
+            else:
+                sampled = merged() if callable(merged) else merged
+                cat_data = np.concatenate(
+                    [frame["fparam"] for frame in sampled], axis=0
+                )
+                cat_data = np.reshape(cat_data, [-1, self.numb_fparam])
+                fparam_stats = [
+                    StatItem(
+                        number=cat_data.shape[0],
+                        sum=np.sum(cat_data[:, ii]),
+                        squared_sum=np.sum(cat_data[:, ii] ** 2),
+                    )
+                    for ii in range(self.numb_fparam)
+                ]
+                if stat_file_path is not None:
+                    self._save_param_stats_to_file(
+                        stat_file_path, "fparam", fparam_stats
+                    )
+            fparam_avg = np.array(
+                [s.compute_avg() for s in fparam_stats], dtype=np.float64
+            )
+            fparam_std = np.array(
+                [s.compute_std(protection=protection) for s in fparam_stats],
+                dtype=np.float64,
             )
             fparam_inv_std = 1.0 / fparam_std
-            # Use array_api_compat to handle both numpy and torch
             xp = array_api_compat.array_namespace(self.fparam_avg)
             self.fparam_avg = xp.asarray(
                 fparam_avg,
@@ -275,26 +303,47 @@ def compute_input_stats(
             )
         # stat aparam
         if self.numb_aparam > 0:
-            sys_sumv = []
-            sys_sumv2 = []
-            sys_sumn = []
-            for ss_ in [frame["aparam"] for frame in sampled]:
-                ss = np.reshape(ss_, [-1, self.numb_aparam])
-                sys_sumv.append(np.sum(ss, axis=0))
-                sys_sumv2.append(np.sum(ss * ss, axis=0))
-                sys_sumn.append(ss.shape[0])
-            sumv = np.sum(np.stack(sys_sumv), axis=0)
-            sumv2 = np.sum(np.stack(sys_sumv2), axis=0)
-            sumn = sum(sys_sumn)
-            aparam_avg = sumv / sumn
-            aparam_std = np.sqrt(sumv2 / sumn - (sumv / sumn) ** 2)
-            aparam_std = np.where(
-                aparam_std < protection,
-                np.array(protection, dtype=aparam_std.dtype),
-                aparam_std,
+            if (
+                stat_file_path is not None
+                and stat_file_path.is_dir()
+                and (stat_file_path / "aparam").is_file()
+            ):
+                aparam_stats = self._load_param_stats_from_file(
+                    stat_file_path, "aparam", self.numb_aparam
+                )
+            else:
+                sampled = merged() if callable(merged) else merged
+                sys_sumv = []
+                sys_sumv2 = []
+                sys_sumn = []
+                for ss_ in [frame["aparam"] for frame in sampled]:
+                    ss = np.reshape(ss_, [-1, self.numb_aparam])
+                    sys_sumv.append(np.sum(ss, axis=0))
+                    sys_sumv2.append(np.sum(ss * ss, axis=0))
+                    sys_sumn.append(ss.shape[0])
+                sumv = np.sum(np.stack(sys_sumv), axis=0)
+                sumv2 = np.sum(np.stack(sys_sumv2), axis=0)
+                sumn = sum(sys_sumn)
+                aparam_stats = [
+                    StatItem(
+                        number=sumn,
+                        sum=sumv[ii],
+                        squared_sum=sumv2[ii],
+                    )
+                    for ii in range(self.numb_aparam)
+                ]
+                if stat_file_path is not None:
+                    self._save_param_stats_to_file(
+                        stat_file_path, "aparam", aparam_stats
+                    )
+            aparam_avg = np.array(
+                [s.compute_avg() for s in aparam_stats], dtype=np.float64
+            )
+            aparam_std = np.array(
+                [s.compute_std(protection=protection) for s in aparam_stats],
+                dtype=np.float64,
             )
             aparam_inv_std = 1.0 / aparam_std
-            # Use array_api_compat to handle both numpy and torch
             xp = array_api_compat.array_namespace(self.aparam_avg)
             self.aparam_avg = xp.asarray(
                 aparam_avg,
@@ -307,6 +356,31 @@ def compute_input_stats(
                 device=array_api_compat.device(self.aparam_inv_std),
             )
 
+    @staticmethod
+    def _save_param_stats_to_file(
+        stat_file_path: DPPath,
+        name: str,
+        stats: list[StatItem],
+    ) -> None:
+        stat_file_path.mkdir(exist_ok=True, parents=True)
+        fp = stat_file_path / name
+        arr = np.array([[s.number, s.sum, s.squared_sum] for s in stats])
+        fp.save_numpy(arr)
+
+    @staticmethod
+    def _load_param_stats_from_file(
+        stat_file_path: DPPath,
+        name: str,
+        numb: int,
+    ) -> list[StatItem]:
+        fp = stat_file_path / name
+        arr = fp.load_numpy()
+        assert arr.shape == (numb, 3)
+        return [
+            StatItem(number=arr[ii][0], sum=arr[ii][1], squared_sum=arr[ii][2])
+            for ii in range(numb)
+        ]
+
     @abstractmethod
     def _net_out_dim(self) -> int:
         """Set the FittingNet output dim."""
diff --git a/deepmd/dpmodel/utils/stat.py b/deepmd/dpmodel/utils/stat.py
index 1cbaad0275..29ea128a91 100644
--- a/deepmd/dpmodel/utils/stat.py
+++ b/deepmd/dpmodel/utils/stat.py
@@ -14,6 +14,9 @@
 from deepmd.dpmodel.common import (
     to_numpy_array,
 )
+from deepmd.dpmodel.utils.exclude_mask import (
+    AtomExcludeMask,
+)
 from deepmd.utils.out_stat import (
     compute_stats_do_not_distinguish_types,
     compute_stats_from_atomic,
@@ -360,6 +363,12 @@ def compute_output_stats_global(
     }
 
     natoms_key = "natoms"
+    for system in sampled:
+        if "atom_exclude_types" in system:
+            type_mask = AtomExcludeMask(
+                ntypes, system["atom_exclude_types"]
+            ).get_type_mask()
+            system[natoms_key][:, 2:] *= type_mask.reshape(1, -1)
     input_natoms = {
         kk: [
             to_numpy_array(sampled[idx][natoms_key])
diff --git a/source/tests/consistent/model/test_ener.py b/source/tests/consistent/model/test_ener.py
index faabb0fc1e..a791c8af41 100644
--- a/source/tests/consistent/model/test_ener.py
+++ b/source/tests/consistent/model/test_ener.py
@@ -1181,3 +1181,359 @@ def raise_error():
             np.testing.assert_allclose(
                 dp_bias_loaded, dp_bias_after, rtol=1e-10, atol=1e-10
             )
+
+
+def _compare_variables_recursive(
+    d1: dict, d2: dict, path: str = "", rtol: float = 1e-10, atol: float = 1e-10
+) -> None:
+    """Recursively compare ``@variables`` sections in two serialized dicts."""
+    for key in d1:
+        if key not in d2:
+            continue
+        child_path = f"{path}/{key}" if path else key
+        v1, v2 = d1[key], d2[key]
+        if key == "@variables" and isinstance(v1, dict) and isinstance(v2, dict):
+            for vk in v1:
+                if vk not in v2:
+                    continue
+                a1 = np.asarray(v1[vk]) if v1[vk] is not None else None
+                a2 = np.asarray(v2[vk]) if v2[vk] is not None else None
+                if a1 is None and a2 is None:
+                    continue
+                np.testing.assert_allclose(
+                    a1,
+                    a2,
+                    rtol=rtol,
+                    atol=atol,
+                    err_msg=f"@variables mismatch at {child_path}/{vk}",
+                )
+        elif isinstance(v1, dict) and isinstance(v2, dict):
+            _compare_variables_recursive(v1, v2, child_path, rtol, atol)
+
+
+@parameterized(
+    (([], []), ([[0, 1]], [1])),  # (pair_exclude_types, atom_exclude_types)
+    (False, True),  # fparam_in_data
+)
+@unittest.skipUnless(INSTALLED_PT and INSTALLED_PT_EXPT, "PT and PT_EXPT are required")
+class TestEnerComputeOrLoadStat(unittest.TestCase):
+    """Test that compute_or_load_stat produces identical statistics on dp, pt, and pt_expt.
+
+    Covers descriptor stats (dstd), fitting stats (fparam, aparam), and output bias.
+    Parameterized over exclusion types and whether fparam is explicitly provided or
+    injected via default_fparam.
+    """
+
+    def setUp(self) -> None:
+        (pair_exclude_types, atom_exclude_types), self.fparam_in_data = self.param
+        data = model_args().normalize_value(
+            {
+                "type_map": ["O", "H"],
+                "pair_exclude_types": pair_exclude_types,
+                "atom_exclude_types": atom_exclude_types,
+                "descriptor": {
+                    "type": "dpa3",
+                    "repflow": {
+                        "n_dim": 20,
+                        "e_dim": 10,
+                        "a_dim": 8,
+                        "nlayers": 3,
+                        "e_rcut": 6.0,
+                        "e_rcut_smth": 5.0,
+                        "e_sel": 10,
+                        "a_rcut": 4.0,
+                        "a_rcut_smth": 3.5,
+                        "a_sel": 8,
+                        "axis_neuron": 4,
+                        "update_angle": True,
+                        "update_style": "res_residual",
+                        "update_residual": 0.1,
+                        "update_residual_init": "const",
+                    },
+                    "precision": "float64",
+                    "seed": 1,
+                },
+                "fitting_net": {
+                    "neuron": [10, 10],
+                    "precision": "float64",
+                    "seed": 1,
+                    "numb_fparam": 2,
+                    "default_fparam": [0.5, -0.3],
+                    "numb_aparam": 3,
+                },
+            },
+            trim_pattern="_*",
+        )
+
+        # Save data for reuse in load-from-file test
+        self._model_data = data
+
+        # Build dp model, then deserialize into pt and pt_expt to share weights
+        self.dp_model = get_model_dp(data)
+        serialized = self.dp_model.serialize()
+        self.pt_model = EnergyModelPT.deserialize(serialized)
+        self.pt_expt_model = EnergyModelPTExpt.deserialize(serialized)
+
+        # Test coords / atype / box for forward evaluation
+        self.coords = np.array(
+            [
+                12.83,
+                2.56,
+                2.18,
+                12.09,
+                2.87,
+                2.74,
+                0.25,
+                3.32,
+                1.68,
+                3.36,
+                3.00,
+                1.81,
+                3.51,
+                2.51,
+                2.60,
+                4.27,
+                3.22,
+                1.56,
+            ],
+            dtype=GLOBAL_NP_FLOAT_PRECISION,
+        ).reshape(1, -1, 3)
+        self.atype = np.array([0, 1, 1, 0, 1, 1], dtype=np.int32).reshape(1, -1)
+        self.box = np.array(
+            [13.0, 0.0, 0.0, 0.0, 13.0, 0.0, 0.0, 0.0, 13.0],
+            dtype=GLOBAL_NP_FLOAT_PRECISION,
+        ).reshape(1, 9)
+
+        # Mock training data for compute_or_load_stat
+        natoms = 6
+        nframes = 3
+        rng = np.random.default_rng(42)
+        coords_stat = rng.normal(size=(nframes, natoms, 3)).astype(
+            GLOBAL_NP_FLOAT_PRECISION
+        )
+        atype_stat = np.array([[0, 0, 1, 1, 1, 1]] * nframes, dtype=np.int32)
+        box_stat = np.tile(
+            np.eye(3, dtype=GLOBAL_NP_FLOAT_PRECISION).reshape(1, 3, 3) * 13.0,
+            (nframes, 1, 1),
+        )
+        natoms_stat = np.array([[natoms, natoms, 2, 4]] * nframes, dtype=np.int32)
+        energy_stat = rng.normal(size=(nframes, 1)).astype(GLOBAL_NP_FLOAT_PRECISION)
+        aparam_stat = rng.normal(size=(nframes, natoms, 3)).astype(
+            GLOBAL_NP_FLOAT_PRECISION
+        )
+
+        # dp / pt_expt sample (numpy)
+        np_sample = {
+            "coord": coords_stat,
+            "atype": atype_stat,
+            "atype_ext": atype_stat,
+            "box": box_stat,
+            "natoms": natoms_stat,
+            "energy": energy_stat,
+            "find_energy": np.float32(1.0),
+            "aparam": aparam_stat,
+        }
+        # pt sample (torch tensors)
+        pt_sample = {
+            "coord": numpy_to_torch(coords_stat),
+            "atype": numpy_to_torch(atype_stat),
+            "atype_ext": numpy_to_torch(atype_stat),
+            "box": numpy_to_torch(box_stat),
+            "natoms": numpy_to_torch(natoms_stat),
+            "energy": numpy_to_torch(energy_stat),
+            "find_energy": np.float32(1.0),
+            "aparam": numpy_to_torch(aparam_stat),
+        }
+
+        if self.fparam_in_data:
+            fparam_stat = rng.normal(size=(nframes, 2)).astype(
+                GLOBAL_NP_FLOAT_PRECISION
+            )
+            np_sample["fparam"] = fparam_stat
+            pt_sample["fparam"] = numpy_to_torch(fparam_stat)
+            self.expected_fparam_avg = np.mean(fparam_stat, axis=0)
+        else:
+            # No fparam → _make_wrapped_sampler injects default_fparam
+            self.expected_fparam_avg = np.array([0.5, -0.3])
+
+        self.np_sampled = [np_sample]
+        self.pt_sampled = [pt_sample]
+
+        # aparam for forward evaluation (1 frame, 6 atoms, 3 aparam)
+        self.eval_aparam = rng.normal(size=(1, natoms, 3)).astype(
+            GLOBAL_NP_FLOAT_PRECISION
+        )
+
+    def _eval_dp(self) -> dict:
+        return self.dp_model(
+            self.coords, self.atype, box=self.box, aparam=self.eval_aparam
+        )
+
+    def _eval_pt(self) -> dict:
+        return {
+            kk: torch_to_numpy(vv)
+            for kk, vv in self.pt_model(
+                numpy_to_torch(self.coords),
+                numpy_to_torch(self.atype),
+                box=numpy_to_torch(self.box),
+                aparam=numpy_to_torch(self.eval_aparam),
+                do_atomic_virial=True,
+            ).items()
+        }
+
+    def _eval_pt_expt(self) -> dict:
+        coord_t = pt_expt_numpy_to_torch(self.coords)
+        coord_t.requires_grad_(True)
+        return {
+            k: v.detach().cpu().numpy()
+            for k, v in self.pt_expt_model(
+                coord_t,
+                pt_expt_numpy_to_torch(self.atype),
+                box=pt_expt_numpy_to_torch(self.box),
+                aparam=pt_expt_numpy_to_torch(self.eval_aparam),
+                do_atomic_virial=True,
+            ).items()
+        }
+
+    def test_compute_stat(self) -> None:
+        # 1. Pre-stat forward consistency
+        dp_ret0 = self._eval_dp()
+        pt_ret0 = self._eval_pt()
+        pe_ret0 = self._eval_pt_expt()
+        for key in ("energy", "atom_energy"):
+            np.testing.assert_allclose(
+                dp_ret0[key],
+                pt_ret0[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"Pre-stat dp vs pt mismatch in {key}",
+            )
+            np.testing.assert_allclose(
+                dp_ret0[key],
+                pe_ret0[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"Pre-stat dp vs pt_expt mismatch in {key}",
+            )
+
+        # 2. Run compute_or_load_stat on all three backends
+        self.dp_model.compute_or_load_stat(lambda: self.np_sampled)
+        self.pt_model.compute_or_load_stat(lambda: self.pt_sampled)
+        self.pt_expt_model.compute_or_load_stat(lambda: self.np_sampled)
+
+        # 3. Serialize all three and compare @variables
+        dp_ser = self.dp_model.serialize()
+        pt_ser = self.pt_model.serialize()
+        pe_ser = self.pt_expt_model.serialize()
+        _compare_variables_recursive(dp_ser, pt_ser)
+        _compare_variables_recursive(dp_ser, pe_ser)
+
+        # 4. Post-stat forward consistency
+        dp_ret1 = self._eval_dp()
+        pt_ret1 = self._eval_pt()
+        pe_ret1 = self._eval_pt_expt()
+        for key in ("energy", "atom_energy"):
+            np.testing.assert_allclose(
+                dp_ret1[key],
+                pt_ret1[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"Post-stat dp vs pt mismatch in {key}",
+            )
+            np.testing.assert_allclose(
+                dp_ret1[key],
+                pe_ret1[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"Post-stat dp vs pt_expt mismatch in {key}",
+            )
+
+        # 5. Non-triviality checks
+        fit_vars = dp_ser["fitting"]["@variables"]
+        # fparam stats were computed
+        fparam_avg = np.asarray(fit_vars["fparam_avg"])
+        self.assertFalse(
+            np.allclose(fparam_avg, 0.0),
+            "fparam_avg is still zero — fparam stats were not computed",
+        )
+        np.testing.assert_allclose(
+            fparam_avg,
+            self.expected_fparam_avg,
+            rtol=1e-10,
+            atol=1e-10,
+            err_msg="fparam_avg does not match expected values",
+        )
+        # aparam stats were computed
+        aparam_avg = np.asarray(fit_vars["aparam_avg"])
+        self.assertFalse(
+            np.allclose(aparam_avg, 0.0),
+            "aparam_avg is still zero — aparam stats were not computed",
+        )
+
+    def test_load_stat_from_file(self) -> None:
+        import tempfile
+        from pathlib import (
+            Path,
+        )
+
+        import h5py
+
+        from deepmd.utils.path import (
+            DPPath,
+        )
+
+        with tempfile.TemporaryDirectory() as tmpdir:
+            # Create separate stat files for each backend
+            dp_h5 = str((Path(tmpdir) / "dp_stat.h5").resolve())
+            pt_h5 = str((Path(tmpdir) / "pt_stat.h5").resolve())
+            pe_h5 = str((Path(tmpdir) / "pe_stat.h5").resolve())
+            for p in (dp_h5, pt_h5, pe_h5):
+                with h5py.File(p, "w"):
+                    pass
+
+            # 1. Compute stats and save to file
+            self.dp_model.compute_or_load_stat(
+                lambda: self.np_sampled, stat_file_path=DPPath(dp_h5, "a")
+            )
+            self.pt_model.compute_or_load_stat(
+                lambda: self.pt_sampled, stat_file_path=DPPath(pt_h5, "a")
+            )
+            self.pt_expt_model.compute_or_load_stat(
+                lambda: self.np_sampled, stat_file_path=DPPath(pe_h5, "a")
+            )
+
+            # Save the computed serializations as reference
+            dp_ser_computed = self.dp_model.serialize()
+            pt_ser_computed = self.pt_model.serialize()
+            pe_ser_computed = self.pt_expt_model.serialize()
+
+            # 2. Build fresh models from the same initial weights
+            dp_model2 = get_model_dp(self._model_data)
+            pt_model2 = EnergyModelPT.deserialize(dp_model2.serialize())
+            pe_model2 = EnergyModelPTExpt.deserialize(dp_model2.serialize())
+
+            # 3. Load stats from file (should NOT call the sampled func)
+            def raise_error():
+                raise RuntimeError("Should load from file, not recompute")
+
+            dp_model2.compute_or_load_stat(
+                raise_error, stat_file_path=DPPath(dp_h5, "a")
+            )
+            pt_model2.compute_or_load_stat(
+                raise_error, stat_file_path=DPPath(pt_h5, "a")
+            )
+            pe_model2.compute_or_load_stat(
+                raise_error, stat_file_path=DPPath(pe_h5, "a")
+            )
+
+            # 4. Loaded models should match the computed ones
+            dp_ser_loaded = dp_model2.serialize()
+            pt_ser_loaded = pt_model2.serialize()
+            pe_ser_loaded = pe_model2.serialize()
+            _compare_variables_recursive(dp_ser_computed, dp_ser_loaded)
+            _compare_variables_recursive(pt_ser_computed, pt_ser_loaded)
+            _compare_variables_recursive(pe_ser_computed, pe_ser_loaded)
+
+            # 5. Cross-backend consistency after loading
+            _compare_variables_recursive(dp_ser_loaded, pt_ser_loaded)
+            _compare_variables_recursive(dp_ser_loaded, pe_ser_loaded)

From 41af95950b005859d989730306aca66e2ff433fc Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Tue, 24 Feb 2026 08:46:04 +0800
Subject: [PATCH 13/63] rm tmp test files

---
 source/tests/consistent/model/test_frozen.py | 6 ++++++
 1 file changed, 6 insertions(+)

diff --git a/source/tests/consistent/model/test_frozen.py b/source/tests/consistent/model/test_frozen.py
index d7dfcfe735..d2c33f3cd9 100644
--- a/source/tests/consistent/model/test_frozen.py
+++ b/source/tests/consistent/model/test_frozen.py
@@ -1,5 +1,7 @@
 # SPDX-License-Identifier: LGPL-3.0-or-later
+import glob
 import os
+import tempfile
 import unittest
 from typing import (
     Any,
@@ -57,6 +59,10 @@ def tearDownModule() -> None:
             os.remove(model_file)
         except FileNotFoundError:
             pass
+    # Clean up temporary .pb files created by TF FrozenModel
+    # (tempfile.NamedTemporaryFile(suffix=".pb", dir=os.curdir, delete=False))
+    for tmp_pb in glob.glob(tempfile.gettempprefix() + "*.pb"):
+        os.remove(tmp_pb)
 
 
 @parameterized((pt_model, tf_model, dp_model))

From 5a4a5d2649914c34932da00c744d0a8f5d9c54a9 Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Tue, 24 Feb 2026 09:33:23 +0800
Subject: [PATCH 14/63] remove concrete methods and data from BaseModel

---
 deepmd/dpmodel/model/base_model.py | 11 +++--------
 deepmd/dpmodel/model/make_model.py |  8 ++++++++
 deepmd/pt_expt/model/model.py      |  8 +-------
 3 files changed, 12 insertions(+), 15 deletions(-)

diff --git a/deepmd/dpmodel/model/base_model.py b/deepmd/dpmodel/model/base_model.py
index 163cd62387..b8efac8977 100644
--- a/deepmd/dpmodel/model/base_model.py
+++ b/deepmd/dpmodel/model/base_model.py
@@ -142,9 +142,10 @@ def get_model_def_script(self) -> str:
             """Get the model definition script."""
             pass
 
+        @abstractmethod
         def get_min_nbor_dist(self) -> float | None:
             """Get the minimum distance between two atoms."""
-            return self.min_nbor_dist
+            pass
 
         @abstractmethod
         def get_nnei(self) -> int:
@@ -255,10 +256,4 @@ class BaseModel(make_base_model()):
         Backend-independent BaseModel class.
     """
 
-    def __init__(self) -> None:
-        self.model_def_script = ""
-        self.min_nbor_dist = None
-
-    def get_model_def_script(self) -> str:
-        """Get the model definition script."""
-        return self.model_def_script
+    pass
diff --git a/deepmd/dpmodel/model/make_model.py b/deepmd/dpmodel/model/make_model.py
index f5387d7221..ae8d0de1cb 100644
--- a/deepmd/dpmodel/model/make_model.py
+++ b/deepmd/dpmodel/model/make_model.py
@@ -707,6 +707,14 @@ def compute_or_load_stat(
             """
             self.atomic_model.compute_or_load_stat(sampled_func, stat_file_path)
 
+        def get_model_def_script(self) -> str:
+            """Get the model definition script."""
+            return self.model_def_script
+
+        def get_min_nbor_dist(self) -> float | None:
+            """Get the minimum distance between two atoms."""
+            return self.min_nbor_dist
+
         def get_ntypes(self) -> int:
             """Get the number of types."""
             return len(self.get_type_map())
diff --git a/deepmd/pt_expt/model/model.py b/deepmd/pt_expt/model/model.py
index f7d8d86e14..83842eaabd 100644
--- a/deepmd/pt_expt/model/model.py
+++ b/deepmd/pt_expt/model/model.py
@@ -16,10 +16,4 @@ class BaseModel(make_base_model()):
         Backend-independent BaseModel class.
     """
 
-    def __init__(self) -> None:
-        self.model_def_script = ""
-        self.min_nbor_dist = None
-
-    def get_model_def_script(self) -> str:
-        """Get the model definition script."""
-        return self.model_def_script
+    pass

From 19f905872393ca47c82ee812cf5f36415a5c31bb Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Tue, 24 Feb 2026 09:43:31 +0800
Subject: [PATCH 15/63] rm model_type

---
 deepmd/dpmodel/model/dipole_model.py | 2 --
 deepmd/dpmodel/model/dos_model.py    | 2 --
 deepmd/dpmodel/model/dp_zbl_model.py | 2 --
 deepmd/dpmodel/model/polar_model.py  | 2 --
 4 files changed, 8 deletions(-)

diff --git a/deepmd/dpmodel/model/dipole_model.py b/deepmd/dpmodel/model/dipole_model.py
index 9121321347..fa5a76e0af 100644
--- a/deepmd/dpmodel/model/dipole_model.py
+++ b/deepmd/dpmodel/model/dipole_model.py
@@ -28,8 +28,6 @@
 
 @BaseModel.register("dipole")
 class DipoleModel(DPModelCommon, DPDipoleModel_):
-    model_type = "dipole"
-
     def __init__(
         self,
         *args: Any,
diff --git a/deepmd/dpmodel/model/dos_model.py b/deepmd/dpmodel/model/dos_model.py
index 54a5ba0ed2..b75c9a2bcc 100644
--- a/deepmd/dpmodel/model/dos_model.py
+++ b/deepmd/dpmodel/model/dos_model.py
@@ -28,8 +28,6 @@
 
 @BaseModel.register("dos")
 class DOSModel(DPModelCommon, DPDOSModel_):
-    model_type = "dos"
-
     def __init__(
         self,
         *args: Any,
diff --git a/deepmd/dpmodel/model/dp_zbl_model.py b/deepmd/dpmodel/model/dp_zbl_model.py
index 289d81473a..d864b3b61e 100644
--- a/deepmd/dpmodel/model/dp_zbl_model.py
+++ b/deepmd/dpmodel/model/dp_zbl_model.py
@@ -31,8 +31,6 @@
 
 @BaseModel.register("zbl")
 class DPZBLModel(DPZBLModel_):
-    model_type = "zbl"
-
     def __init__(
         self,
         *args: Any,
diff --git a/deepmd/dpmodel/model/polar_model.py b/deepmd/dpmodel/model/polar_model.py
index ad5a47726e..5031166a5e 100644
--- a/deepmd/dpmodel/model/polar_model.py
+++ b/deepmd/dpmodel/model/polar_model.py
@@ -28,8 +28,6 @@
 
 @BaseModel.register("polar")
 class PolarModel(DPModelCommon, DPPolarModel_):
-    model_type = "polar"
-
     def __init__(
         self,
         *args: Any,

From 26b0a40e1b63c6e6940d18b8302eac5b8a12f174 Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Tue, 24 Feb 2026 09:46:05 +0800
Subject: [PATCH 16/63] fix spin model

---
 deepmd/dpmodel/model/spin_model.py | 9 ++++++---
 1 file changed, 6 insertions(+), 3 deletions(-)

diff --git a/deepmd/dpmodel/model/spin_model.py b/deepmd/dpmodel/model/spin_model.py
index 482b61f7be..b72acf5ce5 100644
--- a/deepmd/dpmodel/model/spin_model.py
+++ b/deepmd/dpmodel/model/spin_model.py
@@ -17,6 +17,9 @@
 from deepmd.dpmodel.common import (
     NativeOP,
 )
+from deepmd.dpmodel.model.base_model import (
+    BaseModel,
+)
 from deepmd.dpmodel.model.make_model import (
     make_model,
 )
@@ -326,9 +329,9 @@ def serialize(self) -> dict:
 
     @classmethod
     def deserialize(cls, data: dict) -> "SpinModel":
-        backbone_model_obj = make_model(DPAtomicModel, T_Bases=(NativeOP,)).deserialize(
-            data["backbone_model"]
-        )
+        backbone_model_obj = make_model(
+            DPAtomicModel, T_Bases=(NativeOP, BaseModel)
+        ).deserialize(data["backbone_model"])
         spin = Spin.deserialize(data["spin"])
         return cls(
             backbone_model=backbone_model_obj,

From eecd82bef299aad2b1b234fdae797013c8d74353 Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Tue, 24 Feb 2026 12:12:44 +0800
Subject: [PATCH 17/63] add get_observed_type_list to abstract API and
 implement in dpmodel

  Move get_observed_type_list from a PT-only method to a backend-independent
  abstract API on BaseBaseModel, with a concrete implementation in dpmodel's
  make_model CM using array_api_compat for torch compatibility. Add a
  cross-backend consistency test that verifies dp, pt, and pt_expt return
  identical results when only a subset of types is observed.
---
 deepmd/dpmodel/model/base_model.py         | 11 +++++
 deepmd/dpmodel/model/make_model.py         | 19 ++++++++
 source/tests/consistent/model/test_ener.py | 51 ++++++++++++++++++++++
 3 files changed, 81 insertions(+)

diff --git a/deepmd/dpmodel/model/base_model.py b/deepmd/dpmodel/model/base_model.py
index b8efac8977..d87c0eb5b7 100644
--- a/deepmd/dpmodel/model/base_model.py
+++ b/deepmd/dpmodel/model/base_model.py
@@ -191,6 +191,17 @@ def update_sel(
             cls = cls.get_class_by_type(model_type)
             return cls.update_sel(train_data, type_map, local_jdata)
 
+        @abstractmethod
+        def get_observed_type_list(self) -> list[str]:
+            """Get observed types (elements) of the model during data statistics.
+
+            Returns
+            -------
+            list[str]
+                A list of the observed type names in this model.
+            """
+            pass
+
         def enable_compression(
             self,
             table_extrapolate: float = 5,
diff --git a/deepmd/dpmodel/model/make_model.py b/deepmd/dpmodel/model/make_model.py
index ae8d0de1cb..debab272f3 100644
--- a/deepmd/dpmodel/model/make_model.py
+++ b/deepmd/dpmodel/model/make_model.py
@@ -378,6 +378,25 @@ def get_out_bias(self) -> Array:
             """Get the output bias."""
             return self.atomic_model.out_bias
 
+        def get_observed_type_list(self) -> list[str]:
+            """Get observed types (elements) of the model during data statistics.
+
+            Returns
+            -------
+            list[str]
+                A list of the observed type names in this model.
+            """
+            type_map = self.get_type_map()
+            out_bias = self.get_out_bias()[0]
+            assert out_bias is not None, "No out_bias found in the model."
+            assert out_bias.ndim == 2, "The supported out_bias should be a 2D array."
+            assert out_bias.shape[0] == len(type_map), (
+                "The out_bias shape does not match the type_map length."
+            )
+            xp = array_api_compat.array_namespace(out_bias)
+            bias_mask = xp.any(xp.abs(out_bias) > 1e-6, axis=-1)
+            return [type_map[i] for i in range(len(type_map)) if bias_mask[i]]
+
         def set_out_bias(self, out_bias: Array) -> None:
             """Set the output bias."""
             self.atomic_model.out_bias = out_bias
diff --git a/source/tests/consistent/model/test_ener.py b/source/tests/consistent/model/test_ener.py
index a791c8af41..40c34a8836 100644
--- a/source/tests/consistent/model/test_ener.py
+++ b/source/tests/consistent/model/test_ener.py
@@ -1182,6 +1182,57 @@ def raise_error():
                 dp_bias_loaded, dp_bias_after, rtol=1e-10, atol=1e-10
             )
 
+    def test_get_observed_type_list(self) -> None:
+        """get_observed_type_list should be consistent across dp, pt, pt_expt.
+
+        Uses mock data containing only type 0 ("O") so that type 1 ("H") is
+        unobserved and should be absent from the returned list.
+        """
+        nframes = 2
+        natoms = 6
+        # All atoms are type 0 — type 1 is unobserved
+        atype_2f = np.zeros((nframes, natoms), dtype=np.int32)
+        coords_2f = np.tile(self.coords, (nframes, 1, 1))
+        box_2f = np.tile(self.box.reshape(1, 3, 3), (nframes, 1, 1))
+        natoms_data = np.array([[natoms, natoms, natoms, 0]] * nframes, dtype=np.int32)
+        energy_data = np.array([10.0, 20.0]).reshape(nframes, 1)
+
+        dp_merged = [
+            {
+                "coord": coords_2f,
+                "atype": atype_2f,
+                "atype_ext": atype_2f,
+                "box": box_2f,
+                "natoms": natoms_data,
+                "energy": energy_data,
+                "find_energy": np.float32(1.0),
+            }
+        ]
+        pt_merged = [
+            {
+                "coord": numpy_to_torch(coords_2f),
+                "atype": numpy_to_torch(atype_2f),
+                "atype_ext": numpy_to_torch(atype_2f),
+                "box": numpy_to_torch(box_2f),
+                "natoms": numpy_to_torch(natoms_data),
+                "energy": numpy_to_torch(energy_data),
+                "find_energy": np.float32(1.0),
+            }
+        ]
+
+        self.dp_model.atomic_model.compute_or_load_out_stat(dp_merged)
+        self.pt_model.atomic_model.compute_or_load_out_stat(pt_merged)
+        self.pt_expt_model.atomic_model.compute_or_load_out_stat(dp_merged)
+
+        dp_observed = self.dp_model.get_observed_type_list()
+        pt_observed = self.pt_model.get_observed_type_list()
+        pe_observed = self.pt_expt_model.get_observed_type_list()
+
+        self.assertEqual(dp_observed, pt_observed)
+        self.assertEqual(dp_observed, pe_observed)
+        # Only type 0 ("O") should be observed
+        self.assertEqual(dp_observed, ["O"])
+
 
 def _compare_variables_recursive(
     d1: dict, d2: dict, path: str = "", rtol: float = 1e-10, atol: float = 1e-10

From aba2d71264f142dd7034ec28079562b439670a1e Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Tue, 24 Feb 2026 13:28:24 +0800
Subject: [PATCH 18/63] fix: dpmodel change_type_map drops
 model_with_new_type_stat and uses bare np ops

  dpmodel's model-level change_type_map was not forwarding
  model_with_new_type_stat to the atomic model, so fine-tuning with new
  atom types would silently lose reference statistics. Align with the pt
  backend by unwrapping .atomic_model and passing it through.

  Also fix array API violations in fitting change_type_map methods:
  np.zeros/np.ones/np.concatenate fail when arrays are torch tensors
  (pt_expt backend). Replace with xp.zeros/xp.ones/xp.concat using
  proper array namespace and device.

  Add cross-backend test (test_change_type_map_extend_stat) that
  exercises the model-level change_type_map with
  model_with_new_type_stat across dp, pt, and pt_expt.
---
 deepmd/dpmodel/fitting/general_fitting.py     |   9 +-
 .../dpmodel/fitting/polarizability_fitting.py |  17 ++-
 deepmd/dpmodel/model/make_model.py            |   9 +-
 source/tests/consistent/model/test_ener.py    | 116 ++++++++++++++++++
 4 files changed, 141 insertions(+), 10 deletions(-)

diff --git a/deepmd/dpmodel/fitting/general_fitting.py b/deepmd/dpmodel/fitting/general_fitting.py
index d82421cc8d..c7372f05ac 100644
--- a/deepmd/dpmodel/fitting/general_fitting.py
+++ b/deepmd/dpmodel/fitting/general_fitting.py
@@ -437,11 +437,14 @@ def change_type_map(
         self.ntypes = len(type_map)
         self.reinit_exclude(map_atom_exclude_types(self.exclude_types, remap_index))
         if has_new_type:
+            xp = array_api_compat.array_namespace(self.bias_atom_e)
             extend_shape = [len(type_map), *list(self.bias_atom_e.shape[1:])]
-            extend_bias_atom_e = np.zeros(extend_shape, dtype=self.bias_atom_e.dtype)
-            self.bias_atom_e = np.concatenate(
-                [self.bias_atom_e, extend_bias_atom_e], axis=0
+            extend_bias_atom_e = xp.zeros(
+                extend_shape,
+                dtype=self.bias_atom_e.dtype,
+                device=array_api_compat.device(self.bias_atom_e),
             )
+            self.bias_atom_e = xp.concat([self.bias_atom_e, extend_bias_atom_e], axis=0)
         self.bias_atom_e = self.bias_atom_e[remap_index]
 
     def __setitem__(self, key: str, value: Any) -> None:
diff --git a/deepmd/dpmodel/fitting/polarizability_fitting.py b/deepmd/dpmodel/fitting/polarizability_fitting.py
index dff86f04cb..28c93cdadc 100644
--- a/deepmd/dpmodel/fitting/polarizability_fitting.py
+++ b/deepmd/dpmodel/fitting/polarizability_fitting.py
@@ -237,14 +237,21 @@ def change_type_map(
         remap_index, has_new_type = get_index_between_two_maps(self.type_map, type_map)
         super().change_type_map(type_map=type_map)
         if has_new_type:
+            xp = array_api_compat.array_namespace(self.scale)
             extend_shape = [len(type_map), *list(self.scale.shape[1:])]
-            extend_scale = np.ones(extend_shape, dtype=self.scale.dtype)
-            self.scale = np.concatenate([self.scale, extend_scale], axis=0)
+            extend_scale = xp.ones(
+                extend_shape,
+                dtype=self.scale.dtype,
+                device=array_api_compat.device(self.scale),
+            )
+            self.scale = xp.concat([self.scale, extend_scale], axis=0)
             extend_shape = [len(type_map), *list(self.constant_matrix.shape[1:])]
-            extend_constant_matrix = np.zeros(
-                extend_shape, dtype=self.constant_matrix.dtype
+            extend_constant_matrix = xp.zeros(
+                extend_shape,
+                dtype=self.constant_matrix.dtype,
+                device=array_api_compat.device(self.constant_matrix),
             )
-            self.constant_matrix = np.concatenate(
+            self.constant_matrix = xp.concat(
                 [self.constant_matrix, extend_constant_matrix], axis=0
             )
         self.scale = self.scale[remap_index]
diff --git a/deepmd/dpmodel/model/make_model.py b/deepmd/dpmodel/model/make_model.py
index ae8d0de1cb..817d8e30fc 100644
--- a/deepmd/dpmodel/model/make_model.py
+++ b/deepmd/dpmodel/model/make_model.py
@@ -597,12 +597,17 @@ def do_grad_c(
             return self.atomic_model.do_grad_c(var_name)
 
         def change_type_map(
-            self, type_map: list[str], model_with_new_type_stat: Any = None
+            self, type_map: list[str], model_with_new_type_stat: Any | None = None
         ) -> None:
             """Change the type related params to new ones, according to `type_map` and the original one in the model.
             If there are new types in `type_map`, statistics will be updated accordingly to `model_with_new_type_stat` for these new types.
             """
-            self.atomic_model.change_type_map(type_map=type_map)
+            self.atomic_model.change_type_map(
+                type_map=type_map,
+                model_with_new_type_stat=model_with_new_type_stat.atomic_model
+                if model_with_new_type_stat is not None
+                else None,
+            )
 
         def serialize(self) -> dict:
             return self.atomic_model.serialize()
diff --git a/source/tests/consistent/model/test_ener.py b/source/tests/consistent/model/test_ener.py
index a791c8af41..12308cb0d1 100644
--- a/source/tests/consistent/model/test_ener.py
+++ b/source/tests/consistent/model/test_ener.py
@@ -1002,6 +1002,122 @@ def test_change_type_map(self) -> None:
             atol=1e-10,
         )
 
+    def test_change_type_map_extend_stat(self) -> None:
+        """change_type_map with model_with_new_type_stat should propagate stats consistently across dp, pt, and pt_expt.
+
+        Verifies that the model-level change_type_map correctly unwraps
+        model_with_new_type_stat.atomic_model before forwarding to the
+        atomic model.
+        """
+        from deepmd.utils.argcheck import model_args as model_args_fn
+
+        small_tm = ["O", "H"]
+        large_tm = ["O", "H", "Li"]
+
+        small_data = model_args_fn().normalize_value(
+            {
+                "type_map": small_tm,
+                "descriptor": {
+                    "type": "se_atten",
+                    "sel": 20,
+                    "rcut_smth": 0.50,
+                    "rcut": 6.00,
+                    "neuron": [3, 6],
+                    "resnet_dt": False,
+                    "axis_neuron": 2,
+                    "precision": "float64",
+                    "seed": 1,
+                    "attn": 6,
+                    "attn_layer": 0,
+                },
+                "fitting_net": {
+                    "neuron": [5, 5],
+                    "resnet_dt": True,
+                    "precision": "float64",
+                    "seed": 1,
+                },
+            },
+            trim_pattern="_*",
+        )
+        large_data = model_args_fn().normalize_value(
+            {
+                "type_map": large_tm,
+                "descriptor": {
+                    "type": "se_atten",
+                    "sel": 20,
+                    "rcut_smth": 0.50,
+                    "rcut": 6.00,
+                    "neuron": [3, 6],
+                    "resnet_dt": False,
+                    "axis_neuron": 2,
+                    "precision": "float64",
+                    "seed": 2,
+                    "attn": 6,
+                    "attn_layer": 0,
+                },
+                "fitting_net": {
+                    "neuron": [5, 5],
+                    "resnet_dt": True,
+                    "precision": "float64",
+                    "seed": 2,
+                },
+            },
+            trim_pattern="_*",
+        )
+
+        dp_small = get_model_dp(small_data)
+        dp_large = get_model_dp(large_data)
+
+        # Set distinguishable random stats on the large model's descriptor
+        rng = np.random.default_rng(42)
+        desc_large = dp_large.get_descriptor()
+        mean_large, std_large = desc_large.get_stat_mean_and_stddev()
+        mean_rand = rng.random(size=to_numpy_array(mean_large).shape)
+        std_rand = rng.random(size=to_numpy_array(std_large).shape)
+        desc_large.set_stat_mean_and_stddev(mean_rand, std_rand)
+
+        # Build pt and pt_expt models from dp serialization
+        pt_small = EnergyModelPT.deserialize(dp_small.serialize())
+        pt_large = EnergyModelPT.deserialize(dp_large.serialize())
+        pt_expt_small = EnergyModelPTExpt.deserialize(dp_small.serialize())
+        pt_expt_large = EnergyModelPTExpt.deserialize(dp_large.serialize())
+
+        # Extend type map with model_with_new_type_stat at the model level
+        dp_small.change_type_map(large_tm, model_with_new_type_stat=dp_large)
+        pt_small.change_type_map(large_tm, model_with_new_type_stat=pt_large)
+        pt_expt_small.change_type_map(large_tm, model_with_new_type_stat=pt_expt_large)
+
+        # Descriptor stats should be consistent across backends
+        dp_mean, dp_std = dp_small.get_descriptor().get_stat_mean_and_stddev()
+        pt_mean, pt_std = pt_small.get_descriptor().get_stat_mean_and_stddev()
+        pt_expt_mean, pt_expt_std = (
+            pt_expt_small.get_descriptor().get_stat_mean_and_stddev()
+        )
+        np.testing.assert_allclose(
+            to_numpy_array(dp_mean),
+            torch_to_numpy(pt_mean),
+            rtol=1e-10,
+            atol=1e-10,
+        )
+        np.testing.assert_allclose(
+            to_numpy_array(dp_std),
+            torch_to_numpy(pt_std),
+            rtol=1e-10,
+            atol=1e-10,
+        )
+        np.testing.assert_allclose(
+            to_numpy_array(dp_mean),
+            to_numpy_array(pt_expt_mean),
+            rtol=1e-10,
+            atol=1e-10,
+        )
+        np.testing.assert_allclose(
+            to_numpy_array(dp_std),
+            to_numpy_array(pt_expt_std),
+            rtol=1e-10,
+            atol=1e-10,
+        )
+
     def test_update_sel(self) -> None:
         """update_sel should return the same result on dp and pt."""
         from unittest.mock import (

From 21dc4e768bce0c6104407698037491295fdc681e Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Tue, 24 Feb 2026 13:29:27 +0800
Subject: [PATCH 19/63] consolidate get_out_bias/set_out_bias into
 base_atomic_model

  Add get_out_bias() and set_out_bias() methods to dpmodel's
  base_atomic_model, and update make_model to call them instead of
  accessing the attribute directly. For PT, add get_out_bias() to
  base_atomic_model and remove the redundant implementations from
  dp_atomic_model, pairtab_atomic_model, and linear_atomic_model.
---
 deepmd/dpmodel/atomic_model/base_atomic_model.py     | 8 ++++++++
 deepmd/dpmodel/model/make_model.py                   | 4 ++--
 deepmd/pt/model/atomic_model/base_atomic_model.py    | 5 +++++
 deepmd/pt/model/atomic_model/dp_atomic_model.py      | 3 ---
 deepmd/pt/model/atomic_model/linear_atomic_model.py  | 3 ---
 deepmd/pt/model/atomic_model/pairtab_atomic_model.py | 3 ---
 6 files changed, 15 insertions(+), 11 deletions(-)

diff --git a/deepmd/dpmodel/atomic_model/base_atomic_model.py b/deepmd/dpmodel/atomic_model/base_atomic_model.py
index 748daad405..9d2a446831 100644
--- a/deepmd/dpmodel/atomic_model/base_atomic_model.py
+++ b/deepmd/dpmodel/atomic_model/base_atomic_model.py
@@ -78,6 +78,14 @@ def init_out_stat(self) -> None:
         self.out_bias = out_bias_data
         self.out_std = out_std_data
 
+    def get_out_bias(self) -> Array:
+        """Get the output bias."""
+        return self.out_bias
+
+    def set_out_bias(self, out_bias: Array) -> None:
+        """Set the output bias."""
+        self.out_bias = out_bias
+
     def __setitem__(self, key: str, value: Array) -> None:
         if key in ["out_bias"]:
             self.out_bias = value
diff --git a/deepmd/dpmodel/model/make_model.py b/deepmd/dpmodel/model/make_model.py
index debab272f3..fedb4b75a8 100644
--- a/deepmd/dpmodel/model/make_model.py
+++ b/deepmd/dpmodel/model/make_model.py
@@ -376,7 +376,7 @@ def forward_common_atomic(
 
         def get_out_bias(self) -> Array:
             """Get the output bias."""
-            return self.atomic_model.out_bias
+            return self.atomic_model.get_out_bias()
 
         def get_observed_type_list(self) -> list[str]:
             """Get observed types (elements) of the model during data statistics.
@@ -399,7 +399,7 @@ def get_observed_type_list(self) -> list[str]:
 
         def set_out_bias(self, out_bias: Array) -> None:
             """Set the output bias."""
-            self.atomic_model.out_bias = out_bias
+            self.atomic_model.set_out_bias(out_bias)
 
         def change_out_bias(
             self,
diff --git a/deepmd/pt/model/atomic_model/base_atomic_model.py b/deepmd/pt/model/atomic_model/base_atomic_model.py
index 0ccf539757..ee68718230 100644
--- a/deepmd/pt/model/atomic_model/base_atomic_model.py
+++ b/deepmd/pt/model/atomic_model/base_atomic_model.py
@@ -104,7 +104,12 @@ def init_out_stat(self) -> None:
         self.register_buffer("out_bias", out_bias_data)
         self.register_buffer("out_std", out_std_data)
 
+    def get_out_bias(self) -> torch.Tensor:
+        """Get the output bias."""
+        return self.out_bias
+
     def set_out_bias(self, out_bias: torch.Tensor) -> None:
+        """Set the output bias."""
         self.out_bias = out_bias
 
     def __setitem__(self, key: str, value: torch.Tensor) -> None:
diff --git a/deepmd/pt/model/atomic_model/dp_atomic_model.py b/deepmd/pt/model/atomic_model/dp_atomic_model.py
index a71427d5e9..78fa0c3cf7 100644
--- a/deepmd/pt/model/atomic_model/dp_atomic_model.py
+++ b/deepmd/pt/model/atomic_model/dp_atomic_model.py
@@ -299,9 +299,6 @@ def forward_atomic(
             )
         return fit_ret
 
-    def get_out_bias(self) -> torch.Tensor:
-        return self.out_bias
-
     def compute_or_load_stat(
         self,
         sampled_func: Callable[[], list[dict]],
diff --git a/deepmd/pt/model/atomic_model/linear_atomic_model.py b/deepmd/pt/model/atomic_model/linear_atomic_model.py
index 96b3baf6ec..de3acfcaca 100644
--- a/deepmd/pt/model/atomic_model/linear_atomic_model.py
+++ b/deepmd/pt/model/atomic_model/linear_atomic_model.py
@@ -126,9 +126,6 @@ def need_sorted_nlist_for_lower(self) -> bool:
         """Returns whether the atomic model needs sorted nlist when using `forward_lower`."""
         return True
 
-    def get_out_bias(self) -> torch.Tensor:
-        return self.out_bias
-
     def get_rcut(self) -> float:
         """Get the cut-off radius."""
         return max(self.get_model_rcuts())
diff --git a/deepmd/pt/model/atomic_model/pairtab_atomic_model.py b/deepmd/pt/model/atomic_model/pairtab_atomic_model.py
index a77e5391f8..4424509776 100644
--- a/deepmd/pt/model/atomic_model/pairtab_atomic_model.py
+++ b/deepmd/pt/model/atomic_model/pairtab_atomic_model.py
@@ -131,9 +131,6 @@ def fitting_output_def(self) -> FittingOutputDef:
             ]
         )
 
-    def get_out_bias(self) -> torch.Tensor:
-        return self.out_bias
-
     def get_rcut(self) -> float:
         return self.rcut
 

From 61722b9c5d12dcffcdaf25c697180db918967282 Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Tue, 24 Feb 2026 14:40:56 +0800
Subject: [PATCH 20/63] change fitting -> fitting_net

---
 .../dpmodel/atomic_model/dp_atomic_model.py   | 30 ++++++++++---------
 .../atomic_model/polar_atomic_model.py        |  4 +--
 deepmd/dpmodel/model/dp_model.py              |  2 +-
 3 files changed, 19 insertions(+), 17 deletions(-)

diff --git a/deepmd/dpmodel/atomic_model/dp_atomic_model.py b/deepmd/dpmodel/atomic_model/dp_atomic_model.py
index f110e58d2c..804ec9c4bb 100644
--- a/deepmd/dpmodel/atomic_model/dp_atomic_model.py
+++ b/deepmd/dpmodel/atomic_model/dp_atomic_model.py
@@ -56,15 +56,15 @@ def __init__(
         super().__init__(type_map, **kwargs)
         self.type_map = type_map
         self.descriptor = descriptor
-        self.fitting = fitting
-        if hasattr(self.fitting, "reinit_exclude"):
-            self.fitting.reinit_exclude(self.atom_exclude_types)
+        self.fitting_net = fitting
+        if hasattr(self.fitting_net, "reinit_exclude"):
+            self.fitting_net.reinit_exclude(self.atom_exclude_types)
         self.type_map = type_map
         super().init_out_stat()
 
     def fitting_output_def(self) -> FittingOutputDef:
         """Get the output def of the fitting net."""
-        return self.fitting.output_def()
+        return self.fitting_net.output_def()
 
     def get_rcut(self) -> float:
         """Get the cut-off radius."""
@@ -79,7 +79,7 @@ def set_case_embd(self, case_idx: int) -> None:
         Set the case embedding of this atomic model by the given case_idx,
         typically concatenated with the output of the descriptor and fed into the fitting net.
         """
-        self.fitting.set_case_embd(case_idx)
+        self.fitting_net.set_case_embd(case_idx)
 
     def mixed_types(self) -> bool:
         """If true, the model
@@ -172,7 +172,7 @@ def forward_atomic(
             nlist,
             mapping=mapping,
         )
-        ret = self.fitting(
+        ret = self.fitting_net(
             descriptor,
             atype,
             gr=rot_mat,
@@ -208,7 +208,9 @@ def compute_or_load_stat(
 
         wrapped_sampler = self._make_wrapped_sampler(sampled_func)
         self.descriptor.compute_input_stats(wrapped_sampler, stat_file_path)
-        self.fitting.compute_input_stats(wrapped_sampler, stat_file_path=stat_file_path)
+        self.fitting_net.compute_input_stats(
+            wrapped_sampler, stat_file_path=stat_file_path
+        )
         if compute_or_load_out_stat:
             self.compute_or_load_out_stat(wrapped_sampler, stat_file_path)
 
@@ -228,7 +230,7 @@ def change_type_map(
             if model_with_new_type_stat is not None
             else None,
         )
-        self.fitting.change_type_map(type_map=type_map)
+        self.fitting_net.change_type_map(type_map=type_map)
 
     def serialize(self) -> dict:
         dd = super().serialize()
@@ -239,7 +241,7 @@ def serialize(self) -> dict:
                 "@version": 2,
                 "type_map": self.type_map,
                 "descriptor": self.descriptor.serialize(),
-                "fitting": self.fitting.serialize(),
+                "fitting": self.fitting_net.serialize(),
             }
         )
         return dd
@@ -265,19 +267,19 @@ def deserialize(cls, data: dict[str, Any]) -> "DPAtomicModel":
 
     def get_dim_fparam(self) -> int:
         """Get the number (dimension) of frame parameters of this atomic model."""
-        return self.fitting.get_dim_fparam()
+        return self.fitting_net.get_dim_fparam()
 
     def get_dim_aparam(self) -> int:
         """Get the number (dimension) of atomic parameters of this atomic model."""
-        return self.fitting.get_dim_aparam()
+        return self.fitting_net.get_dim_aparam()
 
     def has_default_fparam(self) -> bool:
         """Check if the model has default frame parameters."""
-        return self.fitting.has_default_fparam()
+        return self.fitting_net.has_default_fparam()
 
     def get_default_fparam(self) -> list[float] | None:
         """Get the default frame parameters."""
-        return self.fitting.get_default_fparam()
+        return self.fitting_net.get_default_fparam()
 
     def get_sel_type(self) -> list[int]:
         """Get the selected atom types of this model.
@@ -286,7 +288,7 @@ def get_sel_type(self) -> list[int]:
         to the result of the model.
         If returning an empty list, all atom types are selected.
         """
-        return self.fitting.get_sel_type()
+        return self.fitting_net.get_sel_type()
 
     def is_aparam_nall(self) -> bool:
         """Check whether the shape of atomic parameters is (nframes, nall, ndim).
diff --git a/deepmd/dpmodel/atomic_model/polar_atomic_model.py b/deepmd/dpmodel/atomic_model/polar_atomic_model.py
index fd32f26e5e..8f7f1bd4b1 100644
--- a/deepmd/dpmodel/atomic_model/polar_atomic_model.py
+++ b/deepmd/dpmodel/atomic_model/polar_atomic_model.py
@@ -45,7 +45,7 @@ def apply_out_stat(
         xp = array_api_compat.array_namespace(atype)
         out_bias, out_std = self._fetch_out_stat(self.bias_keys)
 
-        if self.fitting.shift_diag:
+        if self.fitting_net.shift_diag:
             nframes, nloc = atype.shape
             dtype = out_bias[self.bias_keys[0]].dtype
             for kk in self.bias_keys:
@@ -58,7 +58,7 @@ def apply_out_stat(
 
                 # (nframes, nloc, 1)
                 modified_bias = (
-                    modified_bias[..., xp.newaxis] * (self.fitting.scale[atype])
+                    modified_bias[..., xp.newaxis] * (self.fitting_net.scale[atype])
                 )
 
                 eye = xp.eye(3, dtype=dtype, device=array_api_compat.device(atype))
diff --git a/deepmd/dpmodel/model/dp_model.py b/deepmd/dpmodel/model/dp_model.py
index 0dcf6358f9..e6e60d21a8 100644
--- a/deepmd/dpmodel/model/dp_model.py
+++ b/deepmd/dpmodel/model/dp_model.py
@@ -47,7 +47,7 @@ def update_sel(
 
     def get_fitting_net(self) -> BaseFitting:
         """Get the fitting network."""
-        return self.atomic_model.fitting
+        return self.atomic_model.fitting_net
 
     def get_descriptor(self) -> BaseDescriptor:
         """Get the descriptor."""

From c41515ae05979c8baeb04187e95fca91cf71db89 Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Tue, 24 Feb 2026 15:20:08 +0800
Subject: [PATCH 21/63] fix: dpmodel change_out_bias missing
 compute_fitting_input_stat for set-by-statistic

  The PT backend calls atomic_model.compute_fitting_input_stat(merged) in
  change_out_bias when mode is set-by-statistic, but dpmodel/pt_expt did
  not. This meant fparam/aparam statistics (avg, inv_std) were never updated
  during bias adjustment in these backends.

  Add compute_fitting_input_stat to dpmodel's DPAtomicModel and call it
  from make_model.change_out_bias. Enhance test_change_out_bias with
  fparam/aparam data, pt_expt coverage, and verification that fitting input
  stats are updated after set-by-statistic but unchanged after
  change-by-statistic.
---
 .../dpmodel/atomic_model/base_atomic_model.py |   2 +
 .../dpmodel/atomic_model/dp_atomic_model.py   |  24 +++
 deepmd/dpmodel/model/make_model.py            |   2 +
 source/tests/consistent/model/test_ener.py    | 151 ++++++++++++++++--
 4 files changed, 166 insertions(+), 13 deletions(-)

diff --git a/deepmd/dpmodel/atomic_model/base_atomic_model.py b/deepmd/dpmodel/atomic_model/base_atomic_model.py
index 748daad405..68a92aebd7 100644
--- a/deepmd/dpmodel/atomic_model/base_atomic_model.py
+++ b/deepmd/dpmodel/atomic_model/base_atomic_model.py
@@ -53,6 +53,7 @@ def __init__(
         pair_exclude_types: list[tuple[int, int]] = [],
         rcond: float | None = None,
         preset_out_bias: dict[str, Array] | None = None,
+        data_stat_protect: float = 1e-2,
     ) -> None:
         super().__init__()
         self.type_map = type_map
@@ -60,6 +61,7 @@ def __init__(
         self.reinit_pair_exclude(pair_exclude_types)
         self.rcond = rcond
         self.preset_out_bias = preset_out_bias
+        self.data_stat_protect = data_stat_protect
 
     def init_out_stat(self) -> None:
         """Initialize the output bias."""
diff --git a/deepmd/dpmodel/atomic_model/dp_atomic_model.py b/deepmd/dpmodel/atomic_model/dp_atomic_model.py
index f110e58d2c..e322fcef2c 100644
--- a/deepmd/dpmodel/atomic_model/dp_atomic_model.py
+++ b/deepmd/dpmodel/atomic_model/dp_atomic_model.py
@@ -230,6 +230,30 @@ def change_type_map(
         )
         self.fitting.change_type_map(type_map=type_map)
 
+    def compute_fitting_input_stat(
+        self,
+        sample_merged: Callable[[], list[dict]] | list[dict],
+        stat_file_path: DPPath | None = None,
+    ) -> None:
+        """Compute the input statistics (e.g. mean and stddev) for the fittings from packed data.
+
+        Parameters
+        ----------
+        sample_merged : Union[Callable[[], list[dict]], list[dict]]
+            - list[dict]: A list of data samples from various data systems.
+                Each element, ``merged[i]``, is a data dictionary containing
+                ``keys``: ``np.ndarray`` originating from the ``i``-th data system.
+            - Callable[[], list[dict]]: A lazy function that returns data samples
+                in the above format only when needed.
+        stat_file_path : Optional[DPPath]
+            The path to the stat file.
+        """
+        self.fitting.compute_input_stats(
+            sample_merged,
+            protection=self.data_stat_protect,
+            stat_file_path=stat_file_path,
+        )
+
     def serialize(self) -> dict:
         dd = super().serialize()
         dd.update(
diff --git a/deepmd/dpmodel/model/make_model.py b/deepmd/dpmodel/model/make_model.py
index 817d8e30fc..01576d64c1 100644
--- a/deepmd/dpmodel/model/make_model.py
+++ b/deepmd/dpmodel/model/make_model.py
@@ -398,6 +398,8 @@ def change_out_bias(
                 'change-by-statistic' or 'set-by-statistic'.
             """
             self.atomic_model.change_out_bias(merged, bias_adjust_mode=bias_adjust_mode)
+            if bias_adjust_mode == "set-by-statistic":
+                self.atomic_model.compute_fitting_input_stat(merged)
 
         def _input_type_cast(
             self,
diff --git a/source/tests/consistent/model/test_ener.py b/source/tests/consistent/model/test_ener.py
index 12308cb0d1..6ce4f5d0e9 100644
--- a/source/tests/consistent/model/test_ener.py
+++ b/source/tests/consistent/model/test_ener.py
@@ -580,6 +580,9 @@ def setUp(self) -> None:
                     "resnet_dt": True,
                     "precision": "float64",
                     "seed": 1,
+                    "numb_fparam": 2,
+                    "numb_aparam": 3,
+                    "default_fparam": [0.5, -0.3],
                 },
             },
             trim_pattern="_*",
@@ -643,6 +646,12 @@ def setUp(self) -> None:
         self.mapping = mapping
         self.nlist = nlist
 
+        # aparam for forward evaluation (1 frame, 6 atoms, 3 aparam)
+        rng = np.random.default_rng(42)
+        self.eval_aparam = rng.normal(size=(1, nloc, 3)).astype(
+            GLOBAL_NP_FLOAT_PRECISION
+        )
+
     def test_translated_output_def(self) -> None:
         """translated_output_def should return the same keys on dp, pt, and pt_expt."""
         dp_def = self.dp_model.translated_output_def()
@@ -779,12 +788,12 @@ def test_need_sorted_nlist_for_lower(self) -> None:
     def test_get_dim_fparam(self) -> None:
         """get_dim_fparam should return the same value on dp and pt."""
         self.assertEqual(self.dp_model.get_dim_fparam(), self.pt_model.get_dim_fparam())
-        self.assertEqual(self.dp_model.get_dim_fparam(), 0)
+        self.assertEqual(self.dp_model.get_dim_fparam(), 2)
 
     def test_get_dim_aparam(self) -> None:
         """get_dim_aparam should return the same value on dp and pt."""
         self.assertEqual(self.dp_model.get_dim_aparam(), self.pt_model.get_dim_aparam())
-        self.assertEqual(self.dp_model.get_dim_aparam(), 0)
+        self.assertEqual(self.dp_model.get_dim_aparam(), 3)
 
     def test_get_sel_type(self) -> None:
         """get_sel_type should return the same list on dp and pt."""
@@ -831,12 +840,14 @@ def test_forward_common_atomic(self) -> None:
             self.extended_atype,
             self.nlist,
             mapping=self.mapping,
+            aparam=self.eval_aparam,
         )
         pt_ret = self.pt_model.atomic_model.forward_common_atomic(
             numpy_to_torch(self.extended_coord),
             numpy_to_torch(self.extended_atype),
             numpy_to_torch(self.nlist),
             mapping=numpy_to_torch(self.mapping),
+            aparam=numpy_to_torch(self.eval_aparam),
         )
         # Compare the common keys
         common_keys = set(dp_ret.keys()) & set(pt_ret.keys())
@@ -857,26 +868,53 @@ def test_has_default_fparam(self) -> None:
             self.dp_model.has_default_fparam(),
             self.pt_model.has_default_fparam(),
         )
-        self.assertFalse(self.dp_model.has_default_fparam())
+        self.assertTrue(self.dp_model.has_default_fparam())
 
     def test_get_default_fparam(self) -> None:
-        """get_default_fparam should return None on both dp and pt (no fparam configured)."""
+        """get_default_fparam should return consistent values on dp and pt."""
         dp_val = self.dp_model.get_default_fparam()
         pt_val = self.pt_model.get_default_fparam()
-        self.assertIsNone(dp_val)
-        self.assertIsNone(pt_val)
-        # Note: both return None because no default_fparam is configured.
-        # A non-trivial return requires configuring default_fparam in the fitting net.
+        np.testing.assert_allclose(dp_val, pt_val, rtol=1e-10, atol=1e-10)
+        np.testing.assert_allclose(dp_val, [0.5, -0.3], rtol=1e-10, atol=1e-10)
+
+    def _get_fitting_stats(self, model, backend="dp"):
+        """Extract fparam/aparam stats from a model's fitting net."""
+        fitting = model.get_fitting_net()
+        if backend == "pt":
+            return {
+                "fparam_avg": torch_to_numpy(fitting.fparam_avg),
+                "fparam_inv_std": torch_to_numpy(fitting.fparam_inv_std),
+                "aparam_avg": torch_to_numpy(fitting.aparam_avg),
+                "aparam_inv_std": torch_to_numpy(fitting.aparam_inv_std),
+            }
+        else:
+            return {
+                "fparam_avg": to_numpy_array(fitting.fparam_avg),
+                "fparam_inv_std": to_numpy_array(fitting.fparam_inv_std),
+                "aparam_avg": to_numpy_array(fitting.aparam_avg),
+                "aparam_inv_std": to_numpy_array(fitting.aparam_inv_std),
+            }
 
     def test_change_out_bias(self) -> None:
-        """change_out_bias should produce consistent bias on dp and pt."""
+        """change_out_bias should produce consistent bias and fitting stats on dp, pt, and pt_expt."""
         nframes = 2
+        nloc = 6
+        numb_fparam = 2
+        numb_aparam = 3
+        rng = np.random.default_rng(123)
+
         # Use realistic coords (from setUp, tiled for 2 frames)
         coords_2f = np.tile(self.coords, (nframes, 1, 1))  # (2, 6, 3)
         atype_2f = np.array([[0, 0, 1, 1, 1, 1], [0, 1, 1, 0, 1, 1]], dtype=np.int32)
         box_2f = np.tile(self.box.reshape(1, 3, 3), (nframes, 1, 1))
         natoms_data = np.array([[6, 6, 2, 4], [6, 6, 2, 4]], dtype=np.int32)
         energy_data = np.array([10.0, 20.0]).reshape(nframes, 1)
+        fparam_data = rng.normal(size=(nframes, numb_fparam)).astype(
+            GLOBAL_NP_FLOAT_PRECISION
+        )
+        aparam_data = rng.normal(size=(nframes, nloc, numb_aparam)).astype(
+            GLOBAL_NP_FLOAT_PRECISION
+        )
 
         # dpmodel stat data (numpy)
         dp_merged = [
@@ -888,6 +926,8 @@ def test_change_out_bias(self) -> None:
                 "natoms": natoms_data,
                 "energy": energy_data,
                 "find_energy": np.float32(1.0),
+                "fparam": fparam_data,
+                "aparam": aparam_data,
             }
         ]
         # pt stat data (torch tensors)
@@ -900,37 +940,122 @@ def test_change_out_bias(self) -> None:
                 "natoms": numpy_to_torch(natoms_data),
                 "energy": numpy_to_torch(energy_data),
                 "find_energy": np.float32(1.0),
+                "fparam": numpy_to_torch(fparam_data),
+                "aparam": numpy_to_torch(aparam_data),
             }
         ]
+        # pt_expt stat data (numpy, same as dp)
+        pe_merged = dp_merged
+
+        # Save initial fitting stats (all zeros / ones)
+        dp_stats_init = self._get_fitting_stats(self.dp_model, "dp")
 
         # Save initial (zero) bias
         dp_bias_init = to_numpy_array(self.dp_model.get_out_bias()).copy()
 
-        # Test "set-by-statistic" mode
+        # --- Test "set-by-statistic" mode ---
         self.dp_model.change_out_bias(dp_merged, bias_adjust_mode="set-by-statistic")
         self.pt_model.change_out_bias(pt_merged, bias_adjust_mode="set-by-statistic")
+        self.pt_expt_model.change_out_bias(
+            pe_merged, bias_adjust_mode="set-by-statistic"
+        )
+
+        # Verify out bias consistency
         dp_bias = to_numpy_array(self.dp_model.get_out_bias())
         pt_bias = torch_to_numpy(self.pt_model.get_out_bias())
+        pe_bias = to_numpy_array(self.pt_expt_model.get_out_bias())
         np.testing.assert_allclose(dp_bias, pt_bias, rtol=1e-10, atol=1e-10)
-        # Verify bias actually changed from initial zeros
+        np.testing.assert_allclose(dp_bias, pe_bias, rtol=1e-10, atol=1e-10)
         self.assertFalse(
             np.allclose(dp_bias, dp_bias_init),
             "set-by-statistic did not change the bias from initial values",
         )
 
-        # Test "change-by-statistic" mode (adjusts bias based on model predictions)
+        # Verify fitting input stats were updated (set-by-statistic triggers compute_fitting_input_stat)
+        dp_stats_set = self._get_fitting_stats(self.dp_model, "dp")
+        pt_stats_set = self._get_fitting_stats(self.pt_model, "pt")
+        pe_stats_set = self._get_fitting_stats(self.pt_expt_model, "dp")
+        for stat_key in (
+            "fparam_avg",
+            "fparam_inv_std",
+            "aparam_avg",
+            "aparam_inv_std",
+        ):
+            np.testing.assert_allclose(
+                dp_stats_set[stat_key],
+                pt_stats_set[stat_key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"dp vs pt {stat_key} mismatch after set-by-statistic",
+            )
+            np.testing.assert_allclose(
+                dp_stats_set[stat_key],
+                pe_stats_set[stat_key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"dp vs pt_expt {stat_key} mismatch after set-by-statistic",
+            )
+        # Verify fparam/aparam stats actually changed from initial values
+        self.assertFalse(
+            np.allclose(dp_stats_set["fparam_avg"], dp_stats_init["fparam_avg"]),
+            "set-by-statistic did not update fparam_avg",
+        )
+        self.assertFalse(
+            np.allclose(dp_stats_set["aparam_avg"], dp_stats_init["aparam_avg"]),
+            "set-by-statistic did not update aparam_avg",
+        )
+
+        # --- Test "change-by-statistic" mode ---
         dp_bias_before = dp_bias.copy()
         self.dp_model.change_out_bias(dp_merged, bias_adjust_mode="change-by-statistic")
         self.pt_model.change_out_bias(pt_merged, bias_adjust_mode="change-by-statistic")
+        self.pt_expt_model.change_out_bias(
+            pe_merged, bias_adjust_mode="change-by-statistic"
+        )
+
+        # Verify out bias consistency
         dp_bias2 = to_numpy_array(self.dp_model.get_out_bias())
         pt_bias2 = torch_to_numpy(self.pt_model.get_out_bias())
+        pe_bias2 = to_numpy_array(self.pt_expt_model.get_out_bias())
         np.testing.assert_allclose(dp_bias2, pt_bias2, rtol=1e-10, atol=1e-10)
-        # Verify change-by-statistic further modified the bias
+        np.testing.assert_allclose(dp_bias2, pe_bias2, rtol=1e-10, atol=1e-10)
         self.assertFalse(
             np.allclose(dp_bias2, dp_bias_before),
             "change-by-statistic did not further change the bias",
         )
 
+        # Verify fitting input stats did NOT change (change-by-statistic should not recompute them)
+        dp_stats_chg = self._get_fitting_stats(self.dp_model, "dp")
+        pt_stats_chg = self._get_fitting_stats(self.pt_model, "pt")
+        pe_stats_chg = self._get_fitting_stats(self.pt_expt_model, "dp")
+        for stat_key in (
+            "fparam_avg",
+            "fparam_inv_std",
+            "aparam_avg",
+            "aparam_inv_std",
+        ):
+            np.testing.assert_allclose(
+                dp_stats_chg[stat_key],
+                dp_stats_set[stat_key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"dp {stat_key} changed after change-by-statistic (should not)",
+            )
+            np.testing.assert_allclose(
+                pt_stats_chg[stat_key],
+                pt_stats_set[stat_key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"pt {stat_key} changed after change-by-statistic (should not)",
+            )
+            np.testing.assert_allclose(
+                pe_stats_chg[stat_key],
+                pe_stats_set[stat_key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"pt_expt {stat_key} changed after change-by-statistic (should not)",
+            )
+
     def test_change_type_map(self) -> None:
         """change_type_map should produce consistent results on dp and pt.
 

From 3827a9cb58a452cf102a590ef660b56c1f12a557 Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Tue, 24 Feb 2026 15:43:48 +0800
Subject: [PATCH 22/63] fix bug

---
 deepmd/dpmodel/atomic_model/dp_atomic_model.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/deepmd/dpmodel/atomic_model/dp_atomic_model.py b/deepmd/dpmodel/atomic_model/dp_atomic_model.py
index b185dd8c59..a02536b18b 100644
--- a/deepmd/dpmodel/atomic_model/dp_atomic_model.py
+++ b/deepmd/dpmodel/atomic_model/dp_atomic_model.py
@@ -250,7 +250,7 @@ def compute_fitting_input_stat(
         stat_file_path : Optional[DPPath]
             The path to the stat file.
         """
-        self.fitting.compute_input_stats(
+        self.fitting_net.compute_input_stats(
             sample_merged,
             protection=self.data_stat_protect,
             stat_file_path=stat_file_path,

From 9e926bf2f971cc976d7dba552cb21961136730cc Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Tue, 24 Feb 2026 16:49:03 +0800
Subject: [PATCH 23/63] fix bug

---
 source/tests/common/dpmodel/test_dp_atomic_model.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/source/tests/common/dpmodel/test_dp_atomic_model.py b/source/tests/common/dpmodel/test_dp_atomic_model.py
index 8ebd214865..ae5a9c610d 100644
--- a/source/tests/common/dpmodel/test_dp_atomic_model.py
+++ b/source/tests/common/dpmodel/test_dp_atomic_model.py
@@ -109,7 +109,7 @@ def test_excl_consistency(self) -> None:
             md0.reinit_pair_exclude(pair_excl)
             # hacking!
             md1.descriptor.reinit_exclude(pair_excl)
-            md1.fitting.reinit_exclude(atom_excl)
+            md1.fitting_net.reinit_exclude(atom_excl)
 
             # check energy consistency
             args = [self.coord_ext, self.atype_ext, self.nlist]

From f1dbd4f8d6a62700dba57990b5e4c47b38c81806 Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Tue, 24 Feb 2026 17:01:41 +0800
Subject: [PATCH 24/63] add missing get_observed_type_list to paddel

---
 deepmd/pd/model/model/make_model.py | 18 ++++++++++++++++++
 1 file changed, 18 insertions(+)

diff --git a/deepmd/pd/model/model/make_model.py b/deepmd/pd/model/model/make_model.py
index 321c939061..1f46cb98c7 100644
--- a/deepmd/pd/model/model/make_model.py
+++ b/deepmd/pd/model/model/make_model.py
@@ -202,6 +202,24 @@ def forward_common(
         def get_out_bias(self) -> paddle.Tensor:
             return self.atomic_model.get_out_bias()
 
+        def get_observed_type_list(self) -> list[str]:
+            """Get observed types (elements) of the model during data statistics.
+
+            Returns
+            -------
+            list[str]
+                A list of the observed type names in this model.
+            """
+            type_map = self.get_type_map()
+            out_bias = self.get_out_bias()[0]
+            assert out_bias is not None, "No out_bias found in the model."
+            assert out_bias.ndim == 2, "The supported out_bias should be a 2D array."
+            assert out_bias.shape[0] == len(type_map), (
+                "The out_bias shape does not match the type_map length."
+            )
+            bias_mask = paddle.any(paddle.abs(out_bias) > 1e-6, axis=-1)
+            return [type_map[i] for i in range(len(type_map)) if bias_mask[i]]
+
         def set_out_bias(self, out_bias: paddle.Tensor) -> None:
             self.atomic_model.set_out_bias(out_bias)
 

From df132d4856a18af4b0c7c82b0c417fc9db878dae Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Tue, 24 Feb 2026 17:52:01 +0800
Subject: [PATCH 25/63] add tests for get_model_def_script get_min_nbor_dist
 and set_case_embd

---
 source/tests/consistent/model/test_ener.py | 121 +++++++++++++++++++++
 1 file changed, 121 insertions(+)

diff --git a/source/tests/consistent/model/test_ener.py b/source/tests/consistent/model/test_ener.py
index 3049574e40..88e34633e2 100644
--- a/source/tests/consistent/model/test_ener.py
+++ b/source/tests/consistent/model/test_ener.py
@@ -806,6 +806,127 @@ def test_is_aparam_nall(self) -> None:
         self.assertEqual(self.dp_model.is_aparam_nall(), self.pt_model.is_aparam_nall())
         self.assertFalse(self.dp_model.is_aparam_nall())
 
+    def test_get_model_def_script(self) -> None:
+        """get_model_def_script should return the same value on dp, pt, and pt_expt."""
+        dp_val = self.dp_model.get_model_def_script()
+        pt_val = self.pt_model.get_model_def_script()
+        pe_val = self.pt_expt_model.get_model_def_script()
+        self.assertEqual(dp_val, pt_val)
+        self.assertEqual(dp_val, pe_val)
+
+    def test_get_min_nbor_dist(self) -> None:
+        """get_min_nbor_dist should return the same value on dp, pt, and pt_expt."""
+        dp_val = self.dp_model.get_min_nbor_dist()
+        pt_val = self.pt_model.get_min_nbor_dist()
+        pe_val = self.pt_expt_model.get_min_nbor_dist()
+        self.assertEqual(dp_val, pt_val)
+        self.assertEqual(dp_val, pe_val)
+
+    def test_set_case_embd(self) -> None:
+        """set_case_embd should produce consistent results across backends.
+
+        Also verifies that different case indices produce different outputs,
+        confirming the embedding is actually used.
+        """
+        from deepmd.utils.argcheck import (
+            model_args,
+        )
+
+        # Build a model with dim_case_embd > 0
+        data = model_args().normalize_value(
+            {
+                "type_map": ["O", "H"],
+                "descriptor": {
+                    "type": "se_e2_a",
+                    "sel": [20, 20],
+                    "rcut_smth": 0.50,
+                    "rcut": 6.00,
+                    "neuron": [3, 6],
+                    "resnet_dt": False,
+                    "axis_neuron": 2,
+                    "precision": "float64",
+                    "type_one_side": True,
+                    "seed": 1,
+                },
+                "fitting_net": {
+                    "neuron": [5, 5],
+                    "resnet_dt": True,
+                    "precision": "float64",
+                    "seed": 1,
+                    "dim_case_embd": 3,
+                },
+            },
+            trim_pattern="_*",
+        )
+        dp_model = get_model_dp(data)
+        serialized = dp_model.serialize()
+        pt_model = EnergyModelPT.deserialize(serialized)
+        pe_model = EnergyModelPTExpt.deserialize(serialized)
+
+        def _eval(case_idx):
+            dp_model.set_case_embd(case_idx)
+            pt_model.set_case_embd(case_idx)
+            pe_model.set_case_embd(case_idx)
+            dp_ret = dp_model(self.coords, self.atype, box=self.box)
+            pt_ret = {
+                k: torch_to_numpy(v)
+                for k, v in pt_model(
+                    numpy_to_torch(self.coords),
+                    numpy_to_torch(self.atype),
+                    box=numpy_to_torch(self.box),
+                ).items()
+            }
+            coord_t = pt_expt_numpy_to_torch(self.coords)
+            coord_t.requires_grad_(True)
+            pe_ret = {
+                k: v.detach().cpu().numpy()
+                for k, v in pe_model(
+                    coord_t,
+                    pt_expt_numpy_to_torch(self.atype),
+                    box=pt_expt_numpy_to_torch(self.box),
+                ).items()
+            }
+            return dp_ret, pt_ret, pe_ret
+
+        dp0, pt0, pe0 = _eval(0)
+        dp1, pt1, pe1 = _eval(1)
+
+        # Cross-backend consistency for each case index
+        for key in ("energy", "atom_energy"):
+            np.testing.assert_allclose(
+                dp0[key],
+                pt0[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"case 0: dp vs pt mismatch in {key}",
+            )
+            np.testing.assert_allclose(
+                dp0[key],
+                pe0[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"case 0: dp vs pt_expt mismatch in {key}",
+            )
+            np.testing.assert_allclose(
+                dp1[key],
+                pt1[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"case 1: dp vs pt mismatch in {key}",
+            )
+            np.testing.assert_allclose(
+                dp1[key],
+                pe1[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"case 1: dp vs pt_expt mismatch in {key}",
+            )
+        # Different case indices should produce different outputs
+        self.assertFalse(
+            np.allclose(dp0["energy"], dp1["energy"]),
+            "set_case_embd(0) and set_case_embd(1) produced the same energy",
+        )
+
     def test_atomic_output_def(self) -> None:
         """atomic_output_def should return the same keys and shapes on dp and pt."""
         dp_def = self.dp_model.atomic_output_def()

From 1da8708813567f439141ee7cf745045d641254cb Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Tue, 24 Feb 2026 20:47:42 +0800
Subject: [PATCH 26/63] fix hlo

---
 deepmd/jax/model/hlo.py | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/deepmd/jax/model/hlo.py b/deepmd/jax/model/hlo.py
index 7eb4e2c4b3..c79bc727cf 100644
--- a/deepmd/jax/model/hlo.py
+++ b/deepmd/jax/model/hlo.py
@@ -265,6 +265,10 @@ def deserialize(cls, data: dict) -> "BaseModel":
         """
         raise NotImplementedError("Not implemented")
 
+    def get_observed_type_list(self) -> list[str]:
+        """Get observed types (elements) of the model during data statistics."""
+        raise NotImplementedError("Not implemented for HLO model")
+
     def get_model_def_script(self) -> str:
         """Get the model definition script."""
         return self.model_def_script

From b4d43f09ce191f0628cbc2abb387aa3c3665a03c Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Tue, 24 Feb 2026 21:25:49 +0800
Subject: [PATCH 27/63] add dipole model api tests. mv get_observed_type_list
 to base

---
 deepmd/pt/model/model/ener_model.py          |   26 -
 deepmd/pt/model/model/make_model.py          |   26 +
 source/tests/consistent/model/test_dipole.py | 1256 +++++++++++++++++-
 3 files changed, 1280 insertions(+), 28 deletions(-)

diff --git a/deepmd/pt/model/model/ener_model.py b/deepmd/pt/model/model/ener_model.py
index 7dcd035412..1680d1e258 100644
--- a/deepmd/pt/model/model/ener_model.py
+++ b/deepmd/pt/model/model/ener_model.py
@@ -44,32 +44,6 @@ def enable_hessian(self) -> None:
         self.requires_hessian("energy")
         self._hessian_enabled = True
 
-    @torch.jit.export
-    def get_observed_type_list(self) -> list[str]:
-        """Get observed types (elements) of the model during data statistics.
-
-        Returns
-        -------
-        observed_type_list: a list of the observed types in this model.
-        """
-        type_map = self.get_type_map()
-        out_bias = self.atomic_model.get_out_bias()[0]
-
-        assert out_bias is not None, "No out_bias found in the model."
-        assert out_bias.dim() == 2, "The supported out_bias should be a 2D tensor."
-        assert out_bias.size(0) == len(type_map), (
-            "The out_bias shape does not match the type_map length."
-        )
-        bias_mask = (
-            torch.gt(torch.abs(out_bias), 1e-6).any(dim=-1).detach().cpu()
-        )  # 1e-6 for stability
-
-        observed_type_list: list[str] = []
-        for i in range(len(type_map)):
-            if bias_mask[i]:
-                observed_type_list.append(type_map[i])
-        return observed_type_list
-
     def translated_output_def(self) -> dict[str, Any]:
         out_def_data = self.model_output_def().get_data()
         output_def = {
diff --git a/deepmd/pt/model/model/make_model.py b/deepmd/pt/model/model/make_model.py
index 87a1d6b9c5..1cd7f3915f 100644
--- a/deepmd/pt/model/model/make_model.py
+++ b/deepmd/pt/model/model/make_model.py
@@ -591,6 +591,32 @@ def compute_or_load_stat(
             """Compute or load the statistics."""
             return self.atomic_model.compute_or_load_stat(sampled_func, stat_file_path)
 
+        @torch.jit.export
+        def get_observed_type_list(self) -> list[str]:
+            """Get observed types (elements) of the model during data statistics.
+
+            Returns
+            -------
+            observed_type_list: a list of the observed types in this model.
+            """
+            type_map = self.get_type_map()
+            out_bias = self.atomic_model.get_out_bias()[0]
+
+            assert out_bias is not None, "No out_bias found in the model."
+            assert out_bias.dim() == 2, "The supported out_bias should be a 2D tensor."
+            assert out_bias.size(0) == len(type_map), (
+                "The out_bias shape does not match the type_map length."
+            )
+            bias_mask = (
+                torch.gt(torch.abs(out_bias), 1e-6).any(dim=-1).detach().cpu()
+            )  # 1e-6 for stability
+
+            observed_type_list: list[str] = []
+            for i in range(len(type_map)):
+                if bias_mask[i]:
+                    observed_type_list.append(type_map[i])
+            return observed_type_list
+
         def get_sel(self) -> list[int]:
             """Returns the number of selected atoms for each type."""
             return self.atomic_model.get_sel()
diff --git a/source/tests/consistent/model/test_dipole.py b/source/tests/consistent/model/test_dipole.py
index 7dd7f644cc..03468f9d04 100644
--- a/source/tests/consistent/model/test_dipole.py
+++ b/source/tests/consistent/model/test_dipole.py
@@ -6,8 +6,18 @@
 
 import numpy as np
 
+from deepmd.dpmodel.common import (
+    to_numpy_array,
+)
 from deepmd.dpmodel.model.dipole_model import DipoleModel as DipoleModelDP
 from deepmd.dpmodel.model.model import get_model as get_model_dp
+from deepmd.dpmodel.utils.nlist import (
+    build_neighbor_list,
+    extend_coord_with_ghosts,
+)
+from deepmd.dpmodel.utils.region import (
+    normalize_coord,
+)
 from deepmd.env import (
     GLOBAL_NP_FLOAT_PRECISION,
 )
@@ -18,6 +28,7 @@
     INSTALLED_PT_EXPT,
     INSTALLED_TF,
     CommonTest,
+    parameterized,
 )
 from .common import (
     ModelTest,
@@ -26,6 +37,8 @@
 if INSTALLED_PT:
     from deepmd.pt.model.model import get_model as get_model_pt
     from deepmd.pt.model.model.dipole_model import DipoleModel as DipoleModelPT
+    from deepmd.pt.utils.utils import to_numpy_array as torch_to_numpy
+    from deepmd.pt.utils.utils import to_torch_tensor as numpy_to_torch
 else:
     DipoleModelPT = None
 if INSTALLED_TF:
@@ -38,6 +51,7 @@
 else:
     DipoleModelJAX = None
 if INSTALLED_PT_EXPT:
+    from deepmd.pt_expt.common import to_torch_array as pt_expt_numpy_to_torch
     from deepmd.pt_expt.model import DipoleModel as DipoleModelPTExpt
 else:
     DipoleModelPTExpt = None
@@ -240,7 +254,12 @@ def test_atom_exclude_types(self):
 
 @unittest.skipUnless(INSTALLED_PT and INSTALLED_PT_EXPT, "PyTorch is not installed")
 class TestDipoleModelAPIs(unittest.TestCase):
-    """Test translated_output_def consistency across dp, pt, and pt_expt backends."""
+    """Test consistency of model-level APIs between pt and dpmodel backends.
+
+    Both models are constructed from the same serialized weights
+    (dpmodel -> serialize -> pt deserialize) so that numerical outputs
+    can be compared directly.
+    """
 
     def setUp(self) -> None:
         data = model_args().normalize_value(
@@ -262,18 +281,80 @@ def setUp(self) -> None:
                     "type": "dipole",
                     "neuron": [4, 4, 4],
                     "resnet_dt": True,
-                    "numb_fparam": 0,
                     "precision": "float64",
                     "seed": 1,
+                    "numb_fparam": 2,
+                    "numb_aparam": 3,
+                    "default_fparam": [0.5, -0.3],
                 },
             },
             trim_pattern="_*",
         )
+        # Build dpmodel first, then deserialize into pt/pt_expt to share weights
         self.dp_model = get_model_dp(data)
         serialized = self.dp_model.serialize()
         self.pt_model = DipoleModelPT.deserialize(serialized)
         self.pt_expt_model = DipoleModelPTExpt.deserialize(serialized)
 
+        # Coords / atype / box
+        self.coords = np.array(
+            [
+                12.83,
+                2.56,
+                2.18,
+                12.09,
+                2.87,
+                2.74,
+                00.25,
+                3.32,
+                1.68,
+                3.36,
+                3.00,
+                1.81,
+                3.51,
+                2.51,
+                2.60,
+                4.27,
+                3.22,
+                1.56,
+            ],
+            dtype=GLOBAL_NP_FLOAT_PRECISION,
+        ).reshape(1, -1, 3)
+        self.atype = np.array([0, 1, 1, 0, 1, 1], dtype=np.int32).reshape(1, -1)
+        self.box = np.array(
+            [13.0, 0.0, 0.0, 0.0, 13.0, 0.0, 0.0, 0.0, 13.0],
+            dtype=GLOBAL_NP_FLOAT_PRECISION,
+        ).reshape(1, 9)
+
+        # Build extended coords + nlist for lower-level calls
+        rcut = 6.0
+        nframes, nloc = self.atype.shape[:2]
+        coord_normalized = normalize_coord(
+            self.coords.reshape(nframes, nloc, 3),
+            self.box.reshape(nframes, 3, 3),
+        )
+        extended_coord, extended_atype, mapping = extend_coord_with_ghosts(
+            coord_normalized, self.atype, self.box, rcut
+        )
+        nlist = build_neighbor_list(
+            extended_coord,
+            extended_atype,
+            nloc,
+            rcut,
+            [20, 20],
+            distinguish_types=True,
+        )
+        self.extended_coord = extended_coord.reshape(nframes, -1, 3)
+        self.extended_atype = extended_atype
+        self.mapping = mapping
+        self.nlist = nlist
+
+        # aparam for forward evaluation (1 frame, 6 atoms, 3 aparam)
+        rng = np.random.default_rng(42)
+        self.eval_aparam = rng.normal(size=(1, nloc, 3)).astype(
+            GLOBAL_NP_FLOAT_PRECISION
+        )
+
     def test_translated_output_def(self) -> None:
         """translated_output_def should return the same keys on dp, pt, and pt_expt."""
         dp_def = self.dp_model.translated_output_def()
@@ -284,3 +365,1174 @@ def test_translated_output_def(self) -> None:
         for key in dp_def:
             self.assertEqual(dp_def[key].shape, pt_def[key].shape)
             self.assertEqual(dp_def[key].shape, pt_expt_def[key].shape)
+
+    def test_get_descriptor(self) -> None:
+        """get_descriptor should return a non-None object on both backends."""
+        self.assertIsNotNone(self.dp_model.get_descriptor())
+        self.assertIsNotNone(self.pt_model.get_descriptor())
+
+    def test_get_fitting_net(self) -> None:
+        """get_fitting_net should return a non-None object on both backends."""
+        self.assertIsNotNone(self.dp_model.get_fitting_net())
+        self.assertIsNotNone(self.pt_model.get_fitting_net())
+
+    def test_get_out_bias(self) -> None:
+        """get_out_bias should return numerically equal values on dp and pt.
+
+        DipoleModel's apply_out_stat is a no-op, so bias won't affect output,
+        but the bias storage should still be consistent across backends.
+        """
+        dp_bias = to_numpy_array(self.dp_model.get_out_bias())
+        pt_bias = torch_to_numpy(self.pt_model.get_out_bias())
+        np.testing.assert_allclose(dp_bias, pt_bias, rtol=1e-10, atol=1e-10)
+        # Verify shape: (n_output_keys x ntypes x 3) for dipole
+        self.assertEqual(dp_bias.shape[1], 2)  # ntypes
+        self.assertGreater(dp_bias.shape[0], 0)  # at least one output key
+
+    def test_set_out_bias(self) -> None:
+        """set_out_bias should update the bias on both backends."""
+        dp_bias = to_numpy_array(self.dp_model.get_out_bias())
+        new_bias = dp_bias + 1.0
+        # dp
+        self.dp_model.set_out_bias(new_bias)
+        np.testing.assert_allclose(
+            to_numpy_array(self.dp_model.get_out_bias()),
+            new_bias,
+            rtol=1e-10,
+            atol=1e-10,
+        )
+        # pt
+        self.pt_model.set_out_bias(numpy_to_torch(new_bias))
+        np.testing.assert_allclose(
+            torch_to_numpy(self.pt_model.get_out_bias()),
+            new_bias,
+            rtol=1e-10,
+            atol=1e-10,
+        )
+
+    def test_model_output_def(self) -> None:
+        """model_output_def should return the same keys and shapes on dp and pt."""
+        dp_def = self.dp_model.model_output_def().get_data()
+        pt_def = self.pt_model.model_output_def().get_data()
+        self.assertEqual(set(dp_def.keys()), set(pt_def.keys()))
+        for key in dp_def:
+            self.assertEqual(dp_def[key].shape, pt_def[key].shape)
+
+    def test_model_output_type(self) -> None:
+        """model_output_type should return the same list on dp and pt."""
+        self.assertEqual(
+            self.dp_model.model_output_type(),
+            self.pt_model.model_output_type(),
+        )
+
+    def test_do_grad_r(self) -> None:
+        """do_grad_r should return the same value on dp and pt."""
+        self.assertEqual(
+            self.dp_model.do_grad_r("dipole"),
+            self.pt_model.do_grad_r("dipole"),
+        )
+        self.assertTrue(self.dp_model.do_grad_r("dipole"))
+
+    def test_do_grad_c(self) -> None:
+        """do_grad_c should return the same value on dp and pt."""
+        self.assertEqual(
+            self.dp_model.do_grad_c("dipole"),
+            self.pt_model.do_grad_c("dipole"),
+        )
+        self.assertTrue(self.dp_model.do_grad_c("dipole"))
+
+    def test_get_rcut(self) -> None:
+        """get_rcut should return the same value on dp and pt."""
+        self.assertEqual(self.dp_model.get_rcut(), self.pt_model.get_rcut())
+        self.assertAlmostEqual(self.dp_model.get_rcut(), 6.0)
+
+    def test_get_type_map(self) -> None:
+        """get_type_map should return the same list on dp and pt."""
+        self.assertEqual(self.dp_model.get_type_map(), self.pt_model.get_type_map())
+        self.assertEqual(self.dp_model.get_type_map(), ["O", "H"])
+
+    def test_get_sel(self) -> None:
+        """get_sel should return the same list on dp and pt."""
+        self.assertEqual(self.dp_model.get_sel(), self.pt_model.get_sel())
+        self.assertEqual(self.dp_model.get_sel(), [20, 20])
+
+    def test_get_nsel(self) -> None:
+        """get_nsel should return the same value on dp and pt."""
+        self.assertEqual(self.dp_model.get_nsel(), self.pt_model.get_nsel())
+        self.assertEqual(self.dp_model.get_nsel(), 40)
+
+    def test_get_nnei(self) -> None:
+        """get_nnei should return the same value on dp and pt."""
+        self.assertEqual(self.dp_model.get_nnei(), self.pt_model.get_nnei())
+        self.assertEqual(self.dp_model.get_nnei(), 40)
+
+    def test_mixed_types(self) -> None:
+        """mixed_types should return the same value on dp and pt."""
+        self.assertEqual(self.dp_model.mixed_types(), self.pt_model.mixed_types())
+        # se_e2_a is not mixed-types
+        self.assertFalse(self.dp_model.mixed_types())
+
+    def test_has_message_passing(self) -> None:
+        """has_message_passing should return the same value on dp and pt."""
+        self.assertEqual(
+            self.dp_model.has_message_passing(),
+            self.pt_model.has_message_passing(),
+        )
+        self.assertFalse(self.dp_model.has_message_passing())
+
+    def test_need_sorted_nlist_for_lower(self) -> None:
+        """need_sorted_nlist_for_lower should return the same value on dp and pt."""
+        self.assertEqual(
+            self.dp_model.need_sorted_nlist_for_lower(),
+            self.pt_model.need_sorted_nlist_for_lower(),
+        )
+        self.assertFalse(self.dp_model.need_sorted_nlist_for_lower())
+
+    def test_get_dim_fparam(self) -> None:
+        """get_dim_fparam should return the same value on dp and pt."""
+        self.assertEqual(self.dp_model.get_dim_fparam(), self.pt_model.get_dim_fparam())
+        self.assertEqual(self.dp_model.get_dim_fparam(), 2)
+
+    def test_get_dim_aparam(self) -> None:
+        """get_dim_aparam should return the same value on dp and pt."""
+        self.assertEqual(self.dp_model.get_dim_aparam(), self.pt_model.get_dim_aparam())
+        self.assertEqual(self.dp_model.get_dim_aparam(), 3)
+
+    def test_get_sel_type(self) -> None:
+        """get_sel_type should return the same list on dp and pt."""
+        self.assertEqual(self.dp_model.get_sel_type(), self.pt_model.get_sel_type())
+        self.assertEqual(self.dp_model.get_sel_type(), [0, 1])
+
+    def test_is_aparam_nall(self) -> None:
+        """is_aparam_nall should return the same value on dp and pt."""
+        self.assertEqual(self.dp_model.is_aparam_nall(), self.pt_model.is_aparam_nall())
+        self.assertFalse(self.dp_model.is_aparam_nall())
+
+    def test_atomic_output_def(self) -> None:
+        """atomic_output_def should return the same keys and shapes on dp and pt."""
+        dp_def = self.dp_model.atomic_output_def()
+        pt_def = self.pt_model.atomic_output_def()
+        self.assertEqual(set(dp_def.keys()), set(pt_def.keys()))
+        for key in dp_def.keys():
+            self.assertEqual(dp_def[key].shape, pt_def[key].shape)
+
+    def test_format_nlist(self) -> None:
+        """format_nlist should produce the same result on dp and pt."""
+        dp_nlist = self.dp_model.format_nlist(
+            self.extended_coord,
+            self.extended_atype,
+            self.nlist,
+        )
+        pt_nlist = torch_to_numpy(
+            self.pt_model.format_nlist(
+                numpy_to_torch(self.extended_coord),
+                numpy_to_torch(self.extended_atype),
+                numpy_to_torch(self.nlist),
+            )
+        )
+        np.testing.assert_equal(dp_nlist, pt_nlist)
+
+    def test_forward_common_atomic(self) -> None:
+        """forward_common_atomic should produce consistent results on dp and pt.
+
+        Compares at the atomic_model level, where both backends define this method.
+        """
+        dp_ret = self.dp_model.atomic_model.forward_common_atomic(
+            self.extended_coord,
+            self.extended_atype,
+            self.nlist,
+            mapping=self.mapping,
+            aparam=self.eval_aparam,
+        )
+        pt_ret = self.pt_model.atomic_model.forward_common_atomic(
+            numpy_to_torch(self.extended_coord),
+            numpy_to_torch(self.extended_atype),
+            numpy_to_torch(self.nlist),
+            mapping=numpy_to_torch(self.mapping),
+            aparam=numpy_to_torch(self.eval_aparam),
+        )
+        # Compare the common keys
+        common_keys = set(dp_ret.keys()) & set(pt_ret.keys())
+        self.assertTrue(len(common_keys) > 0)
+        for key in common_keys:
+            if dp_ret[key] is not None and pt_ret[key] is not None:
+                np.testing.assert_allclose(
+                    dp_ret[key],
+                    torch_to_numpy(pt_ret[key]),
+                    rtol=1e-10,
+                    atol=1e-10,
+                    err_msg=f"Mismatch in forward_common_atomic key '{key}'",
+                )
+
+    def test_has_default_fparam(self) -> None:
+        """has_default_fparam should return the same value on dp and pt."""
+        self.assertEqual(
+            self.dp_model.has_default_fparam(),
+            self.pt_model.has_default_fparam(),
+        )
+        self.assertTrue(self.dp_model.has_default_fparam())
+
+    def test_get_default_fparam(self) -> None:
+        """get_default_fparam should return consistent values on dp and pt."""
+        dp_val = self.dp_model.get_default_fparam()
+        pt_val = self.pt_model.get_default_fparam()
+        np.testing.assert_allclose(dp_val, pt_val, rtol=1e-10, atol=1e-10)
+        np.testing.assert_allclose(dp_val, [0.5, -0.3], rtol=1e-10, atol=1e-10)
+
+    def _get_fitting_stats(self, model, backend="dp"):
+        """Extract fparam/aparam stats from a model's fitting net."""
+        fitting = model.get_fitting_net()
+        if backend == "pt":
+            return {
+                "fparam_avg": torch_to_numpy(fitting.fparam_avg),
+                "fparam_inv_std": torch_to_numpy(fitting.fparam_inv_std),
+                "aparam_avg": torch_to_numpy(fitting.aparam_avg),
+                "aparam_inv_std": torch_to_numpy(fitting.aparam_inv_std),
+            }
+        else:
+            return {
+                "fparam_avg": to_numpy_array(fitting.fparam_avg),
+                "fparam_inv_std": to_numpy_array(fitting.fparam_inv_std),
+                "aparam_avg": to_numpy_array(fitting.aparam_avg),
+                "aparam_inv_std": to_numpy_array(fitting.aparam_inv_std),
+            }
+
+    def test_change_out_bias(self) -> None:
+        """change_out_bias should produce consistent bias and fitting stats on dp, pt, and pt_expt.
+
+        Note: DipoleModel's apply_out_stat is a no-op, so bias doesn't affect output,
+        but the bias storage and fitting input stats should still be consistent.
+        """
+        nframes = 2
+        nloc = 6
+        numb_fparam = 2
+        numb_aparam = 3
+        rng = np.random.default_rng(123)
+
+        # Use realistic coords (from setUp, tiled for 2 frames)
+        coords_2f = np.tile(self.coords, (nframes, 1, 1))  # (2, 6, 3)
+        atype_2f = np.array([[0, 0, 1, 1, 1, 1], [0, 1, 1, 0, 1, 1]], dtype=np.int32)
+        box_2f = np.tile(self.box.reshape(1, 3, 3), (nframes, 1, 1))
+        natoms_data = np.array([[6, 6, 2, 4], [6, 6, 2, 4]], dtype=np.int32)
+        dipole_data = rng.normal(size=(nframes, 3)).astype(GLOBAL_NP_FLOAT_PRECISION)
+        fparam_data = rng.normal(size=(nframes, numb_fparam)).astype(
+            GLOBAL_NP_FLOAT_PRECISION
+        )
+        aparam_data = rng.normal(size=(nframes, nloc, numb_aparam)).astype(
+            GLOBAL_NP_FLOAT_PRECISION
+        )
+
+        # dpmodel stat data (numpy)
+        dp_merged = [
+            {
+                "coord": coords_2f,
+                "atype": atype_2f,
+                "atype_ext": atype_2f,
+                "box": box_2f,
+                "natoms": natoms_data,
+                "dipole": dipole_data,
+                "find_dipole": np.float32(1.0),
+                "fparam": fparam_data,
+                "aparam": aparam_data,
+            }
+        ]
+        # pt stat data (torch tensors)
+        pt_merged = [
+            {
+                "coord": numpy_to_torch(coords_2f),
+                "atype": numpy_to_torch(atype_2f),
+                "atype_ext": numpy_to_torch(atype_2f),
+                "box": numpy_to_torch(box_2f),
+                "natoms": numpy_to_torch(natoms_data),
+                "dipole": numpy_to_torch(dipole_data),
+                "find_dipole": np.float32(1.0),
+                "fparam": numpy_to_torch(fparam_data),
+                "aparam": numpy_to_torch(aparam_data),
+            }
+        ]
+        # pt_expt stat data (numpy, same as dp)
+        pe_merged = dp_merged
+
+        # Save initial fitting stats (all zeros / ones)
+        dp_stats_init = self._get_fitting_stats(self.dp_model, "dp")
+
+        # Save initial (zero) bias
+        dp_bias_init = to_numpy_array(self.dp_model.get_out_bias()).copy()
+
+        # --- Test "set-by-statistic" mode ---
+        self.dp_model.change_out_bias(dp_merged, bias_adjust_mode="set-by-statistic")
+        self.pt_model.change_out_bias(pt_merged, bias_adjust_mode="set-by-statistic")
+        self.pt_expt_model.change_out_bias(
+            pe_merged, bias_adjust_mode="set-by-statistic"
+        )
+
+        # Verify out bias consistency
+        dp_bias = to_numpy_array(self.dp_model.get_out_bias())
+        pt_bias = torch_to_numpy(self.pt_model.get_out_bias())
+        pe_bias = to_numpy_array(self.pt_expt_model.get_out_bias())
+        np.testing.assert_allclose(dp_bias, pt_bias, rtol=1e-10, atol=1e-10)
+        np.testing.assert_allclose(dp_bias, pe_bias, rtol=1e-10, atol=1e-10)
+
+        # Verify fitting input stats were updated (set-by-statistic triggers compute_fitting_input_stat)
+        dp_stats_set = self._get_fitting_stats(self.dp_model, "dp")
+        pt_stats_set = self._get_fitting_stats(self.pt_model, "pt")
+        pe_stats_set = self._get_fitting_stats(self.pt_expt_model, "dp")
+        for stat_key in (
+            "fparam_avg",
+            "fparam_inv_std",
+            "aparam_avg",
+            "aparam_inv_std",
+        ):
+            np.testing.assert_allclose(
+                dp_stats_set[stat_key],
+                pt_stats_set[stat_key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"dp vs pt {stat_key} mismatch after set-by-statistic",
+            )
+            np.testing.assert_allclose(
+                dp_stats_set[stat_key],
+                pe_stats_set[stat_key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"dp vs pt_expt {stat_key} mismatch after set-by-statistic",
+            )
+        # Verify fparam/aparam stats actually changed from initial values
+        self.assertFalse(
+            np.allclose(dp_stats_set["fparam_avg"], dp_stats_init["fparam_avg"]),
+            "set-by-statistic did not update fparam_avg",
+        )
+        self.assertFalse(
+            np.allclose(dp_stats_set["aparam_avg"], dp_stats_init["aparam_avg"]),
+            "set-by-statistic did not update aparam_avg",
+        )
+
+        # --- Test "change-by-statistic" mode ---
+        dp_bias_before = dp_bias.copy()
+        self.dp_model.change_out_bias(dp_merged, bias_adjust_mode="change-by-statistic")
+        self.pt_model.change_out_bias(pt_merged, bias_adjust_mode="change-by-statistic")
+        self.pt_expt_model.change_out_bias(
+            pe_merged, bias_adjust_mode="change-by-statistic"
+        )
+
+        # Verify out bias consistency
+        dp_bias2 = to_numpy_array(self.dp_model.get_out_bias())
+        pt_bias2 = torch_to_numpy(self.pt_model.get_out_bias())
+        pe_bias2 = to_numpy_array(self.pt_expt_model.get_out_bias())
+        np.testing.assert_allclose(dp_bias2, pt_bias2, rtol=1e-10, atol=1e-10)
+        np.testing.assert_allclose(dp_bias2, pe_bias2, rtol=1e-10, atol=1e-10)
+
+        # Verify fitting input stats did NOT change (change-by-statistic should not recompute them)
+        dp_stats_chg = self._get_fitting_stats(self.dp_model, "dp")
+        pt_stats_chg = self._get_fitting_stats(self.pt_model, "pt")
+        pe_stats_chg = self._get_fitting_stats(self.pt_expt_model, "dp")
+        for stat_key in (
+            "fparam_avg",
+            "fparam_inv_std",
+            "aparam_avg",
+            "aparam_inv_std",
+        ):
+            np.testing.assert_allclose(
+                dp_stats_chg[stat_key],
+                dp_stats_set[stat_key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"dp {stat_key} changed after change-by-statistic (should not)",
+            )
+            np.testing.assert_allclose(
+                pt_stats_chg[stat_key],
+                pt_stats_set[stat_key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"pt {stat_key} changed after change-by-statistic (should not)",
+            )
+            np.testing.assert_allclose(
+                pe_stats_chg[stat_key],
+                pe_stats_set[stat_key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"pt_expt {stat_key} changed after change-by-statistic (should not)",
+            )
+
+    def test_change_type_map(self) -> None:
+        """change_type_map should produce consistent results on dp and pt.
+
+        Uses a DPA1 (se_atten) descriptor since se_e2_a does not support
+        change_type_map (non-mixed-types descriptors raise NotImplementedError).
+        """
+        from deepmd.utils.argcheck import model_args as model_args_fn
+
+        data = model_args_fn().normalize_value(
+            {
+                "type_map": ["O", "H"],
+                "descriptor": {
+                    "type": "se_atten",
+                    "sel": 20,
+                    "rcut_smth": 0.50,
+                    "rcut": 6.00,
+                    "neuron": [3, 6],
+                    "resnet_dt": False,
+                    "axis_neuron": 2,
+                    "precision": "float64",
+                    "seed": 1,
+                    "attn": 6,
+                    "attn_layer": 0,
+                },
+                "fitting_net": {
+                    "type": "dipole",
+                    "neuron": [4, 4, 4],
+                    "resnet_dt": True,
+                    "precision": "float64",
+                    "seed": 1,
+                },
+            },
+            trim_pattern="_*",
+        )
+        dp_model = get_model_dp(data)
+        pt_model = DipoleModelPT.deserialize(dp_model.serialize())
+
+        # Set non-zero out_bias so the swap is non-trivial
+        dp_bias_orig = to_numpy_array(dp_model.get_out_bias()).copy()
+        new_bias = dp_bias_orig.copy()
+        new_bias[:, 0, :] = 1.5  # type 0 ("O")
+        new_bias[:, 1, :] = -3.7  # type 1 ("H")
+        dp_model.set_out_bias(new_bias)
+        pt_model.set_out_bias(numpy_to_torch(new_bias))
+
+        new_type_map = ["H", "O"]
+        dp_model.change_type_map(new_type_map)
+        pt_model.change_type_map(new_type_map)
+
+        # Both should have the new type_map
+        self.assertEqual(dp_model.get_type_map(), new_type_map)
+        self.assertEqual(pt_model.get_type_map(), new_type_map)
+
+        # Out_bias should be reordered consistently between backends
+        dp_bias_new = to_numpy_array(dp_model.get_out_bias())
+        pt_bias_new = torch_to_numpy(pt_model.get_out_bias())
+        np.testing.assert_allclose(dp_bias_new, pt_bias_new, rtol=1e-10, atol=1e-10)
+
+        # Verify the reorder is correct: old type 0 -> new type 1, old type 1 -> new type 0
+        np.testing.assert_allclose(
+            dp_bias_new[:, 0, :],
+            new_bias[:, 1, :],
+            rtol=1e-10,
+            atol=1e-10,
+        )
+        np.testing.assert_allclose(
+            dp_bias_new[:, 1, :],
+            new_bias[:, 0, :],
+            rtol=1e-10,
+            atol=1e-10,
+        )
+
+    def test_change_type_map_extend_stat(self) -> None:
+        """change_type_map with model_with_new_type_stat should propagate stats consistently across dp, pt, and pt_expt.
+
+        Verifies that the model-level change_type_map correctly unwraps
+        model_with_new_type_stat.atomic_model before forwarding to the
+        atomic model.
+        """
+        from deepmd.utils.argcheck import model_args as model_args_fn
+
+        small_tm = ["O", "H"]
+        large_tm = ["O", "H", "Li"]
+
+        small_data = model_args_fn().normalize_value(
+            {
+                "type_map": small_tm,
+                "descriptor": {
+                    "type": "se_atten",
+                    "sel": 20,
+                    "rcut_smth": 0.50,
+                    "rcut": 6.00,
+                    "neuron": [3, 6],
+                    "resnet_dt": False,
+                    "axis_neuron": 2,
+                    "precision": "float64",
+                    "seed": 1,
+                    "attn": 6,
+                    "attn_layer": 0,
+                },
+                "fitting_net": {
+                    "type": "dipole",
+                    "neuron": [4, 4, 4],
+                    "resnet_dt": True,
+                    "precision": "float64",
+                    "seed": 1,
+                },
+            },
+            trim_pattern="_*",
+        )
+        large_data = model_args_fn().normalize_value(
+            {
+                "type_map": large_tm,
+                "descriptor": {
+                    "type": "se_atten",
+                    "sel": 20,
+                    "rcut_smth": 0.50,
+                    "rcut": 6.00,
+                    "neuron": [3, 6],
+                    "resnet_dt": False,
+                    "axis_neuron": 2,
+                    "precision": "float64",
+                    "seed": 2,
+                    "attn": 6,
+                    "attn_layer": 0,
+                },
+                "fitting_net": {
+                    "type": "dipole",
+                    "neuron": [4, 4, 4],
+                    "resnet_dt": True,
+                    "precision": "float64",
+                    "seed": 2,
+                },
+            },
+            trim_pattern="_*",
+        )
+
+        dp_small = get_model_dp(small_data)
+        dp_large = get_model_dp(large_data)
+
+        # Set distinguishable random stats on the large model's descriptor
+        rng = np.random.default_rng(42)
+        desc_large = dp_large.get_descriptor()
+        mean_large, std_large = desc_large.get_stat_mean_and_stddev()
+        mean_rand = rng.random(size=to_numpy_array(mean_large).shape)
+        std_rand = rng.random(size=to_numpy_array(std_large).shape)
+        desc_large.set_stat_mean_and_stddev(mean_rand, std_rand)
+
+        # Build pt and pt_expt models from dp serialization
+        pt_small = DipoleModelPT.deserialize(dp_small.serialize())
+        pt_large = DipoleModelPT.deserialize(dp_large.serialize())
+        pt_expt_small = DipoleModelPTExpt.deserialize(dp_small.serialize())
+        pt_expt_large = DipoleModelPTExpt.deserialize(dp_large.serialize())
+
+        # Extend type map with model_with_new_type_stat at the model level
+        dp_small.change_type_map(large_tm, model_with_new_type_stat=dp_large)
+        pt_small.change_type_map(large_tm, model_with_new_type_stat=pt_large)
+        pt_expt_small.change_type_map(large_tm, model_with_new_type_stat=pt_expt_large)
+
+        # Descriptor stats should be consistent across backends
+        dp_mean, dp_std = dp_small.get_descriptor().get_stat_mean_and_stddev()
+        pt_mean, pt_std = pt_small.get_descriptor().get_stat_mean_and_stddev()
+        pt_expt_mean, pt_expt_std = (
+            pt_expt_small.get_descriptor().get_stat_mean_and_stddev()
+        )
+        np.testing.assert_allclose(
+            to_numpy_array(dp_mean),
+            torch_to_numpy(pt_mean),
+            rtol=1e-10,
+            atol=1e-10,
+        )
+        np.testing.assert_allclose(
+            to_numpy_array(dp_std),
+            torch_to_numpy(pt_std),
+            rtol=1e-10,
+            atol=1e-10,
+        )
+        np.testing.assert_allclose(
+            to_numpy_array(dp_mean),
+            to_numpy_array(pt_expt_mean),
+            rtol=1e-10,
+            atol=1e-10,
+        )
+        np.testing.assert_allclose(
+            to_numpy_array(dp_std),
+            to_numpy_array(pt_expt_std),
+            rtol=1e-10,
+            atol=1e-10,
+        )
+
+    def test_update_sel(self) -> None:
+        """update_sel should return the same result on dp and pt."""
+        from unittest.mock import (
+            patch,
+        )
+
+        from deepmd.dpmodel.model.dp_model import DPModelCommon as DPModelCommonDP
+        from deepmd.pt.model.model.dp_model import DPModelCommon as DPModelCommonPT
+
+        mock_min_nbor_dist = 0.5
+        mock_sel = [10, 20]
+        local_jdata = {
+            "type_map": ["O", "H"],
+            "descriptor": {
+                "type": "se_e2_a",
+                "sel": "auto",
+                "rcut_smth": 0.50,
+                "rcut": 6.00,
+            },
+            "fitting_net": {
+                "type": "dipole",
+                "neuron": [4, 4, 4],
+            },
+        }
+        type_map = ["O", "H"]
+
+        with patch(
+            "deepmd.dpmodel.utils.update_sel.UpdateSel.get_nbor_stat",
+            return_value=(mock_min_nbor_dist, mock_sel),
+        ):
+            dp_result, dp_min_dist = DPModelCommonDP.update_sel(
+                None, type_map, local_jdata
+            )
+
+        with patch(
+            "deepmd.pt.utils.update_sel.UpdateSel.get_nbor_stat",
+            return_value=(mock_min_nbor_dist, mock_sel),
+        ):
+            pt_result, pt_min_dist = DPModelCommonPT.update_sel(
+                None, type_map, local_jdata
+            )
+
+        self.assertEqual(dp_result, pt_result)
+        self.assertEqual(dp_min_dist, pt_min_dist)
+        # Verify sel was actually updated (not still "auto")
+        self.assertIsInstance(dp_result["descriptor"]["sel"], list)
+        self.assertNotEqual(dp_result["descriptor"]["sel"], "auto")
+
+    def test_get_ntypes(self) -> None:
+        """get_ntypes should return the same value on dp and pt."""
+        self.assertEqual(self.dp_model.get_ntypes(), self.pt_model.get_ntypes())
+        self.assertEqual(self.dp_model.get_ntypes(), 2)
+
+    def test_compute_or_load_out_stat(self) -> None:
+        """compute_or_load_out_stat should produce consistent bias on dp and pt.
+
+        Tests both the compute path (from data) and the load path (from file).
+        Note: DipoleModel's apply_out_stat is a no-op, so bias doesn't affect
+        output, but the stored bias should still be consistent.
+        """
+        import tempfile
+        from pathlib import (
+            Path,
+        )
+
+        import h5py
+
+        from deepmd.utils.path import (
+            DPPath,
+        )
+
+        nframes = 2
+        coords_2f = np.tile(self.coords, (nframes, 1, 1))
+        atype_2f = np.array([[0, 0, 1, 1, 1, 1], [0, 1, 1, 0, 1, 1]], dtype=np.int32)
+        box_2f = np.tile(self.box.reshape(1, 3, 3), (nframes, 1, 1))
+        natoms_data = np.array([[6, 6, 2, 4], [6, 6, 2, 4]], dtype=np.int32)
+        dipole_data = (
+            np.random.default_rng(42)
+            .normal(size=(nframes, 3))
+            .astype(GLOBAL_NP_FLOAT_PRECISION)
+        )
+
+        dp_merged = [
+            {
+                "coord": coords_2f,
+                "atype": atype_2f,
+                "atype_ext": atype_2f,
+                "box": box_2f,
+                "natoms": natoms_data,
+                "dipole": dipole_data,
+                "find_dipole": np.float32(1.0),
+            }
+        ]
+        pt_merged = [
+            {
+                "coord": numpy_to_torch(coords_2f),
+                "atype": numpy_to_torch(atype_2f),
+                "atype_ext": numpy_to_torch(atype_2f),
+                "box": numpy_to_torch(box_2f),
+                "natoms": numpy_to_torch(natoms_data),
+                "dipole": numpy_to_torch(dipole_data),
+                "find_dipole": np.float32(1.0),
+            }
+        ]
+
+        # Verify bias is initially identical
+        dp_bias_before = to_numpy_array(self.dp_model.get_out_bias()).copy()
+        pt_bias_before = torch_to_numpy(self.pt_model.get_out_bias()).copy()
+        np.testing.assert_allclose(
+            dp_bias_before, pt_bias_before, rtol=1e-10, atol=1e-10
+        )
+
+        with tempfile.TemporaryDirectory() as tmpdir:
+            # Create separate h5 files for dp and pt
+            dp_h5 = str((Path(tmpdir) / "dp_stat.h5").resolve())
+            pt_h5 = str((Path(tmpdir) / "pt_stat.h5").resolve())
+            with h5py.File(dp_h5, "w"):
+                pass
+            with h5py.File(pt_h5, "w"):
+                pass
+            dp_stat_path = DPPath(dp_h5, "a")
+            pt_stat_path = DPPath(pt_h5, "a")
+
+            # 1. Compute stats and save to file
+            self.dp_model.atomic_model.compute_or_load_out_stat(
+                dp_merged, stat_file_path=dp_stat_path
+            )
+            self.pt_model.atomic_model.compute_or_load_out_stat(
+                pt_merged, stat_file_path=pt_stat_path
+            )
+
+            dp_bias_after = to_numpy_array(self.dp_model.get_out_bias())
+            pt_bias_after = torch_to_numpy(self.pt_model.get_out_bias())
+            np.testing.assert_allclose(
+                dp_bias_after, pt_bias_after, rtol=1e-10, atol=1e-10
+            )
+
+            # 2. Verify both backends saved the same file content
+            with h5py.File(dp_h5, "r") as dp_f, h5py.File(pt_h5, "r") as pt_f:
+                dp_keys = sorted(dp_f.keys())
+                pt_keys = sorted(pt_f.keys())
+                self.assertEqual(dp_keys, pt_keys)
+                for key in dp_keys:
+                    np.testing.assert_allclose(
+                        np.array(dp_f[key]),
+                        np.array(pt_f[key]),
+                        rtol=1e-10,
+                        atol=1e-10,
+                        err_msg=f"Stat file content mismatch for key {key}",
+                    )
+
+            # 3. Reset biases to zero, then load from file
+            zero_bias = np.zeros_like(dp_bias_after)
+            self.dp_model.set_out_bias(zero_bias)
+            self.pt_model.set_out_bias(numpy_to_torch(zero_bias))
+
+            # Use a callable that raises to ensure it loads from file, not recomputes
+            def raise_error():
+                raise RuntimeError("Should not recompute — should load from file")
+
+            self.dp_model.atomic_model.compute_or_load_out_stat(
+                raise_error, stat_file_path=dp_stat_path
+            )
+            self.pt_model.atomic_model.compute_or_load_out_stat(
+                raise_error, stat_file_path=pt_stat_path
+            )
+
+            dp_bias_loaded = to_numpy_array(self.dp_model.get_out_bias())
+            pt_bias_loaded = torch_to_numpy(self.pt_model.get_out_bias())
+
+            # Loaded biases should match between backends
+            np.testing.assert_allclose(
+                dp_bias_loaded, pt_bias_loaded, rtol=1e-10, atol=1e-10
+            )
+            # Loaded biases should match the originally computed biases
+            np.testing.assert_allclose(
+                dp_bias_loaded, dp_bias_after, rtol=1e-10, atol=1e-10
+            )
+
+    def test_get_observed_type_list(self) -> None:
+        """get_observed_type_list should be consistent across dp, pt, pt_expt.
+
+        Uses mock data containing only type 0 ("O") so that type 1 ("H") is
+        unobserved and should be absent from the returned list.
+        """
+        nframes = 2
+        natoms = 6
+        # All atoms are type 0 — type 1 is unobserved
+        atype_2f = np.zeros((nframes, natoms), dtype=np.int32)
+        coords_2f = np.tile(self.coords, (nframes, 1, 1))
+        box_2f = np.tile(self.box.reshape(1, 3, 3), (nframes, 1, 1))
+        natoms_data = np.array([[natoms, natoms, natoms, 0]] * nframes, dtype=np.int32)
+        dipole_data = (
+            np.random.default_rng(42)
+            .normal(size=(nframes, 3))
+            .astype(GLOBAL_NP_FLOAT_PRECISION)
+        )
+
+        dp_merged = [
+            {
+                "coord": coords_2f,
+                "atype": atype_2f,
+                "atype_ext": atype_2f,
+                "box": box_2f,
+                "natoms": natoms_data,
+                "dipole": dipole_data,
+                "find_dipole": np.float32(1.0),
+            }
+        ]
+        pt_merged = [
+            {
+                "coord": numpy_to_torch(coords_2f),
+                "atype": numpy_to_torch(atype_2f),
+                "atype_ext": numpy_to_torch(atype_2f),
+                "box": numpy_to_torch(box_2f),
+                "natoms": numpy_to_torch(natoms_data),
+                "dipole": numpy_to_torch(dipole_data),
+                "find_dipole": np.float32(1.0),
+            }
+        ]
+
+        self.dp_model.atomic_model.compute_or_load_out_stat(dp_merged)
+        self.pt_model.atomic_model.compute_or_load_out_stat(pt_merged)
+        self.pt_expt_model.atomic_model.compute_or_load_out_stat(dp_merged)
+
+        dp_observed = self.dp_model.get_observed_type_list()
+        pt_observed = self.pt_model.get_observed_type_list()
+        pe_observed = self.pt_expt_model.get_observed_type_list()
+
+        self.assertEqual(dp_observed, pt_observed)
+        self.assertEqual(dp_observed, pe_observed)
+        # Only type 0 ("O") should be observed
+        self.assertEqual(dp_observed, ["O"])
+
+
+def _compare_variables_recursive(
+    d1: dict, d2: dict, path: str = "", rtol: float = 1e-10, atol: float = 1e-10
+) -> None:
+    """Recursively compare ``@variables`` sections in two serialized dicts."""
+    for key in d1:
+        if key not in d2:
+            continue
+        child_path = f"{path}/{key}" if path else key
+        v1, v2 = d1[key], d2[key]
+        if key == "@variables" and isinstance(v1, dict) and isinstance(v2, dict):
+            for vk in v1:
+                if vk not in v2:
+                    continue
+                a1 = np.asarray(v1[vk]) if v1[vk] is not None else None
+                a2 = np.asarray(v2[vk]) if v2[vk] is not None else None
+                if a1 is None and a2 is None:
+                    continue
+                np.testing.assert_allclose(
+                    a1,
+                    a2,
+                    rtol=rtol,
+                    atol=atol,
+                    err_msg=f"@variables mismatch at {child_path}/{vk}",
+                )
+        elif isinstance(v1, dict) and isinstance(v2, dict):
+            _compare_variables_recursive(v1, v2, child_path, rtol, atol)
+
+
+@parameterized(
+    (([], []), ([[0, 1]], [1])),  # (pair_exclude_types, atom_exclude_types)
+    (False, True),  # fparam_in_data
+)
+@unittest.skipUnless(INSTALLED_PT and INSTALLED_PT_EXPT, "PT and PT_EXPT are required")
+class TestDipoleComputeOrLoadStat(unittest.TestCase):
+    """Test that compute_or_load_stat produces identical statistics on dp, pt, and pt_expt.
+
+    Covers descriptor stats (dstd), fitting stats (fparam, aparam), and output bias.
+    Parameterized over exclusion types and whether fparam is explicitly provided or
+    injected via default_fparam.
+    """
+
+    def setUp(self) -> None:
+        (pair_exclude_types, atom_exclude_types), self.fparam_in_data = self.param
+        data = model_args().normalize_value(
+            {
+                "type_map": ["O", "H"],
+                "pair_exclude_types": pair_exclude_types,
+                "atom_exclude_types": atom_exclude_types,
+                "descriptor": {
+                    "type": "dpa3",
+                    "repflow": {
+                        "n_dim": 20,
+                        "e_dim": 10,
+                        "a_dim": 8,
+                        "nlayers": 3,
+                        "e_rcut": 6.0,
+                        "e_rcut_smth": 5.0,
+                        "e_sel": 10,
+                        "a_rcut": 4.0,
+                        "a_rcut_smth": 3.5,
+                        "a_sel": 8,
+                        "axis_neuron": 4,
+                        "update_angle": True,
+                        "update_style": "res_residual",
+                        "update_residual": 0.1,
+                        "update_residual_init": "const",
+                    },
+                    "precision": "float64",
+                    "seed": 1,
+                },
+                "fitting_net": {
+                    "type": "dipole",
+                    "neuron": [10, 10],
+                    "precision": "float64",
+                    "seed": 1,
+                    "numb_fparam": 2,
+                    "default_fparam": [0.5, -0.3],
+                    "numb_aparam": 3,
+                },
+            },
+            trim_pattern="_*",
+        )
+
+        # Save data for reuse in load-from-file test
+        self._model_data = data
+
+        # Build dp model, then deserialize into pt and pt_expt to share weights
+        self.dp_model = get_model_dp(data)
+        serialized = self.dp_model.serialize()
+        self.pt_model = DipoleModelPT.deserialize(serialized)
+        self.pt_expt_model = DipoleModelPTExpt.deserialize(serialized)
+
+        # Test coords / atype / box for forward evaluation
+        self.coords = np.array(
+            [
+                12.83,
+                2.56,
+                2.18,
+                12.09,
+                2.87,
+                2.74,
+                0.25,
+                3.32,
+                1.68,
+                3.36,
+                3.00,
+                1.81,
+                3.51,
+                2.51,
+                2.60,
+                4.27,
+                3.22,
+                1.56,
+            ],
+            dtype=GLOBAL_NP_FLOAT_PRECISION,
+        ).reshape(1, -1, 3)
+        self.atype = np.array([0, 1, 1, 0, 1, 1], dtype=np.int32).reshape(1, -1)
+        self.box = np.array(
+            [13.0, 0.0, 0.0, 0.0, 13.0, 0.0, 0.0, 0.0, 13.0],
+            dtype=GLOBAL_NP_FLOAT_PRECISION,
+        ).reshape(1, 9)
+
+        # Mock training data for compute_or_load_stat
+        natoms = 6
+        nframes = 3
+        rng = np.random.default_rng(42)
+        coords_stat = rng.normal(size=(nframes, natoms, 3)).astype(
+            GLOBAL_NP_FLOAT_PRECISION
+        )
+        atype_stat = np.array([[0, 0, 1, 1, 1, 1]] * nframes, dtype=np.int32)
+        box_stat = np.tile(
+            np.eye(3, dtype=GLOBAL_NP_FLOAT_PRECISION).reshape(1, 3, 3) * 13.0,
+            (nframes, 1, 1),
+        )
+        natoms_stat = np.array([[natoms, natoms, 2, 4]] * nframes, dtype=np.int32)
+        dipole_stat = rng.normal(size=(nframes, 3)).astype(GLOBAL_NP_FLOAT_PRECISION)
+        aparam_stat = rng.normal(size=(nframes, natoms, 3)).astype(
+            GLOBAL_NP_FLOAT_PRECISION
+        )
+
+        # dp / pt_expt sample (numpy)
+        np_sample = {
+            "coord": coords_stat,
+            "atype": atype_stat,
+            "atype_ext": atype_stat,
+            "box": box_stat,
+            "natoms": natoms_stat,
+            "dipole": dipole_stat,
+            "find_dipole": np.float32(1.0),
+            "aparam": aparam_stat,
+        }
+        # pt sample (torch tensors)
+        pt_sample = {
+            "coord": numpy_to_torch(coords_stat),
+            "atype": numpy_to_torch(atype_stat),
+            "atype_ext": numpy_to_torch(atype_stat),
+            "box": numpy_to_torch(box_stat),
+            "natoms": numpy_to_torch(natoms_stat),
+            "dipole": numpy_to_torch(dipole_stat),
+            "find_dipole": np.float32(1.0),
+            "aparam": numpy_to_torch(aparam_stat),
+        }
+
+        if self.fparam_in_data:
+            fparam_stat = rng.normal(size=(nframes, 2)).astype(
+                GLOBAL_NP_FLOAT_PRECISION
+            )
+            np_sample["fparam"] = fparam_stat
+            pt_sample["fparam"] = numpy_to_torch(fparam_stat)
+            self.expected_fparam_avg = np.mean(fparam_stat, axis=0)
+        else:
+            # No fparam → _make_wrapped_sampler injects default_fparam
+            self.expected_fparam_avg = np.array([0.5, -0.3])
+
+        self.np_sampled = [np_sample]
+        self.pt_sampled = [pt_sample]
+
+        # aparam for forward evaluation (1 frame, 6 atoms, 3 aparam)
+        self.eval_aparam = rng.normal(size=(1, natoms, 3)).astype(
+            GLOBAL_NP_FLOAT_PRECISION
+        )
+
+    def _eval_dp(self) -> dict:
+        return self.dp_model(
+            self.coords, self.atype, box=self.box, aparam=self.eval_aparam
+        )
+
+    def _eval_pt(self) -> dict:
+        return {
+            kk: torch_to_numpy(vv)
+            for kk, vv in self.pt_model(
+                numpy_to_torch(self.coords),
+                numpy_to_torch(self.atype),
+                box=numpy_to_torch(self.box),
+                aparam=numpy_to_torch(self.eval_aparam),
+                do_atomic_virial=True,
+            ).items()
+        }
+
+    def _eval_pt_expt(self) -> dict:
+        coord_t = pt_expt_numpy_to_torch(self.coords)
+        coord_t.requires_grad_(True)
+        return {
+            k: v.detach().cpu().numpy()
+            for k, v in self.pt_expt_model(
+                coord_t,
+                pt_expt_numpy_to_torch(self.atype),
+                box=pt_expt_numpy_to_torch(self.box),
+                aparam=pt_expt_numpy_to_torch(self.eval_aparam),
+                do_atomic_virial=True,
+            ).items()
+        }
+
+    def test_compute_stat(self) -> None:
+        # 1. Pre-stat forward consistency
+        dp_ret0 = self._eval_dp()
+        pt_ret0 = self._eval_pt()
+        pe_ret0 = self._eval_pt_expt()
+        for key in ("global_dipole", "dipole"):
+            np.testing.assert_allclose(
+                dp_ret0[key],
+                pt_ret0[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"Pre-stat dp vs pt mismatch in {key}",
+            )
+            np.testing.assert_allclose(
+                dp_ret0[key],
+                pe_ret0[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"Pre-stat dp vs pt_expt mismatch in {key}",
+            )
+
+        # 2. Run compute_or_load_stat on all three backends
+        self.dp_model.compute_or_load_stat(lambda: self.np_sampled)
+        self.pt_model.compute_or_load_stat(lambda: self.pt_sampled)
+        self.pt_expt_model.compute_or_load_stat(lambda: self.np_sampled)
+
+        # 3. Serialize all three and compare @variables
+        dp_ser = self.dp_model.serialize()
+        pt_ser = self.pt_model.serialize()
+        pe_ser = self.pt_expt_model.serialize()
+        _compare_variables_recursive(dp_ser, pt_ser)
+        _compare_variables_recursive(dp_ser, pe_ser)
+
+        # 4. Post-stat forward consistency
+        # Note: DipoleModel's apply_out_stat is a no-op, so output won't change
+        # after stat computation, but we still verify cross-backend consistency.
+        dp_ret1 = self._eval_dp()
+        pt_ret1 = self._eval_pt()
+        pe_ret1 = self._eval_pt_expt()
+        for key in ("global_dipole", "dipole"):
+            np.testing.assert_allclose(
+                dp_ret1[key],
+                pt_ret1[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"Post-stat dp vs pt mismatch in {key}",
+            )
+            np.testing.assert_allclose(
+                dp_ret1[key],
+                pe_ret1[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"Post-stat dp vs pt_expt mismatch in {key}",
+            )
+
+        # 5. Non-triviality checks
+        fit_vars = dp_ser["fitting"]["@variables"]
+        # fparam stats were computed
+        fparam_avg = np.asarray(fit_vars["fparam_avg"])
+        self.assertFalse(
+            np.allclose(fparam_avg, 0.0),
+            "fparam_avg is still zero — fparam stats were not computed",
+        )
+        np.testing.assert_allclose(
+            fparam_avg,
+            self.expected_fparam_avg,
+            rtol=1e-10,
+            atol=1e-10,
+            err_msg="fparam_avg does not match expected values",
+        )
+        # aparam stats were computed
+        aparam_avg = np.asarray(fit_vars["aparam_avg"])
+        self.assertFalse(
+            np.allclose(aparam_avg, 0.0),
+            "aparam_avg is still zero — aparam stats were not computed",
+        )
+
+    def test_load_stat_from_file(self) -> None:
+        import tempfile
+        from pathlib import (
+            Path,
+        )
+
+        import h5py
+
+        from deepmd.utils.path import (
+            DPPath,
+        )
+
+        with tempfile.TemporaryDirectory() as tmpdir:
+            # Create separate stat files for each backend
+            dp_h5 = str((Path(tmpdir) / "dp_stat.h5").resolve())
+            pt_h5 = str((Path(tmpdir) / "pt_stat.h5").resolve())
+            pe_h5 = str((Path(tmpdir) / "pe_stat.h5").resolve())
+            for p in (dp_h5, pt_h5, pe_h5):
+                with h5py.File(p, "w"):
+                    pass
+
+            # 1. Compute stats and save to file
+            self.dp_model.compute_or_load_stat(
+                lambda: self.np_sampled, stat_file_path=DPPath(dp_h5, "a")
+            )
+            self.pt_model.compute_or_load_stat(
+                lambda: self.pt_sampled, stat_file_path=DPPath(pt_h5, "a")
+            )
+            self.pt_expt_model.compute_or_load_stat(
+                lambda: self.np_sampled, stat_file_path=DPPath(pe_h5, "a")
+            )
+
+            # Save the computed serializations as reference
+            dp_ser_computed = self.dp_model.serialize()
+            pt_ser_computed = self.pt_model.serialize()
+            pe_ser_computed = self.pt_expt_model.serialize()
+
+            # 2. Build fresh models from the same initial weights
+            dp_model2 = get_model_dp(self._model_data)
+            pt_model2 = DipoleModelPT.deserialize(dp_model2.serialize())
+            pe_model2 = DipoleModelPTExpt.deserialize(dp_model2.serialize())
+
+            # 3. Load stats from file (should NOT call the sampled func)
+            def raise_error():
+                raise RuntimeError("Should load from file, not recompute")
+
+            dp_model2.compute_or_load_stat(
+                raise_error, stat_file_path=DPPath(dp_h5, "a")
+            )
+            pt_model2.compute_or_load_stat(
+                raise_error, stat_file_path=DPPath(pt_h5, "a")
+            )
+            pe_model2.compute_or_load_stat(
+                raise_error, stat_file_path=DPPath(pe_h5, "a")
+            )
+
+            # 4. Loaded models should match the computed ones
+            dp_ser_loaded = dp_model2.serialize()
+            pt_ser_loaded = pt_model2.serialize()
+            pe_ser_loaded = pe_model2.serialize()
+            _compare_variables_recursive(dp_ser_computed, dp_ser_loaded)
+            _compare_variables_recursive(pt_ser_computed, pt_ser_loaded)
+            _compare_variables_recursive(pe_ser_computed, pe_ser_loaded)
+
+            # 5. Cross-backend consistency after loading
+            _compare_variables_recursive(dp_ser_loaded, pt_ser_loaded)
+            _compare_variables_recursive(dp_ser_loaded, pe_ser_loaded)

From 6ac0cef55e1f2d04014b2740e4cb6cf185212fed Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Tue, 24 Feb 2026 22:32:40 +0800
Subject: [PATCH 28/63] fix frozen model

---
 deepmd/pd/model/model/frozen.py | 4 ++++
 deepmd/pt/model/model/frozen.py | 4 ++++
 2 files changed, 8 insertions(+)

diff --git a/deepmd/pd/model/model/frozen.py b/deepmd/pd/model/model/frozen.py
index 365202dd6c..c4d5762530 100644
--- a/deepmd/pd/model/model/frozen.py
+++ b/deepmd/pd/model/model/frozen.py
@@ -178,6 +178,10 @@ def update_sel(
         """
         return local_jdata, None
 
+    def get_observed_type_list(self) -> list[str]:
+        """Get observed types (elements) of the model during data statistics."""
+        return self.model.get_observed_type_list()
+
     def model_output_type(self) -> str:
         """Get the output type for the model."""
         return self.model.model_output_type()
diff --git a/deepmd/pt/model/model/frozen.py b/deepmd/pt/model/model/frozen.py
index 402e78e95c..d44c608ade 100644
--- a/deepmd/pt/model/model/frozen.py
+++ b/deepmd/pt/model/model/frozen.py
@@ -198,6 +198,10 @@ def update_sel(
         """
         return local_jdata, None
 
+    def get_observed_type_list(self) -> list[str]:
+        """Get observed types (elements) of the model during data statistics."""
+        return self.model.get_observed_type_list()
+
     @torch.jit.export
     def model_output_type(self) -> str:
         """Get the output type for the model."""

From 4b54857c1e844731eaa7753cb6ab451249578692 Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Tue, 24 Feb 2026 22:49:33 +0800
Subject: [PATCH 29/63] add polar model api tests.

---
 source/tests/consistent/model/test_polar.py | 1256 ++++++++++++++++++-
 1 file changed, 1254 insertions(+), 2 deletions(-)

diff --git a/source/tests/consistent/model/test_polar.py b/source/tests/consistent/model/test_polar.py
index a8cd8c0ac6..7d2136bac3 100644
--- a/source/tests/consistent/model/test_polar.py
+++ b/source/tests/consistent/model/test_polar.py
@@ -6,8 +6,18 @@
 
 import numpy as np
 
+from deepmd.dpmodel.common import (
+    to_numpy_array,
+)
 from deepmd.dpmodel.model.model import get_model as get_model_dp
 from deepmd.dpmodel.model.polar_model import PolarModel as PolarModelDP
+from deepmd.dpmodel.utils.nlist import (
+    build_neighbor_list,
+    extend_coord_with_ghosts,
+)
+from deepmd.dpmodel.utils.region import (
+    normalize_coord,
+)
 from deepmd.env import (
     GLOBAL_NP_FLOAT_PRECISION,
 )
@@ -18,6 +28,7 @@
     INSTALLED_PT_EXPT,
     INSTALLED_TF,
     CommonTest,
+    parameterized,
 )
 from .common import (
     ModelTest,
@@ -26,6 +37,8 @@
 if INSTALLED_PT:
     from deepmd.pt.model.model import get_model as get_model_pt
     from deepmd.pt.model.model.polar_model import PolarModel as PolarModelPT
+    from deepmd.pt.utils.utils import to_numpy_array as torch_to_numpy
+    from deepmd.pt.utils.utils import to_torch_tensor as numpy_to_torch
 else:
     PolarModelPT = None
 if INSTALLED_TF:
@@ -38,6 +51,7 @@
 else:
     PolarModelJAX = None
 if INSTALLED_PT_EXPT:
+    from deepmd.pt_expt.common import to_torch_array as pt_expt_numpy_to_torch
     from deepmd.pt_expt.model import PolarModel as PolarModelPTExpt
 else:
     PolarModelPTExpt = None
@@ -234,7 +248,12 @@ def test_atom_exclude_types(self):
 
 @unittest.skipUnless(INSTALLED_PT and INSTALLED_PT_EXPT, "PyTorch is not installed")
 class TestPolarModelAPIs(unittest.TestCase):
-    """Test translated_output_def consistency across dp, pt, and pt_expt backends."""
+    """Test consistency of model-level APIs between pt and dpmodel backends.
+
+    Both models are constructed from the same serialized weights
+    (dpmodel -> serialize -> pt deserialize) so that numerical outputs
+    can be compared directly.
+    """
 
     def setUp(self) -> None:
         data = model_args().normalize_value(
@@ -256,18 +275,80 @@ def setUp(self) -> None:
                     "type": "polar",
                     "neuron": [4, 4, 4],
                     "resnet_dt": True,
-                    "numb_fparam": 0,
                     "precision": "float64",
                     "seed": 1,
+                    "numb_fparam": 2,
+                    "numb_aparam": 3,
+                    "default_fparam": [0.5, -0.3],
                 },
             },
             trim_pattern="_*",
         )
+        # Build dpmodel first, then deserialize into pt/pt_expt to share weights
         self.dp_model = get_model_dp(data)
         serialized = self.dp_model.serialize()
         self.pt_model = PolarModelPT.deserialize(serialized)
         self.pt_expt_model = PolarModelPTExpt.deserialize(serialized)
 
+        # Coords / atype / box
+        self.coords = np.array(
+            [
+                12.83,
+                2.56,
+                2.18,
+                12.09,
+                2.87,
+                2.74,
+                00.25,
+                3.32,
+                1.68,
+                3.36,
+                3.00,
+                1.81,
+                3.51,
+                2.51,
+                2.60,
+                4.27,
+                3.22,
+                1.56,
+            ],
+            dtype=GLOBAL_NP_FLOAT_PRECISION,
+        ).reshape(1, -1, 3)
+        self.atype = np.array([0, 1, 1, 0, 1, 1], dtype=np.int32).reshape(1, -1)
+        self.box = np.array(
+            [13.0, 0.0, 0.0, 0.0, 13.0, 0.0, 0.0, 0.0, 13.0],
+            dtype=GLOBAL_NP_FLOAT_PRECISION,
+        ).reshape(1, 9)
+
+        # Build extended coords + nlist for lower-level calls
+        rcut = 6.0
+        nframes, nloc = self.atype.shape[:2]
+        coord_normalized = normalize_coord(
+            self.coords.reshape(nframes, nloc, 3),
+            self.box.reshape(nframes, 3, 3),
+        )
+        extended_coord, extended_atype, mapping = extend_coord_with_ghosts(
+            coord_normalized, self.atype, self.box, rcut
+        )
+        nlist = build_neighbor_list(
+            extended_coord,
+            extended_atype,
+            nloc,
+            rcut,
+            [20, 20],
+            distinguish_types=True,
+        )
+        self.extended_coord = extended_coord.reshape(nframes, -1, 3)
+        self.extended_atype = extended_atype
+        self.mapping = mapping
+        self.nlist = nlist
+
+        # aparam for forward evaluation (1 frame, 6 atoms, 3 aparam)
+        rng = np.random.default_rng(42)
+        self.eval_aparam = rng.normal(size=(1, nloc, 3)).astype(
+            GLOBAL_NP_FLOAT_PRECISION
+        )
+
     def test_translated_output_def(self) -> None:
         """translated_output_def should return the same keys on dp, pt, and pt_expt."""
         dp_def = self.dp_model.translated_output_def()
@@ -278,3 +359,1174 @@ def test_translated_output_def(self) -> None:
         for key in dp_def:
             self.assertEqual(dp_def[key].shape, pt_def[key].shape)
             self.assertEqual(dp_def[key].shape, pt_expt_def[key].shape)
+
+    def test_get_descriptor(self) -> None:
+        """get_descriptor should return a non-None object on both backends."""
+        self.assertIsNotNone(self.dp_model.get_descriptor())
+        self.assertIsNotNone(self.pt_model.get_descriptor())
+
+    def test_get_fitting_net(self) -> None:
+        """get_fitting_net should return a non-None object on both backends."""
+        self.assertIsNotNone(self.dp_model.get_fitting_net())
+        self.assertIsNotNone(self.pt_model.get_fitting_net())
+
+    def test_get_out_bias(self) -> None:
+        """get_out_bias should return numerically equal values on dp and pt.
+
+        PolarModel's apply_out_stat applies diagonal bias with scale,
+        so the bias storage should be consistent across backends.
+        """
+        dp_bias = to_numpy_array(self.dp_model.get_out_bias())
+        pt_bias = torch_to_numpy(self.pt_model.get_out_bias())
+        np.testing.assert_allclose(dp_bias, pt_bias, rtol=1e-10, atol=1e-10)
+        # Verify shape: (n_output_keys x ntypes x 9) for polar
+        self.assertEqual(dp_bias.shape[1], 2)  # ntypes
+        self.assertGreater(dp_bias.shape[0], 0)  # at least one output key
+
+    def test_set_out_bias(self) -> None:
+        """set_out_bias should update the bias on both backends."""
+        dp_bias = to_numpy_array(self.dp_model.get_out_bias())
+        new_bias = dp_bias + 1.0
+        # dp
+        self.dp_model.set_out_bias(new_bias)
+        np.testing.assert_allclose(
+            to_numpy_array(self.dp_model.get_out_bias()),
+            new_bias,
+            rtol=1e-10,
+            atol=1e-10,
+        )
+        # pt
+        self.pt_model.set_out_bias(numpy_to_torch(new_bias))
+        np.testing.assert_allclose(
+            torch_to_numpy(self.pt_model.get_out_bias()),
+            new_bias,
+            rtol=1e-10,
+            atol=1e-10,
+        )
+
+    def test_model_output_def(self) -> None:
+        """model_output_def should return the same keys and shapes on dp and pt."""
+        dp_def = self.dp_model.model_output_def().get_data()
+        pt_def = self.pt_model.model_output_def().get_data()
+        self.assertEqual(set(dp_def.keys()), set(pt_def.keys()))
+        for key in dp_def:
+            self.assertEqual(dp_def[key].shape, pt_def[key].shape)
+
+    def test_model_output_type(self) -> None:
+        """model_output_type should return the same list on dp and pt."""
+        self.assertEqual(
+            self.dp_model.model_output_type(),
+            self.pt_model.model_output_type(),
+        )
+
+    def test_do_grad_r(self) -> None:
+        """do_grad_r should return the same value on dp and pt."""
+        self.assertEqual(
+            self.dp_model.do_grad_r("polarizability"),
+            self.pt_model.do_grad_r("polarizability"),
+        )
+        self.assertFalse(self.dp_model.do_grad_r("polarizability"))
+
+    def test_do_grad_c(self) -> None:
+        """do_grad_c should return the same value on dp and pt."""
+        self.assertEqual(
+            self.dp_model.do_grad_c("polarizability"),
+            self.pt_model.do_grad_c("polarizability"),
+        )
+        self.assertFalse(self.dp_model.do_grad_c("polarizability"))
+
+    def test_get_rcut(self) -> None:
+        """get_rcut should return the same value on dp and pt."""
+        self.assertEqual(self.dp_model.get_rcut(), self.pt_model.get_rcut())
+        self.assertAlmostEqual(self.dp_model.get_rcut(), 6.0)
+
+    def test_get_type_map(self) -> None:
+        """get_type_map should return the same list on dp and pt."""
+        self.assertEqual(self.dp_model.get_type_map(), self.pt_model.get_type_map())
+        self.assertEqual(self.dp_model.get_type_map(), ["O", "H"])
+
+    def test_get_sel(self) -> None:
+        """get_sel should return the same list on dp and pt."""
+        self.assertEqual(self.dp_model.get_sel(), self.pt_model.get_sel())
+        self.assertEqual(self.dp_model.get_sel(), [20, 20])
+
+    def test_get_nsel(self) -> None:
+        """get_nsel should return the same value on dp and pt."""
+        self.assertEqual(self.dp_model.get_nsel(), self.pt_model.get_nsel())
+        self.assertEqual(self.dp_model.get_nsel(), 40)
+
+    def test_get_nnei(self) -> None:
+        """get_nnei should return the same value on dp and pt."""
+        self.assertEqual(self.dp_model.get_nnei(), self.pt_model.get_nnei())
+        self.assertEqual(self.dp_model.get_nnei(), 40)
+
+    def test_mixed_types(self) -> None:
+        """mixed_types should return the same value on dp and pt."""
+        self.assertEqual(self.dp_model.mixed_types(), self.pt_model.mixed_types())
+        # se_e2_a is not mixed-types
+        self.assertFalse(self.dp_model.mixed_types())
+
+    def test_has_message_passing(self) -> None:
+        """has_message_passing should return the same value on dp and pt."""
+        self.assertEqual(
+            self.dp_model.has_message_passing(),
+            self.pt_model.has_message_passing(),
+        )
+        self.assertFalse(self.dp_model.has_message_passing())
+
+    def test_need_sorted_nlist_for_lower(self) -> None:
+        """need_sorted_nlist_for_lower should return the same value on dp and pt."""
+        self.assertEqual(
+            self.dp_model.need_sorted_nlist_for_lower(),
+            self.pt_model.need_sorted_nlist_for_lower(),
+        )
+        self.assertFalse(self.dp_model.need_sorted_nlist_for_lower())
+
+    def test_get_dim_fparam(self) -> None:
+        """get_dim_fparam should return the same value on dp and pt."""
+        self.assertEqual(self.dp_model.get_dim_fparam(), self.pt_model.get_dim_fparam())
+        self.assertEqual(self.dp_model.get_dim_fparam(), 2)
+
+    def test_get_dim_aparam(self) -> None:
+        """get_dim_aparam should return the same value on dp and pt."""
+        self.assertEqual(self.dp_model.get_dim_aparam(), self.pt_model.get_dim_aparam())
+        self.assertEqual(self.dp_model.get_dim_aparam(), 3)
+
+    def test_get_sel_type(self) -> None:
+        """get_sel_type should return the same list on dp and pt."""
+        self.assertEqual(self.dp_model.get_sel_type(), self.pt_model.get_sel_type())
+        self.assertEqual(self.dp_model.get_sel_type(), [0, 1])
+
+    def test_is_aparam_nall(self) -> None:
+        """is_aparam_nall should return the same value on dp and pt."""
+        self.assertEqual(self.dp_model.is_aparam_nall(), self.pt_model.is_aparam_nall())
+        self.assertFalse(self.dp_model.is_aparam_nall())
+
+    def test_atomic_output_def(self) -> None:
+        """atomic_output_def should return the same keys and shapes on dp and pt."""
+        dp_def = self.dp_model.atomic_output_def()
+        pt_def = self.pt_model.atomic_output_def()
+        self.assertEqual(set(dp_def.keys()), set(pt_def.keys()))
+        for key in dp_def.keys():
+            self.assertEqual(dp_def[key].shape, pt_def[key].shape)
+
+    def test_format_nlist(self) -> None:
+        """format_nlist should produce the same result on dp and pt."""
+        dp_nlist = self.dp_model.format_nlist(
+            self.extended_coord,
+            self.extended_atype,
+            self.nlist,
+        )
+        pt_nlist = torch_to_numpy(
+            self.pt_model.format_nlist(
+                numpy_to_torch(self.extended_coord),
+                numpy_to_torch(self.extended_atype),
+                numpy_to_torch(self.nlist),
+            )
+        )
+        np.testing.assert_equal(dp_nlist, pt_nlist)
+
+    def test_forward_common_atomic(self) -> None:
+        """forward_common_atomic should produce consistent results on dp and pt.
+
+        Compares at the atomic_model level, where both backends define this method.
+        """
+        dp_ret = self.dp_model.atomic_model.forward_common_atomic(
+            self.extended_coord,
+            self.extended_atype,
+            self.nlist,
+            mapping=self.mapping,
+            aparam=self.eval_aparam,
+        )
+        pt_ret = self.pt_model.atomic_model.forward_common_atomic(
+            numpy_to_torch(self.extended_coord),
+            numpy_to_torch(self.extended_atype),
+            numpy_to_torch(self.nlist),
+            mapping=numpy_to_torch(self.mapping),
+            aparam=numpy_to_torch(self.eval_aparam),
+        )
+        # Compare the common keys
+        common_keys = set(dp_ret.keys()) & set(pt_ret.keys())
+        self.assertTrue(len(common_keys) > 0)
+        for key in common_keys:
+            if dp_ret[key] is not None and pt_ret[key] is not None:
+                np.testing.assert_allclose(
+                    dp_ret[key],
+                    torch_to_numpy(pt_ret[key]),
+                    rtol=1e-10,
+                    atol=1e-10,
+                    err_msg=f"Mismatch in forward_common_atomic key '{key}'",
+                )
+
+    def test_has_default_fparam(self) -> None:
+        """has_default_fparam should return the same value on dp and pt."""
+        self.assertEqual(
+            self.dp_model.has_default_fparam(),
+            self.pt_model.has_default_fparam(),
+        )
+        self.assertTrue(self.dp_model.has_default_fparam())
+
+    def test_get_default_fparam(self) -> None:
+        """get_default_fparam should return consistent values on dp and pt."""
+        dp_val = self.dp_model.get_default_fparam()
+        pt_val = self.pt_model.get_default_fparam()
+        np.testing.assert_allclose(dp_val, pt_val, rtol=1e-10, atol=1e-10)
+        np.testing.assert_allclose(dp_val, [0.5, -0.3], rtol=1e-10, atol=1e-10)
+
+    def _get_fitting_stats(self, model, backend="dp"):
+        """Extract fparam/aparam stats from a model's fitting net."""
+        fitting = model.get_fitting_net()
+        if backend == "pt":
+            return {
+                "fparam_avg": torch_to_numpy(fitting.fparam_avg),
+                "fparam_inv_std": torch_to_numpy(fitting.fparam_inv_std),
+                "aparam_avg": torch_to_numpy(fitting.aparam_avg),
+                "aparam_inv_std": torch_to_numpy(fitting.aparam_inv_std),
+            }
+        else:
+            return {
+                "fparam_avg": to_numpy_array(fitting.fparam_avg),
+                "fparam_inv_std": to_numpy_array(fitting.fparam_inv_std),
+                "aparam_avg": to_numpy_array(fitting.aparam_avg),
+                "aparam_inv_std": to_numpy_array(fitting.aparam_inv_std),
+            }
+
+    def test_change_out_bias(self) -> None:
+        """change_out_bias should produce consistent bias and fitting stats on dp, pt, and pt_expt.
+
+        PolarModel's apply_out_stat applies diagonal bias with scale,
+        so set-by-statistic should change the bias from initial values.
+        """
+        nframes = 2
+        nloc = 6
+        numb_fparam = 2
+        numb_aparam = 3
+        rng = np.random.default_rng(123)
+
+        # Use realistic coords (from setUp, tiled for 2 frames)
+        coords_2f = np.tile(self.coords, (nframes, 1, 1))  # (2, 6, 3)
+        atype_2f = np.array([[0, 0, 1, 1, 1, 1], [0, 1, 1, 0, 1, 1]], dtype=np.int32)
+        box_2f = np.tile(self.box.reshape(1, 3, 3), (nframes, 1, 1))
+        natoms_data = np.array([[6, 6, 2, 4], [6, 6, 2, 4]], dtype=np.int32)
+        polar_data = rng.normal(size=(nframes, 9)).astype(GLOBAL_NP_FLOAT_PRECISION)
+        fparam_data = rng.normal(size=(nframes, numb_fparam)).astype(
+            GLOBAL_NP_FLOAT_PRECISION
+        )
+        aparam_data = rng.normal(size=(nframes, nloc, numb_aparam)).astype(
+            GLOBAL_NP_FLOAT_PRECISION
+        )
+
+        # dpmodel stat data (numpy)
+        dp_merged = [
+            {
+                "coord": coords_2f,
+                "atype": atype_2f,
+                "atype_ext": atype_2f,
+                "box": box_2f,
+                "natoms": natoms_data,
+                "polarizability": polar_data,
+                "find_polarizability": np.float32(1.0),
+                "fparam": fparam_data,
+                "aparam": aparam_data,
+            }
+        ]
+        # pt stat data (torch tensors)
+        pt_merged = [
+            {
+                "coord": numpy_to_torch(coords_2f),
+                "atype": numpy_to_torch(atype_2f),
+                "atype_ext": numpy_to_torch(atype_2f),
+                "box": numpy_to_torch(box_2f),
+                "natoms": numpy_to_torch(natoms_data),
+                "polarizability": numpy_to_torch(polar_data),
+                "find_polarizability": np.float32(1.0),
+                "fparam": numpy_to_torch(fparam_data),
+                "aparam": numpy_to_torch(aparam_data),
+            }
+        ]
+        # pt_expt stat data (numpy, same as dp)
+        pe_merged = dp_merged
+
+        # Save initial fitting stats (all zeros / ones)
+        dp_stats_init = self._get_fitting_stats(self.dp_model, "dp")
+
+        # Save initial (zero) bias
+        dp_bias_init = to_numpy_array(self.dp_model.get_out_bias()).copy()
+
+        # --- Test "set-by-statistic" mode ---
+        self.dp_model.change_out_bias(dp_merged, bias_adjust_mode="set-by-statistic")
+        self.pt_model.change_out_bias(pt_merged, bias_adjust_mode="set-by-statistic")
+        self.pt_expt_model.change_out_bias(
+            pe_merged, bias_adjust_mode="set-by-statistic"
+        )
+
+        # Verify out bias consistency
+        dp_bias = to_numpy_array(self.dp_model.get_out_bias())
+        pt_bias = torch_to_numpy(self.pt_model.get_out_bias())
+        pe_bias = to_numpy_array(self.pt_expt_model.get_out_bias())
+        np.testing.assert_allclose(dp_bias, pt_bias, rtol=1e-10, atol=1e-10)
+        np.testing.assert_allclose(dp_bias, pe_bias, rtol=1e-10, atol=1e-10)
+
+        # Verify fitting input stats were updated (set-by-statistic triggers compute_fitting_input_stat)
+        dp_stats_set = self._get_fitting_stats(self.dp_model, "dp")
+        pt_stats_set = self._get_fitting_stats(self.pt_model, "pt")
+        pe_stats_set = self._get_fitting_stats(self.pt_expt_model, "dp")
+        for stat_key in (
+            "fparam_avg",
+            "fparam_inv_std",
+            "aparam_avg",
+            "aparam_inv_std",
+        ):
+            np.testing.assert_allclose(
+                dp_stats_set[stat_key],
+                pt_stats_set[stat_key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"dp vs pt {stat_key} mismatch after set-by-statistic",
+            )
+            np.testing.assert_allclose(
+                dp_stats_set[stat_key],
+                pe_stats_set[stat_key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"dp vs pt_expt {stat_key} mismatch after set-by-statistic",
+            )
+        # Verify fparam/aparam stats actually changed from initial values
+        self.assertFalse(
+            np.allclose(dp_stats_set["fparam_avg"], dp_stats_init["fparam_avg"]),
+            "set-by-statistic did not update fparam_avg",
+        )
+        self.assertFalse(
+            np.allclose(dp_stats_set["aparam_avg"], dp_stats_init["aparam_avg"]),
+            "set-by-statistic did not update aparam_avg",
+        )
+
+        # --- Test "change-by-statistic" mode ---
+        dp_bias_before = dp_bias.copy()
+        self.dp_model.change_out_bias(dp_merged, bias_adjust_mode="change-by-statistic")
+        self.pt_model.change_out_bias(pt_merged, bias_adjust_mode="change-by-statistic")
+        self.pt_expt_model.change_out_bias(
+            pe_merged, bias_adjust_mode="change-by-statistic"
+        )
+
+        # Verify out bias consistency
+        dp_bias2 = to_numpy_array(self.dp_model.get_out_bias())
+        pt_bias2 = torch_to_numpy(self.pt_model.get_out_bias())
+        pe_bias2 = to_numpy_array(self.pt_expt_model.get_out_bias())
+        np.testing.assert_allclose(dp_bias2, pt_bias2, rtol=1e-10, atol=1e-10)
+        np.testing.assert_allclose(dp_bias2, pe_bias2, rtol=1e-10, atol=1e-10)
+
+        # Verify fitting input stats did NOT change (change-by-statistic should not recompute them)
+        dp_stats_chg = self._get_fitting_stats(self.dp_model, "dp")
+        pt_stats_chg = self._get_fitting_stats(self.pt_model, "pt")
+        pe_stats_chg = self._get_fitting_stats(self.pt_expt_model, "dp")
+        for stat_key in (
+            "fparam_avg",
+            "fparam_inv_std",
+            "aparam_avg",
+            "aparam_inv_std",
+        ):
+            np.testing.assert_allclose(
+                dp_stats_chg[stat_key],
+                dp_stats_set[stat_key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"dp {stat_key} changed after change-by-statistic (should not)",
+            )
+            np.testing.assert_allclose(
+                pt_stats_chg[stat_key],
+                pt_stats_set[stat_key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"pt {stat_key} changed after change-by-statistic (should not)",
+            )
+            np.testing.assert_allclose(
+                pe_stats_chg[stat_key],
+                pe_stats_set[stat_key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"pt_expt {stat_key} changed after change-by-statistic (should not)",
+            )
+
+    def test_change_type_map(self) -> None:
+        """change_type_map should produce consistent results on dp and pt.
+
+        Uses a DPA1 (se_atten) descriptor since se_e2_a does not support
+        change_type_map (non-mixed-types descriptors raise NotImplementedError).
+        """
+        from deepmd.utils.argcheck import model_args as model_args_fn
+
+        data = model_args_fn().normalize_value(
+            {
+                "type_map": ["O", "H"],
+                "descriptor": {
+                    "type": "se_atten",
+                    "sel": 20,
+                    "rcut_smth": 0.50,
+                    "rcut": 6.00,
+                    "neuron": [3, 6],
+                    "resnet_dt": False,
+                    "axis_neuron": 2,
+                    "precision": "float64",
+                    "seed": 1,
+                    "attn": 6,
+                    "attn_layer": 0,
+                },
+                "fitting_net": {
+                    "type": "polar",
+                    "neuron": [4, 4, 4],
+                    "resnet_dt": True,
+                    "precision": "float64",
+                    "seed": 1,
+                },
+            },
+            trim_pattern="_*",
+        )
+        dp_model = get_model_dp(data)
+        pt_model = PolarModelPT.deserialize(dp_model.serialize())
+
+        # Set non-zero out_bias so the swap is non-trivial
+        dp_bias_orig = to_numpy_array(dp_model.get_out_bias()).copy()
+        new_bias = dp_bias_orig.copy()
+        new_bias[:, 0, :] = 1.5  # type 0 ("O")
+        new_bias[:, 1, :] = -3.7  # type 1 ("H")
+        dp_model.set_out_bias(new_bias)
+        pt_model.set_out_bias(numpy_to_torch(new_bias))
+
+        new_type_map = ["H", "O"]
+        dp_model.change_type_map(new_type_map)
+        pt_model.change_type_map(new_type_map)
+
+        # Both should have the new type_map
+        self.assertEqual(dp_model.get_type_map(), new_type_map)
+        self.assertEqual(pt_model.get_type_map(), new_type_map)
+
+        # Out_bias should be reordered consistently between backends
+        dp_bias_new = to_numpy_array(dp_model.get_out_bias())
+        pt_bias_new = torch_to_numpy(pt_model.get_out_bias())
+        np.testing.assert_allclose(dp_bias_new, pt_bias_new, rtol=1e-10, atol=1e-10)
+
+        # Verify the reorder is correct: old type 0 -> new type 1, old type 1 -> new type 0
+        np.testing.assert_allclose(
+            dp_bias_new[:, 0, :],
+            new_bias[:, 1, :],
+            rtol=1e-10,
+            atol=1e-10,
+        )
+        np.testing.assert_allclose(
+            dp_bias_new[:, 1, :],
+            new_bias[:, 0, :],
+            rtol=1e-10,
+            atol=1e-10,
+        )
+
+    def test_change_type_map_extend_stat(self) -> None:
+        """change_type_map with model_with_new_type_stat should propagate stats consistently across dp, pt, and pt_expt.
+
+        Verifies that the model-level change_type_map correctly unwraps
+        model_with_new_type_stat.atomic_model before forwarding to the
+        atomic model.
+        """
+        from deepmd.utils.argcheck import model_args as model_args_fn
+
+        small_tm = ["O", "H"]
+        large_tm = ["O", "H", "Li"]
+
+        small_data = model_args_fn().normalize_value(
+            {
+                "type_map": small_tm,
+                "descriptor": {
+                    "type": "se_atten",
+                    "sel": 20,
+                    "rcut_smth": 0.50,
+                    "rcut": 6.00,
+                    "neuron": [3, 6],
+                    "resnet_dt": False,
+                    "axis_neuron": 2,
+                    "precision": "float64",
+                    "seed": 1,
+                    "attn": 6,
+                    "attn_layer": 0,
+                },
+                "fitting_net": {
+                    "type": "polar",
+                    "neuron": [4, 4, 4],
+                    "resnet_dt": True,
+                    "precision": "float64",
+                    "seed": 1,
+                },
+            },
+            trim_pattern="_*",
+        )
+        large_data = model_args_fn().normalize_value(
+            {
+                "type_map": large_tm,
+                "descriptor": {
+                    "type": "se_atten",
+                    "sel": 20,
+                    "rcut_smth": 0.50,
+                    "rcut": 6.00,
+                    "neuron": [3, 6],
+                    "resnet_dt": False,
+                    "axis_neuron": 2,
+                    "precision": "float64",
+                    "seed": 2,
+                    "attn": 6,
+                    "attn_layer": 0,
+                },
+                "fitting_net": {
+                    "type": "polar",
+                    "neuron": [4, 4, 4],
+                    "resnet_dt": True,
+                    "precision": "float64",
+                    "seed": 2,
+                },
+            },
+            trim_pattern="_*",
+        )
+
+        dp_small = get_model_dp(small_data)
+        dp_large = get_model_dp(large_data)
+
+        # Set distinguishable random stats on the large model's descriptor
+        rng = np.random.default_rng(42)
+        desc_large = dp_large.get_descriptor()
+        mean_large, std_large = desc_large.get_stat_mean_and_stddev()
+        mean_rand = rng.random(size=to_numpy_array(mean_large).shape)
+        std_rand = rng.random(size=to_numpy_array(std_large).shape)
+        desc_large.set_stat_mean_and_stddev(mean_rand, std_rand)
+
+        # Build pt and pt_expt models from dp serialization
+        pt_small = PolarModelPT.deserialize(dp_small.serialize())
+        pt_large = PolarModelPT.deserialize(dp_large.serialize())
+        pt_expt_small = PolarModelPTExpt.deserialize(dp_small.serialize())
+        pt_expt_large = PolarModelPTExpt.deserialize(dp_large.serialize())
+
+        # Extend type map with model_with_new_type_stat at the model level
+        dp_small.change_type_map(large_tm, model_with_new_type_stat=dp_large)
+        pt_small.change_type_map(large_tm, model_with_new_type_stat=pt_large)
+        pt_expt_small.change_type_map(large_tm, model_with_new_type_stat=pt_expt_large)
+
+        # Descriptor stats should be consistent across backends
+        dp_mean, dp_std = dp_small.get_descriptor().get_stat_mean_and_stddev()
+        pt_mean, pt_std = pt_small.get_descriptor().get_stat_mean_and_stddev()
+        pt_expt_mean, pt_expt_std = (
+            pt_expt_small.get_descriptor().get_stat_mean_and_stddev()
+        )
+        np.testing.assert_allclose(
+            to_numpy_array(dp_mean),
+            torch_to_numpy(pt_mean),
+            rtol=1e-10,
+            atol=1e-10,
+        )
+        np.testing.assert_allclose(
+            to_numpy_array(dp_std),
+            torch_to_numpy(pt_std),
+            rtol=1e-10,
+            atol=1e-10,
+        )
+        np.testing.assert_allclose(
+            to_numpy_array(dp_mean),
+            to_numpy_array(pt_expt_mean),
+            rtol=1e-10,
+            atol=1e-10,
+        )
+        np.testing.assert_allclose(
+            to_numpy_array(dp_std),
+            to_numpy_array(pt_expt_std),
+            rtol=1e-10,
+            atol=1e-10,
+        )
+
+    def test_update_sel(self) -> None:
+        """update_sel should return the same result on dp and pt."""
+        from unittest.mock import (
+            patch,
+        )
+
+        from deepmd.dpmodel.model.dp_model import DPModelCommon as DPModelCommonDP
+        from deepmd.pt.model.model.dp_model import DPModelCommon as DPModelCommonPT
+
+        mock_min_nbor_dist = 0.5
+        mock_sel = [10, 20]
+        local_jdata = {
+            "type_map": ["O", "H"],
+            "descriptor": {
+                "type": "se_e2_a",
+                "sel": "auto",
+                "rcut_smth": 0.50,
+                "rcut": 6.00,
+            },
+            "fitting_net": {
+                "type": "polar",
+                "neuron": [4, 4, 4],
+            },
+        }
+        type_map = ["O", "H"]
+
+        with patch(
+            "deepmd.dpmodel.utils.update_sel.UpdateSel.get_nbor_stat",
+            return_value=(mock_min_nbor_dist, mock_sel),
+        ):
+            dp_result, dp_min_dist = DPModelCommonDP.update_sel(
+                None, type_map, local_jdata
+            )
+
+        with patch(
+            "deepmd.pt.utils.update_sel.UpdateSel.get_nbor_stat",
+            return_value=(mock_min_nbor_dist, mock_sel),
+        ):
+            pt_result, pt_min_dist = DPModelCommonPT.update_sel(
+                None, type_map, local_jdata
+            )
+
+        self.assertEqual(dp_result, pt_result)
+        self.assertEqual(dp_min_dist, pt_min_dist)
+        # Verify sel was actually updated (not still "auto")
+        self.assertIsInstance(dp_result["descriptor"]["sel"], list)
+        self.assertNotEqual(dp_result["descriptor"]["sel"], "auto")
+
+    def test_get_ntypes(self) -> None:
+        """get_ntypes should return the same value on dp and pt."""
+        self.assertEqual(self.dp_model.get_ntypes(), self.pt_model.get_ntypes())
+        self.assertEqual(self.dp_model.get_ntypes(), 2)
+
+    def test_compute_or_load_out_stat(self) -> None:
+        """compute_or_load_out_stat should produce consistent bias on dp and pt.
+
+        Tests both the compute path (from data) and the load path (from file).
+        PolarModel's apply_out_stat applies diagonal bias with scale,
+        so the stored bias should be consistent across backends.
+        """
+        import tempfile
+        from pathlib import (
+            Path,
+        )
+
+        import h5py
+
+        from deepmd.utils.path import (
+            DPPath,
+        )
+
+        nframes = 2
+        coords_2f = np.tile(self.coords, (nframes, 1, 1))
+        atype_2f = np.array([[0, 0, 1, 1, 1, 1], [0, 1, 1, 0, 1, 1]], dtype=np.int32)
+        box_2f = np.tile(self.box.reshape(1, 3, 3), (nframes, 1, 1))
+        natoms_data = np.array([[6, 6, 2, 4], [6, 6, 2, 4]], dtype=np.int32)
+        polar_data = (
+            np.random.default_rng(42)
+            .normal(size=(nframes, 9))
+            .astype(GLOBAL_NP_FLOAT_PRECISION)
+        )
+
+        dp_merged = [
+            {
+                "coord": coords_2f,
+                "atype": atype_2f,
+                "atype_ext": atype_2f,
+                "box": box_2f,
+                "natoms": natoms_data,
+                "polarizability": polar_data,
+                "find_polarizability": np.float32(1.0),
+            }
+        ]
+        pt_merged = [
+            {
+                "coord": numpy_to_torch(coords_2f),
+                "atype": numpy_to_torch(atype_2f),
+                "atype_ext": numpy_to_torch(atype_2f),
+                "box": numpy_to_torch(box_2f),
+                "natoms": numpy_to_torch(natoms_data),
+                "polarizability": numpy_to_torch(polar_data),
+                "find_polarizability": np.float32(1.0),
+            }
+        ]
+
+        # Verify bias is initially identical
+        dp_bias_before = to_numpy_array(self.dp_model.get_out_bias()).copy()
+        pt_bias_before = torch_to_numpy(self.pt_model.get_out_bias()).copy()
+        np.testing.assert_allclose(
+            dp_bias_before, pt_bias_before, rtol=1e-10, atol=1e-10
+        )
+
+        with tempfile.TemporaryDirectory() as tmpdir:
+            # Create separate h5 files for dp and pt
+            dp_h5 = str((Path(tmpdir) / "dp_stat.h5").resolve())
+            pt_h5 = str((Path(tmpdir) / "pt_stat.h5").resolve())
+            with h5py.File(dp_h5, "w"):
+                pass
+            with h5py.File(pt_h5, "w"):
+                pass
+            dp_stat_path = DPPath(dp_h5, "a")
+            pt_stat_path = DPPath(pt_h5, "a")
+
+            # 1. Compute stats and save to file
+            self.dp_model.atomic_model.compute_or_load_out_stat(
+                dp_merged, stat_file_path=dp_stat_path
+            )
+            self.pt_model.atomic_model.compute_or_load_out_stat(
+                pt_merged, stat_file_path=pt_stat_path
+            )
+
+            dp_bias_after = to_numpy_array(self.dp_model.get_out_bias())
+            pt_bias_after = torch_to_numpy(self.pt_model.get_out_bias())
+            np.testing.assert_allclose(
+                dp_bias_after, pt_bias_after, rtol=1e-10, atol=1e-10
+            )
+
+            # 2. Verify both backends saved the same file content
+            with h5py.File(dp_h5, "r") as dp_f, h5py.File(pt_h5, "r") as pt_f:
+                dp_keys = sorted(dp_f.keys())
+                pt_keys = sorted(pt_f.keys())
+                self.assertEqual(dp_keys, pt_keys)
+                for key in dp_keys:
+                    np.testing.assert_allclose(
+                        np.array(dp_f[key]),
+                        np.array(pt_f[key]),
+                        rtol=1e-10,
+                        atol=1e-10,
+                        err_msg=f"Stat file content mismatch for key {key}",
+                    )
+
+            # 3. Reset biases to zero, then load from file
+            zero_bias = np.zeros_like(dp_bias_after)
+            self.dp_model.set_out_bias(zero_bias)
+            self.pt_model.set_out_bias(numpy_to_torch(zero_bias))
+
+            # Use a callable that raises to ensure it loads from file, not recomputes
+            def raise_error():
+                raise RuntimeError("Should not recompute — should load from file")
+
+            self.dp_model.atomic_model.compute_or_load_out_stat(
+                raise_error, stat_file_path=dp_stat_path
+            )
+            self.pt_model.atomic_model.compute_or_load_out_stat(
+                raise_error, stat_file_path=pt_stat_path
+            )
+
+            dp_bias_loaded = to_numpy_array(self.dp_model.get_out_bias())
+            pt_bias_loaded = torch_to_numpy(self.pt_model.get_out_bias())
+
+            # Loaded biases should match between backends
+            np.testing.assert_allclose(
+                dp_bias_loaded, pt_bias_loaded, rtol=1e-10, atol=1e-10
+            )
+            # Loaded biases should match the originally computed biases
+            np.testing.assert_allclose(
+                dp_bias_loaded, dp_bias_after, rtol=1e-10, atol=1e-10
+            )
+
+    def test_get_observed_type_list(self) -> None:
+        """get_observed_type_list should be consistent across dp, pt, pt_expt.
+
+        Uses mock data containing only type 0 ("O") so that type 1 ("H") is
+        unobserved and should be absent from the returned list.
+        """
+        nframes = 2
+        natoms = 6
+        # All atoms are type 0 — type 1 is unobserved
+        atype_2f = np.zeros((nframes, natoms), dtype=np.int32)
+        coords_2f = np.tile(self.coords, (nframes, 1, 1))
+        box_2f = np.tile(self.box.reshape(1, 3, 3), (nframes, 1, 1))
+        natoms_data = np.array([[natoms, natoms, natoms, 0]] * nframes, dtype=np.int32)
+        polar_data = (
+            np.random.default_rng(42)
+            .normal(size=(nframes, 9))
+            .astype(GLOBAL_NP_FLOAT_PRECISION)
+        )
+
+        dp_merged = [
+            {
+                "coord": coords_2f,
+                "atype": atype_2f,
+                "atype_ext": atype_2f,
+                "box": box_2f,
+                "natoms": natoms_data,
+                "polarizability": polar_data,
+                "find_polarizability": np.float32(1.0),
+            }
+        ]
+        pt_merged = [
+            {
+                "coord": numpy_to_torch(coords_2f),
+                "atype": numpy_to_torch(atype_2f),
+                "atype_ext": numpy_to_torch(atype_2f),
+                "box": numpy_to_torch(box_2f),
+                "natoms": numpy_to_torch(natoms_data),
+                "polarizability": numpy_to_torch(polar_data),
+                "find_polarizability": np.float32(1.0),
+            }
+        ]
+
+        self.dp_model.atomic_model.compute_or_load_out_stat(dp_merged)
+        self.pt_model.atomic_model.compute_or_load_out_stat(pt_merged)
+        self.pt_expt_model.atomic_model.compute_or_load_out_stat(dp_merged)
+
+        dp_observed = self.dp_model.get_observed_type_list()
+        pt_observed = self.pt_model.get_observed_type_list()
+        pe_observed = self.pt_expt_model.get_observed_type_list()
+
+        self.assertEqual(dp_observed, pt_observed)
+        self.assertEqual(dp_observed, pe_observed)
+        # Only type 0 ("O") should be observed
+        self.assertEqual(dp_observed, ["O"])
+
+
+def _compare_variables_recursive(
+    d1: dict, d2: dict, path: str = "", rtol: float = 1e-10, atol: float = 1e-10
+) -> None:
+    """Recursively compare ``@variables`` sections in two serialized dicts."""
+    for key in d1:
+        if key not in d2:
+            continue
+        child_path = f"{path}/{key}" if path else key
+        v1, v2 = d1[key], d2[key]
+        if key == "@variables" and isinstance(v1, dict) and isinstance(v2, dict):
+            for vk in v1:
+                if vk not in v2:
+                    continue
+                a1 = np.asarray(v1[vk]) if v1[vk] is not None else None
+                a2 = np.asarray(v2[vk]) if v2[vk] is not None else None
+                if a1 is None and a2 is None:
+                    continue
+                np.testing.assert_allclose(
+                    a1,
+                    a2,
+                    rtol=rtol,
+                    atol=atol,
+                    err_msg=f"@variables mismatch at {child_path}/{vk}",
+                )
+        elif isinstance(v1, dict) and isinstance(v2, dict):
+            _compare_variables_recursive(v1, v2, child_path, rtol, atol)
+
+
+@parameterized(
+    (([], []), ([[0, 1]], [1])),  # (pair_exclude_types, atom_exclude_types)
+    (False, True),  # fparam_in_data
+)
+@unittest.skipUnless(INSTALLED_PT and INSTALLED_PT_EXPT, "PT and PT_EXPT are required")
+class TestPolarComputeOrLoadStat(unittest.TestCase):
+    """Test that compute_or_load_stat produces identical statistics on dp, pt, and pt_expt.
+
+    Covers descriptor stats (dstd), fitting stats (fparam, aparam), and output bias.
+    Parameterized over exclusion types and whether fparam is explicitly provided or
+    injected via default_fparam.
+    """
+
+    def setUp(self) -> None:
+        (pair_exclude_types, atom_exclude_types), self.fparam_in_data = self.param
+        data = model_args().normalize_value(
+            {
+                "type_map": ["O", "H"],
+                "pair_exclude_types": pair_exclude_types,
+                "atom_exclude_types": atom_exclude_types,
+                "descriptor": {
+                    "type": "dpa3",
+                    "repflow": {
+                        "n_dim": 20,
+                        "e_dim": 10,
+                        "a_dim": 8,
+                        "nlayers": 3,
+                        "e_rcut": 6.0,
+                        "e_rcut_smth": 5.0,
+                        "e_sel": 10,
+                        "a_rcut": 4.0,
+                        "a_rcut_smth": 3.5,
+                        "a_sel": 8,
+                        "axis_neuron": 4,
+                        "update_angle": True,
+                        "update_style": "res_residual",
+                        "update_residual": 0.1,
+                        "update_residual_init": "const",
+                    },
+                    "precision": "float64",
+                    "seed": 1,
+                },
+                "fitting_net": {
+                    "type": "polar",
+                    "neuron": [10, 10],
+                    "precision": "float64",
+                    "seed": 1,
+                    "numb_fparam": 2,
+                    "default_fparam": [0.5, -0.3],
+                    "numb_aparam": 3,
+                },
+            },
+            trim_pattern="_*",
+        )
+
+        # Save data for reuse in load-from-file test
+        self._model_data = data
+
+        # Build dp model, then deserialize into pt and pt_expt to share weights
+        self.dp_model = get_model_dp(data)
+        serialized = self.dp_model.serialize()
+        self.pt_model = PolarModelPT.deserialize(serialized)
+        self.pt_expt_model = PolarModelPTExpt.deserialize(serialized)
+
+        # Test coords / atype / box for forward evaluation
+        self.coords = np.array(
+            [
+                12.83,
+                2.56,
+                2.18,
+                12.09,
+                2.87,
+                2.74,
+                0.25,
+                3.32,
+                1.68,
+                3.36,
+                3.00,
+                1.81,
+                3.51,
+                2.51,
+                2.60,
+                4.27,
+                3.22,
+                1.56,
+            ],
+            dtype=GLOBAL_NP_FLOAT_PRECISION,
+        ).reshape(1, -1, 3)
+        self.atype = np.array([0, 1, 1, 0, 1, 1], dtype=np.int32).reshape(1, -1)
+        self.box = np.array(
+            [13.0, 0.0, 0.0, 0.0, 13.0, 0.0, 0.0, 0.0, 13.0],
+            dtype=GLOBAL_NP_FLOAT_PRECISION,
+        ).reshape(1, 9)
+
+        # Mock training data for compute_or_load_stat
+        natoms = 6
+        nframes = 3
+        rng = np.random.default_rng(42)
+        coords_stat = rng.normal(size=(nframes, natoms, 3)).astype(
+            GLOBAL_NP_FLOAT_PRECISION
+        )
+        atype_stat = np.array([[0, 0, 1, 1, 1, 1]] * nframes, dtype=np.int32)
+        box_stat = np.tile(
+            np.eye(3, dtype=GLOBAL_NP_FLOAT_PRECISION).reshape(1, 3, 3) * 13.0,
+            (nframes, 1, 1),
+        )
+        natoms_stat = np.array([[natoms, natoms, 2, 4]] * nframes, dtype=np.int32)
+        polar_stat = rng.normal(size=(nframes, 9)).astype(GLOBAL_NP_FLOAT_PRECISION)
+        aparam_stat = rng.normal(size=(nframes, natoms, 3)).astype(
+            GLOBAL_NP_FLOAT_PRECISION
+        )
+
+        # dp / pt_expt sample (numpy)
+        np_sample = {
+            "coord": coords_stat,
+            "atype": atype_stat,
+            "atype_ext": atype_stat,
+            "box": box_stat,
+            "natoms": natoms_stat,
+            "polarizability": polar_stat,
+            "find_polarizability": np.float32(1.0),
+            "aparam": aparam_stat,
+        }
+        # pt sample (torch tensors)
+        pt_sample = {
+            "coord": numpy_to_torch(coords_stat),
+            "atype": numpy_to_torch(atype_stat),
+            "atype_ext": numpy_to_torch(atype_stat),
+            "box": numpy_to_torch(box_stat),
+            "natoms": numpy_to_torch(natoms_stat),
+            "polarizability": numpy_to_torch(polar_stat),
+            "find_polarizability": np.float32(1.0),
+            "aparam": numpy_to_torch(aparam_stat),
+        }
+
+        if self.fparam_in_data:
+            fparam_stat = rng.normal(size=(nframes, 2)).astype(
+                GLOBAL_NP_FLOAT_PRECISION
+            )
+            np_sample["fparam"] = fparam_stat
+            pt_sample["fparam"] = numpy_to_torch(fparam_stat)
+            self.expected_fparam_avg = np.mean(fparam_stat, axis=0)
+        else:
+            # No fparam → _make_wrapped_sampler injects default_fparam
+            self.expected_fparam_avg = np.array([0.5, -0.3])
+
+        self.np_sampled = [np_sample]
+        self.pt_sampled = [pt_sample]
+
+        # aparam for forward evaluation (1 frame, 6 atoms, 3 aparam)
+        self.eval_aparam = rng.normal(size=(1, natoms, 3)).astype(
+            GLOBAL_NP_FLOAT_PRECISION
+        )
+
+    def _eval_dp(self) -> dict:
+        return self.dp_model(
+            self.coords, self.atype, box=self.box, aparam=self.eval_aparam
+        )
+
+    def _eval_pt(self) -> dict:
+        return {
+            kk: torch_to_numpy(vv)
+            for kk, vv in self.pt_model(
+                numpy_to_torch(self.coords),
+                numpy_to_torch(self.atype),
+                box=numpy_to_torch(self.box),
+                aparam=numpy_to_torch(self.eval_aparam),
+                do_atomic_virial=True,
+            ).items()
+        }
+
+    def _eval_pt_expt(self) -> dict:
+        coord_t = pt_expt_numpy_to_torch(self.coords)
+        coord_t.requires_grad_(True)
+        return {
+            k: v.detach().cpu().numpy()
+            for k, v in self.pt_expt_model(
+                coord_t,
+                pt_expt_numpy_to_torch(self.atype),
+                box=pt_expt_numpy_to_torch(self.box),
+                aparam=pt_expt_numpy_to_torch(self.eval_aparam),
+                do_atomic_virial=True,
+            ).items()
+        }
+
+    def test_compute_stat(self) -> None:
+        # 1. Pre-stat forward consistency
+        dp_ret0 = self._eval_dp()
+        pt_ret0 = self._eval_pt()
+        pe_ret0 = self._eval_pt_expt()
+        for key in ("global_polar", "polar"):
+            np.testing.assert_allclose(
+                dp_ret0[key],
+                pt_ret0[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"Pre-stat dp vs pt mismatch in {key}",
+            )
+            np.testing.assert_allclose(
+                dp_ret0[key],
+                pe_ret0[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"Pre-stat dp vs pt_expt mismatch in {key}",
+            )
+
+        # 2. Run compute_or_load_stat on all three backends
+        self.dp_model.compute_or_load_stat(lambda: self.np_sampled)
+        self.pt_model.compute_or_load_stat(lambda: self.pt_sampled)
+        self.pt_expt_model.compute_or_load_stat(lambda: self.np_sampled)
+
+        # 3. Serialize all three and compare @variables
+        dp_ser = self.dp_model.serialize()
+        pt_ser = self.pt_model.serialize()
+        pe_ser = self.pt_expt_model.serialize()
+        _compare_variables_recursive(dp_ser, pt_ser)
+        _compare_variables_recursive(dp_ser, pe_ser)
+
+        # 4. Post-stat forward consistency
+        # PolarModel's apply_out_stat applies diagonal bias with scale, so
+        # output values WILL differ from pre-stat after stat computation.
+        dp_ret1 = self._eval_dp()
+        pt_ret1 = self._eval_pt()
+        pe_ret1 = self._eval_pt_expt()
+        for key in ("global_polar", "polar"):
+            np.testing.assert_allclose(
+                dp_ret1[key],
+                pt_ret1[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"Post-stat dp vs pt mismatch in {key}",
+            )
+            np.testing.assert_allclose(
+                dp_ret1[key],
+                pe_ret1[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"Post-stat dp vs pt_expt mismatch in {key}",
+            )
+
+        # 5. Non-triviality checks
+        fit_vars = dp_ser["fitting"]["@variables"]
+        # fparam stats were computed
+        fparam_avg = np.asarray(fit_vars["fparam_avg"])
+        self.assertFalse(
+            np.allclose(fparam_avg, 0.0),
+            "fparam_avg is still zero — fparam stats were not computed",
+        )
+        np.testing.assert_allclose(
+            fparam_avg,
+            self.expected_fparam_avg,
+            rtol=1e-10,
+            atol=1e-10,
+            err_msg="fparam_avg does not match expected values",
+        )
+        # aparam stats were computed
+        aparam_avg = np.asarray(fit_vars["aparam_avg"])
+        self.assertFalse(
+            np.allclose(aparam_avg, 0.0),
+            "aparam_avg is still zero — aparam stats were not computed",
+        )
+
+    def test_load_stat_from_file(self) -> None:
+        import tempfile
+        from pathlib import (
+            Path,
+        )
+
+        import h5py
+
+        from deepmd.utils.path import (
+            DPPath,
+        )
+
+        with tempfile.TemporaryDirectory() as tmpdir:
+            # Create separate stat files for each backend
+            dp_h5 = str((Path(tmpdir) / "dp_stat.h5").resolve())
+            pt_h5 = str((Path(tmpdir) / "pt_stat.h5").resolve())
+            pe_h5 = str((Path(tmpdir) / "pe_stat.h5").resolve())
+            for p in (dp_h5, pt_h5, pe_h5):
+                with h5py.File(p, "w"):
+                    pass
+
+            # 1. Compute stats and save to file
+            self.dp_model.compute_or_load_stat(
+                lambda: self.np_sampled, stat_file_path=DPPath(dp_h5, "a")
+            )
+            self.pt_model.compute_or_load_stat(
+                lambda: self.pt_sampled, stat_file_path=DPPath(pt_h5, "a")
+            )
+            self.pt_expt_model.compute_or_load_stat(
+                lambda: self.np_sampled, stat_file_path=DPPath(pe_h5, "a")
+            )
+
+            # Save the computed serializations as reference
+            dp_ser_computed = self.dp_model.serialize()
+            pt_ser_computed = self.pt_model.serialize()
+            pe_ser_computed = self.pt_expt_model.serialize()
+
+            # 2. Build fresh models from the same initial weights
+            dp_model2 = get_model_dp(self._model_data)
+            pt_model2 = PolarModelPT.deserialize(dp_model2.serialize())
+            pe_model2 = PolarModelPTExpt.deserialize(dp_model2.serialize())
+
+            # 3. Load stats from file (should NOT call the sampled func)
+            def raise_error():
+                raise RuntimeError("Should load from file, not recompute")
+
+            dp_model2.compute_or_load_stat(
+                raise_error, stat_file_path=DPPath(dp_h5, "a")
+            )
+            pt_model2.compute_or_load_stat(
+                raise_error, stat_file_path=DPPath(pt_h5, "a")
+            )
+            pe_model2.compute_or_load_stat(
+                raise_error, stat_file_path=DPPath(pe_h5, "a")
+            )
+
+            # 4. Loaded models should match the computed ones
+            dp_ser_loaded = dp_model2.serialize()
+            pt_ser_loaded = pt_model2.serialize()
+            pe_ser_loaded = pe_model2.serialize()
+            _compare_variables_recursive(dp_ser_computed, dp_ser_loaded)
+            _compare_variables_recursive(pt_ser_computed, pt_ser_loaded)
+            _compare_variables_recursive(pe_ser_computed, pe_ser_loaded)
+
+            # 5. Cross-backend consistency after loading
+            _compare_variables_recursive(dp_ser_loaded, pt_ser_loaded)
+            _compare_variables_recursive(dp_ser_loaded, pe_ser_loaded)

From c35ee542dc50ca47c1414df6efd694531c785ee1 Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Tue, 24 Feb 2026 23:55:08 +0800
Subject: [PATCH 30/63] add property model api tests, fix bugs

---
 .../atomic_model/property_atomic_model.py     |    8 +
 .../model/atomic_model/base_atomic_model.py   |    2 +
 .../tests/consistent/model/test_property.py   | 1262 ++++++++++++++++-
 3 files changed, 1270 insertions(+), 2 deletions(-)

diff --git a/deepmd/dpmodel/atomic_model/property_atomic_model.py b/deepmd/dpmodel/atomic_model/property_atomic_model.py
index ec65f949e0..07dd00b109 100644
--- a/deepmd/dpmodel/atomic_model/property_atomic_model.py
+++ b/deepmd/dpmodel/atomic_model/property_atomic_model.py
@@ -25,6 +25,14 @@ def __init__(
             )
         super().__init__(descriptor, fitting, type_map, **kwargs)
 
+    def get_compute_stats_distinguish_types(self) -> bool:
+        """Get whether the fitting net computes stats which are not distinguished between different types of atoms."""
+        return False
+
+    def get_intensive(self) -> bool:
+        """Whether the fitting property is intensive."""
+        return self.fitting_net.intensive
+
     def apply_out_stat(
         self,
         ret: dict[str, Array],
diff --git a/deepmd/pt/model/atomic_model/base_atomic_model.py b/deepmd/pt/model/atomic_model/base_atomic_model.py
index ee68718230..920b83d12b 100644
--- a/deepmd/pt/model/atomic_model/base_atomic_model.py
+++ b/deepmd/pt/model/atomic_model/base_atomic_model.py
@@ -482,6 +482,8 @@ def change_out_bias(
                 model_forward=self._get_forward_wrapper_func(),
                 rcond=self.rcond,
                 preset_bias=self.preset_out_bias,
+                stats_distinguish_types=self.get_compute_stats_distinguish_types(),
+                intensive=self.get_intensive(),
             )
             self._store_out_stat(delta_bias, out_std, add=True)
         elif bias_adjust_mode == "set-by-statistic":
diff --git a/source/tests/consistent/model/test_property.py b/source/tests/consistent/model/test_property.py
index 2c4bf31114..d3829fbad7 100644
--- a/source/tests/consistent/model/test_property.py
+++ b/source/tests/consistent/model/test_property.py
@@ -6,8 +6,18 @@
 
 import numpy as np
 
+from deepmd.dpmodel.common import (
+    to_numpy_array,
+)
 from deepmd.dpmodel.model.model import get_model as get_model_dp
 from deepmd.dpmodel.model.property_model import PropertyModel as PropertyModelDP
+from deepmd.dpmodel.utils.nlist import (
+    build_neighbor_list,
+    extend_coord_with_ghosts,
+)
+from deepmd.dpmodel.utils.region import (
+    normalize_coord,
+)
 from deepmd.env import (
     GLOBAL_NP_FLOAT_PRECISION,
 )
@@ -17,6 +27,7 @@
     INSTALLED_PT,
     INSTALLED_PT_EXPT,
     CommonTest,
+    parameterized,
 )
 from .common import (
     ModelTest,
@@ -25,6 +36,8 @@
 if INSTALLED_PT:
     from deepmd.pt.model.model import get_model as get_model_pt
     from deepmd.pt.model.model.property_model import PropertyModel as PropertyModelPT
+    from deepmd.pt.utils.utils import to_numpy_array as torch_to_numpy
+    from deepmd.pt.utils.utils import to_torch_tensor as numpy_to_torch
 else:
     PropertyModelPT = None
 if INSTALLED_JAX:
@@ -33,6 +46,7 @@
 else:
     PropertyModelJAX = None
 if INSTALLED_PT_EXPT:
+    from deepmd.pt_expt.common import to_torch_array as pt_expt_numpy_to_torch
     from deepmd.pt_expt.model import PropertyModel as PropertyModelPTExpt
 else:
     PropertyModelPTExpt = None
@@ -219,7 +233,12 @@ def extract_ret(self, ret: Any, backend) -> tuple[np.ndarray, ...]:
 
 @unittest.skipUnless(INSTALLED_PT and INSTALLED_PT_EXPT, "PyTorch is not installed")
 class TestPropertyModelAPIs(unittest.TestCase):
-    """Test translated_output_def consistency across dp, pt, and pt_expt backends."""
+    """Test consistency of model-level APIs between pt and dpmodel backends.
+
+    Both models are constructed from the same serialized weights
+    (dpmodel -> serialize -> pt deserialize) so that numerical outputs
+    can be compared directly.
+    """
 
     def setUp(self) -> None:
         data = model_args().normalize_value(
@@ -242,18 +261,80 @@ def setUp(self) -> None:
                     "neuron": [4, 4, 4],
                     "property_name": "foo",
                     "resnet_dt": True,
-                    "numb_fparam": 0,
                     "precision": "float64",
                     "seed": 1,
+                    "numb_fparam": 2,
+                    "numb_aparam": 3,
+                    "default_fparam": [0.5, -0.3],
                 },
             },
             trim_pattern="_*",
         )
+        # Build dpmodel first, then deserialize into pt/pt_expt to share weights
         self.dp_model = get_model_dp(data)
         serialized = self.dp_model.serialize()
         self.pt_model = PropertyModelPT.deserialize(serialized)
         self.pt_expt_model = PropertyModelPTExpt.deserialize(serialized)
 
+        # Coords / atype / box
+        self.coords = np.array(
+            [
+                12.83,
+                2.56,
+                2.18,
+                12.09,
+                2.87,
+                2.74,
+                00.25,
+                3.32,
+                1.68,
+                3.36,
+                3.00,
+                1.81,
+                3.51,
+                2.51,
+                2.60,
+                4.27,
+                3.22,
+                1.56,
+            ],
+            dtype=GLOBAL_NP_FLOAT_PRECISION,
+        ).reshape(1, -1, 3)
+        self.atype = np.array([0, 1, 1, 0, 1, 1], dtype=np.int32).reshape(1, -1)
+        self.box = np.array(
+            [13.0, 0.0, 0.0, 0.0, 13.0, 0.0, 0.0, 0.0, 13.0],
+            dtype=GLOBAL_NP_FLOAT_PRECISION,
+        ).reshape(1, 9)
+
+        # Build extended coords + nlist for lower-level calls
+        rcut = 6.0
+        nframes, nloc = self.atype.shape[:2]
+        coord_normalized = normalize_coord(
+            self.coords.reshape(nframes, nloc, 3),
+            self.box.reshape(nframes, 3, 3),
+        )
+        extended_coord, extended_atype, mapping = extend_coord_with_ghosts(
+            coord_normalized, self.atype, self.box, rcut
+        )
+        nlist = build_neighbor_list(
+            extended_coord,
+            extended_atype,
+            nloc,
+            rcut,
+            [20, 20],
+            distinguish_types=True,
+        )
+        self.extended_coord = extended_coord.reshape(nframes, -1, 3)
+        self.extended_atype = extended_atype
+        self.mapping = mapping
+        self.nlist = nlist
+
+        # aparam for forward evaluation (1 frame, 6 atoms, 3 aparam)
+        rng = np.random.default_rng(42)
+        self.eval_aparam = rng.normal(size=(1, nloc, 3)).astype(
+            GLOBAL_NP_FLOAT_PRECISION
+        )
+
     def test_translated_output_def(self) -> None:
         """translated_output_def should return the same keys on dp, pt, and pt_expt."""
         dp_def = self.dp_model.translated_output_def()
@@ -264,3 +345,1180 @@ def test_translated_output_def(self) -> None:
         for key in dp_def:
             self.assertEqual(dp_def[key].shape, pt_def[key].shape)
             self.assertEqual(dp_def[key].shape, pt_expt_def[key].shape)
+
+    def test_get_descriptor(self) -> None:
+        """get_descriptor should return a non-None object on both backends."""
+        self.assertIsNotNone(self.dp_model.get_descriptor())
+        self.assertIsNotNone(self.pt_model.get_descriptor())
+
+    def test_get_fitting_net(self) -> None:
+        """get_fitting_net should return a non-None object on both backends."""
+        self.assertIsNotNone(self.dp_model.get_fitting_net())
+        self.assertIsNotNone(self.pt_model.get_fitting_net())
+
+    def test_get_out_bias(self) -> None:
+        """get_out_bias should return numerically equal values on dp and pt.
+
+        PropertyModel's apply_out_stat applies output * std + bias,
+        so the bias storage should be consistent across backends.
+        """
+        dp_bias = to_numpy_array(self.dp_model.get_out_bias())
+        pt_bias = torch_to_numpy(self.pt_model.get_out_bias())
+        np.testing.assert_allclose(dp_bias, pt_bias, rtol=1e-10, atol=1e-10)
+        # Verify shape: (n_output_keys x ntypes x task_dim) for property
+        self.assertEqual(dp_bias.shape[1], 2)  # ntypes
+        self.assertGreater(dp_bias.shape[0], 0)  # at least one output key
+
+    def test_set_out_bias(self) -> None:
+        """set_out_bias should update the bias on both backends."""
+        dp_bias = to_numpy_array(self.dp_model.get_out_bias())
+        new_bias = dp_bias + 1.0
+        # dp
+        self.dp_model.set_out_bias(new_bias)
+        np.testing.assert_allclose(
+            to_numpy_array(self.dp_model.get_out_bias()),
+            new_bias,
+            rtol=1e-10,
+            atol=1e-10,
+        )
+        # pt
+        self.pt_model.set_out_bias(numpy_to_torch(new_bias))
+        np.testing.assert_allclose(
+            torch_to_numpy(self.pt_model.get_out_bias()),
+            new_bias,
+            rtol=1e-10,
+            atol=1e-10,
+        )
+
+    def test_model_output_def(self) -> None:
+        """model_output_def should return the same keys and shapes on dp and pt."""
+        dp_def = self.dp_model.model_output_def().get_data()
+        pt_def = self.pt_model.model_output_def().get_data()
+        self.assertEqual(set(dp_def.keys()), set(pt_def.keys()))
+        for key in dp_def:
+            self.assertEqual(dp_def[key].shape, pt_def[key].shape)
+
+    def test_model_output_type(self) -> None:
+        """model_output_type should return the same list on dp and pt."""
+        self.assertEqual(
+            self.dp_model.model_output_type(),
+            self.pt_model.model_output_type(),
+        )
+
+    def test_do_grad_r(self) -> None:
+        """do_grad_r should return the same value on dp and pt."""
+        self.assertEqual(
+            self.dp_model.do_grad_r("foo"),
+            self.pt_model.do_grad_r("foo"),
+        )
+        self.assertFalse(self.dp_model.do_grad_r("foo"))
+
+    def test_do_grad_c(self) -> None:
+        """do_grad_c should return the same value on dp and pt."""
+        self.assertEqual(
+            self.dp_model.do_grad_c("foo"),
+            self.pt_model.do_grad_c("foo"),
+        )
+        self.assertFalse(self.dp_model.do_grad_c("foo"))
+
+    def test_get_rcut(self) -> None:
+        """get_rcut should return the same value on dp and pt."""
+        self.assertEqual(self.dp_model.get_rcut(), self.pt_model.get_rcut())
+        self.assertAlmostEqual(self.dp_model.get_rcut(), 6.0)
+
+    def test_get_type_map(self) -> None:
+        """get_type_map should return the same list on dp and pt."""
+        self.assertEqual(self.dp_model.get_type_map(), self.pt_model.get_type_map())
+        self.assertEqual(self.dp_model.get_type_map(), ["O", "H"])
+
+    def test_get_sel(self) -> None:
+        """get_sel should return the same list on dp and pt."""
+        self.assertEqual(self.dp_model.get_sel(), self.pt_model.get_sel())
+        self.assertEqual(self.dp_model.get_sel(), [20, 20])
+
+    def test_get_nsel(self) -> None:
+        """get_nsel should return the same value on dp and pt."""
+        self.assertEqual(self.dp_model.get_nsel(), self.pt_model.get_nsel())
+        self.assertEqual(self.dp_model.get_nsel(), 40)
+
+    def test_get_nnei(self) -> None:
+        """get_nnei should return the same value on dp and pt."""
+        self.assertEqual(self.dp_model.get_nnei(), self.pt_model.get_nnei())
+        self.assertEqual(self.dp_model.get_nnei(), 40)
+
+    def test_mixed_types(self) -> None:
+        """mixed_types should return the same value on dp and pt."""
+        self.assertEqual(self.dp_model.mixed_types(), self.pt_model.mixed_types())
+        # se_e2_a is not mixed-types
+        self.assertFalse(self.dp_model.mixed_types())
+
+    def test_has_message_passing(self) -> None:
+        """has_message_passing should return the same value on dp and pt."""
+        self.assertEqual(
+            self.dp_model.has_message_passing(),
+            self.pt_model.has_message_passing(),
+        )
+        self.assertFalse(self.dp_model.has_message_passing())
+
+    def test_need_sorted_nlist_for_lower(self) -> None:
+        """need_sorted_nlist_for_lower should return the same value on dp and pt."""
+        self.assertEqual(
+            self.dp_model.need_sorted_nlist_for_lower(),
+            self.pt_model.need_sorted_nlist_for_lower(),
+        )
+        self.assertFalse(self.dp_model.need_sorted_nlist_for_lower())
+
+    def test_get_dim_fparam(self) -> None:
+        """get_dim_fparam should return the same value on dp and pt."""
+        self.assertEqual(self.dp_model.get_dim_fparam(), self.pt_model.get_dim_fparam())
+        self.assertEqual(self.dp_model.get_dim_fparam(), 2)
+
+    def test_get_dim_aparam(self) -> None:
+        """get_dim_aparam should return the same value on dp and pt."""
+        self.assertEqual(self.dp_model.get_dim_aparam(), self.pt_model.get_dim_aparam())
+        self.assertEqual(self.dp_model.get_dim_aparam(), 3)
+
+    def test_get_sel_type(self) -> None:
+        """get_sel_type should return the same list on dp and pt."""
+        self.assertEqual(self.dp_model.get_sel_type(), self.pt_model.get_sel_type())
+        self.assertEqual(self.dp_model.get_sel_type(), [0, 1])
+
+    def test_is_aparam_nall(self) -> None:
+        """is_aparam_nall should return the same value on dp and pt."""
+        self.assertEqual(self.dp_model.is_aparam_nall(), self.pt_model.is_aparam_nall())
+        self.assertFalse(self.dp_model.is_aparam_nall())
+
+    def test_atomic_output_def(self) -> None:
+        """atomic_output_def should return the same keys and shapes on dp and pt."""
+        dp_def = self.dp_model.atomic_output_def()
+        pt_def = self.pt_model.atomic_output_def()
+        self.assertEqual(set(dp_def.keys()), set(pt_def.keys()))
+        for key in dp_def.keys():
+            self.assertEqual(dp_def[key].shape, pt_def[key].shape)
+
+    def test_format_nlist(self) -> None:
+        """format_nlist should produce the same result on dp and pt."""
+        dp_nlist = self.dp_model.format_nlist(
+            self.extended_coord,
+            self.extended_atype,
+            self.nlist,
+        )
+        pt_nlist = torch_to_numpy(
+            self.pt_model.format_nlist(
+                numpy_to_torch(self.extended_coord),
+                numpy_to_torch(self.extended_atype),
+                numpy_to_torch(self.nlist),
+            )
+        )
+        np.testing.assert_equal(dp_nlist, pt_nlist)
+
+    def test_forward_common_atomic(self) -> None:
+        """forward_common_atomic should produce consistent results on dp and pt.
+
+        Compares at the atomic_model level, where both backends define this method.
+        """
+        dp_ret = self.dp_model.atomic_model.forward_common_atomic(
+            self.extended_coord,
+            self.extended_atype,
+            self.nlist,
+            mapping=self.mapping,
+            aparam=self.eval_aparam,
+        )
+        pt_ret = self.pt_model.atomic_model.forward_common_atomic(
+            numpy_to_torch(self.extended_coord),
+            numpy_to_torch(self.extended_atype),
+            numpy_to_torch(self.nlist),
+            mapping=numpy_to_torch(self.mapping),
+            aparam=numpy_to_torch(self.eval_aparam),
+        )
+        # Compare the common keys
+        common_keys = set(dp_ret.keys()) & set(pt_ret.keys())
+        self.assertTrue(len(common_keys) > 0)
+        for key in common_keys:
+            if dp_ret[key] is not None and pt_ret[key] is not None:
+                np.testing.assert_allclose(
+                    dp_ret[key],
+                    torch_to_numpy(pt_ret[key]),
+                    rtol=1e-10,
+                    atol=1e-10,
+                    err_msg=f"Mismatch in forward_common_atomic key '{key}'",
+                )
+
+    def test_has_default_fparam(self) -> None:
+        """has_default_fparam should return the same value on dp and pt."""
+        self.assertEqual(
+            self.dp_model.has_default_fparam(),
+            self.pt_model.has_default_fparam(),
+        )
+        self.assertTrue(self.dp_model.has_default_fparam())
+
+    def test_get_default_fparam(self) -> None:
+        """get_default_fparam should return consistent values on dp and pt."""
+        dp_val = self.dp_model.get_default_fparam()
+        pt_val = self.pt_model.get_default_fparam()
+        np.testing.assert_allclose(dp_val, pt_val, rtol=1e-10, atol=1e-10)
+        np.testing.assert_allclose(dp_val, [0.5, -0.3], rtol=1e-10, atol=1e-10)
+
+    def _get_fitting_stats(self, model, backend="dp"):
+        """Extract fparam/aparam stats from a model's fitting net."""
+        fitting = model.get_fitting_net()
+        if backend == "pt":
+            return {
+                "fparam_avg": torch_to_numpy(fitting.fparam_avg),
+                "fparam_inv_std": torch_to_numpy(fitting.fparam_inv_std),
+                "aparam_avg": torch_to_numpy(fitting.aparam_avg),
+                "aparam_inv_std": torch_to_numpy(fitting.aparam_inv_std),
+            }
+        else:
+            return {
+                "fparam_avg": to_numpy_array(fitting.fparam_avg),
+                "fparam_inv_std": to_numpy_array(fitting.fparam_inv_std),
+                "aparam_avg": to_numpy_array(fitting.aparam_avg),
+                "aparam_inv_std": to_numpy_array(fitting.aparam_inv_std),
+            }
+
+    def test_change_out_bias(self) -> None:
+        """change_out_bias should produce consistent bias and fitting stats on dp, pt, and pt_expt.
+
+        PropertyModel's apply_out_stat applies output * std + bias,
+        so set-by-statistic should change the bias from initial values.
+        """
+        nframes = 2
+        nloc = 6
+        numb_fparam = 2
+        numb_aparam = 3
+        rng = np.random.default_rng(123)
+
+        # Use realistic coords (from setUp, tiled for 2 frames)
+        coords_2f = np.tile(self.coords, (nframes, 1, 1))  # (2, 6, 3)
+        atype_2f = np.array([[0, 0, 1, 1, 1, 1], [0, 1, 1, 0, 1, 1]], dtype=np.int32)
+        box_2f = np.tile(self.box.reshape(1, 3, 3), (nframes, 1, 1))
+        natoms_data = np.array([[6, 6, 2, 4], [6, 6, 2, 4]], dtype=np.int32)
+        foo_data = rng.normal(size=(nframes, 1)).astype(GLOBAL_NP_FLOAT_PRECISION)
+        fparam_data = rng.normal(size=(nframes, numb_fparam)).astype(
+            GLOBAL_NP_FLOAT_PRECISION
+        )
+        aparam_data = rng.normal(size=(nframes, nloc, numb_aparam)).astype(
+            GLOBAL_NP_FLOAT_PRECISION
+        )
+
+        # dpmodel stat data (numpy)
+        dp_merged = [
+            {
+                "coord": coords_2f,
+                "atype": atype_2f,
+                "atype_ext": atype_2f,
+                "box": box_2f,
+                "natoms": natoms_data,
+                "foo": foo_data,
+                "find_foo": np.float32(1.0),
+                "fparam": fparam_data,
+                "aparam": aparam_data,
+            }
+        ]
+        # pt stat data (torch tensors)
+        pt_merged = [
+            {
+                "coord": numpy_to_torch(coords_2f),
+                "atype": numpy_to_torch(atype_2f),
+                "atype_ext": numpy_to_torch(atype_2f),
+                "box": numpy_to_torch(box_2f),
+                "natoms": numpy_to_torch(natoms_data),
+                "foo": numpy_to_torch(foo_data),
+                "find_foo": np.float32(1.0),
+                "fparam": numpy_to_torch(fparam_data),
+                "aparam": numpy_to_torch(aparam_data),
+            }
+        ]
+        # pt_expt stat data (numpy, same as dp)
+        pe_merged = dp_merged
+
+        # Save initial fitting stats (all zeros / ones)
+        dp_stats_init = self._get_fitting_stats(self.dp_model, "dp")
+
+        # Save initial (zero) bias
+        dp_bias_init = to_numpy_array(self.dp_model.get_out_bias()).copy()
+
+        # --- Test "set-by-statistic" mode ---
+        self.dp_model.change_out_bias(dp_merged, bias_adjust_mode="set-by-statistic")
+        self.pt_model.change_out_bias(pt_merged, bias_adjust_mode="set-by-statistic")
+        self.pt_expt_model.change_out_bias(
+            pe_merged, bias_adjust_mode="set-by-statistic"
+        )
+
+        # Verify out bias consistency
+        dp_bias = to_numpy_array(self.dp_model.get_out_bias())
+        pt_bias = torch_to_numpy(self.pt_model.get_out_bias())
+        pe_bias = to_numpy_array(self.pt_expt_model.get_out_bias())
+        np.testing.assert_allclose(dp_bias, pt_bias, rtol=1e-10, atol=1e-10)
+        np.testing.assert_allclose(dp_bias, pe_bias, rtol=1e-10, atol=1e-10)
+
+        # Verify fitting input stats were updated (set-by-statistic triggers compute_fitting_input_stat)
+        dp_stats_set = self._get_fitting_stats(self.dp_model, "dp")
+        pt_stats_set = self._get_fitting_stats(self.pt_model, "pt")
+        pe_stats_set = self._get_fitting_stats(self.pt_expt_model, "dp")
+        for stat_key in (
+            "fparam_avg",
+            "fparam_inv_std",
+            "aparam_avg",
+            "aparam_inv_std",
+        ):
+            np.testing.assert_allclose(
+                dp_stats_set[stat_key],
+                pt_stats_set[stat_key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"dp vs pt {stat_key} mismatch after set-by-statistic",
+            )
+            np.testing.assert_allclose(
+                dp_stats_set[stat_key],
+                pe_stats_set[stat_key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"dp vs pt_expt {stat_key} mismatch after set-by-statistic",
+            )
+        # Verify fparam/aparam stats actually changed from initial values
+        self.assertFalse(
+            np.allclose(dp_stats_set["fparam_avg"], dp_stats_init["fparam_avg"]),
+            "set-by-statistic did not update fparam_avg",
+        )
+        self.assertFalse(
+            np.allclose(dp_stats_set["aparam_avg"], dp_stats_init["aparam_avg"]),
+            "set-by-statistic did not update aparam_avg",
+        )
+
+        # --- Test "change-by-statistic" mode ---
+        dp_bias_before = dp_bias.copy()
+        self.dp_model.change_out_bias(dp_merged, bias_adjust_mode="change-by-statistic")
+        self.pt_model.change_out_bias(pt_merged, bias_adjust_mode="change-by-statistic")
+        self.pt_expt_model.change_out_bias(
+            pe_merged, bias_adjust_mode="change-by-statistic"
+        )
+
+        # Verify out bias consistency
+        dp_bias2 = to_numpy_array(self.dp_model.get_out_bias())
+        pt_bias2 = torch_to_numpy(self.pt_model.get_out_bias())
+        pe_bias2 = to_numpy_array(self.pt_expt_model.get_out_bias())
+        np.testing.assert_allclose(dp_bias2, pt_bias2, rtol=1e-10, atol=1e-10)
+        np.testing.assert_allclose(dp_bias2, pe_bias2, rtol=1e-10, atol=1e-10)
+
+        # Verify fitting input stats did NOT change (change-by-statistic should not recompute them)
+        dp_stats_chg = self._get_fitting_stats(self.dp_model, "dp")
+        pt_stats_chg = self._get_fitting_stats(self.pt_model, "pt")
+        pe_stats_chg = self._get_fitting_stats(self.pt_expt_model, "dp")
+        for stat_key in (
+            "fparam_avg",
+            "fparam_inv_std",
+            "aparam_avg",
+            "aparam_inv_std",
+        ):
+            np.testing.assert_allclose(
+                dp_stats_chg[stat_key],
+                dp_stats_set[stat_key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"dp {stat_key} changed after change-by-statistic (should not)",
+            )
+            np.testing.assert_allclose(
+                pt_stats_chg[stat_key],
+                pt_stats_set[stat_key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"pt {stat_key} changed after change-by-statistic (should not)",
+            )
+            np.testing.assert_allclose(
+                pe_stats_chg[stat_key],
+                pe_stats_set[stat_key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"pt_expt {stat_key} changed after change-by-statistic (should not)",
+            )
+
+    def test_change_type_map(self) -> None:
+        """change_type_map should produce consistent results on dp and pt.
+
+        Uses a DPA1 (se_atten) descriptor since se_e2_a does not support
+        change_type_map (non-mixed-types descriptors raise NotImplementedError).
+        """
+        from deepmd.utils.argcheck import model_args as model_args_fn
+
+        data = model_args_fn().normalize_value(
+            {
+                "type_map": ["O", "H"],
+                "descriptor": {
+                    "type": "se_atten",
+                    "sel": 20,
+                    "rcut_smth": 0.50,
+                    "rcut": 6.00,
+                    "neuron": [3, 6],
+                    "resnet_dt": False,
+                    "axis_neuron": 2,
+                    "precision": "float64",
+                    "seed": 1,
+                    "attn": 6,
+                    "attn_layer": 0,
+                },
+                "fitting_net": {
+                    "type": "property",
+                    "neuron": [4, 4, 4],
+                    "property_name": "foo",
+                    "resnet_dt": True,
+                    "precision": "float64",
+                    "seed": 1,
+                },
+            },
+            trim_pattern="_*",
+        )
+        dp_model = get_model_dp(data)
+        pt_model = PropertyModelPT.deserialize(dp_model.serialize())
+
+        # Set non-zero out_bias so the swap is non-trivial
+        dp_bias_orig = to_numpy_array(dp_model.get_out_bias()).copy()
+        new_bias = dp_bias_orig.copy()
+        new_bias[:, 0, :] = 1.5  # type 0 ("O")
+        new_bias[:, 1, :] = -3.7  # type 1 ("H")
+        dp_model.set_out_bias(new_bias)
+        pt_model.set_out_bias(numpy_to_torch(new_bias))
+
+        new_type_map = ["H", "O"]
+        dp_model.change_type_map(new_type_map)
+        pt_model.change_type_map(new_type_map)
+
+        # Both should have the new type_map
+        self.assertEqual(dp_model.get_type_map(), new_type_map)
+        self.assertEqual(pt_model.get_type_map(), new_type_map)
+
+        # Out_bias should be reordered consistently between backends
+        dp_bias_new = to_numpy_array(dp_model.get_out_bias())
+        pt_bias_new = torch_to_numpy(pt_model.get_out_bias())
+        np.testing.assert_allclose(dp_bias_new, pt_bias_new, rtol=1e-10, atol=1e-10)
+
+        # Verify the reorder is correct: old type 0 -> new type 1, old type 1 -> new type 0
+        np.testing.assert_allclose(
+            dp_bias_new[:, 0, :],
+            new_bias[:, 1, :],
+            rtol=1e-10,
+            atol=1e-10,
+        )
+        np.testing.assert_allclose(
+            dp_bias_new[:, 1, :],
+            new_bias[:, 0, :],
+            rtol=1e-10,
+            atol=1e-10,
+        )
+
+    def test_change_type_map_extend_stat(self) -> None:
+        """change_type_map with model_with_new_type_stat should propagate stats consistently across dp, pt, and pt_expt.
+
+        Verifies that the model-level change_type_map correctly unwraps
+        model_with_new_type_stat.atomic_model before forwarding to the
+        atomic model.
+        """
+        from deepmd.utils.argcheck import model_args as model_args_fn
+
+        small_tm = ["O", "H"]
+        large_tm = ["O", "H", "Li"]
+
+        small_data = model_args_fn().normalize_value(
+            {
+                "type_map": small_tm,
+                "descriptor": {
+                    "type": "se_atten",
+                    "sel": 20,
+                    "rcut_smth": 0.50,
+                    "rcut": 6.00,
+                    "neuron": [3, 6],
+                    "resnet_dt": False,
+                    "axis_neuron": 2,
+                    "precision": "float64",
+                    "seed": 1,
+                    "attn": 6,
+                    "attn_layer": 0,
+                },
+                "fitting_net": {
+                    "type": "property",
+                    "neuron": [4, 4, 4],
+                    "property_name": "foo",
+                    "resnet_dt": True,
+                    "precision": "float64",
+                    "seed": 1,
+                },
+            },
+            trim_pattern="_*",
+        )
+        large_data = model_args_fn().normalize_value(
+            {
+                "type_map": large_tm,
+                "descriptor": {
+                    "type": "se_atten",
+                    "sel": 20,
+                    "rcut_smth": 0.50,
+                    "rcut": 6.00,
+                    "neuron": [3, 6],
+                    "resnet_dt": False,
+                    "axis_neuron": 2,
+                    "precision": "float64",
+                    "seed": 2,
+                    "attn": 6,
+                    "attn_layer": 0,
+                },
+                "fitting_net": {
+                    "type": "property",
+                    "neuron": [4, 4, 4],
+                    "property_name": "foo",
+                    "resnet_dt": True,
+                    "precision": "float64",
+                    "seed": 2,
+                },
+            },
+            trim_pattern="_*",
+        )
+
+        dp_small = get_model_dp(small_data)
+        dp_large = get_model_dp(large_data)
+
+        # Set distinguishable random stats on the large model's descriptor
+        rng = np.random.default_rng(42)
+        desc_large = dp_large.get_descriptor()
+        mean_large, std_large = desc_large.get_stat_mean_and_stddev()
+        mean_rand = rng.random(size=to_numpy_array(mean_large).shape)
+        std_rand = rng.random(size=to_numpy_array(std_large).shape)
+        desc_large.set_stat_mean_and_stddev(mean_rand, std_rand)
+
+        # Build pt and pt_expt models from dp serialization
+        pt_small = PropertyModelPT.deserialize(dp_small.serialize())
+        pt_large = PropertyModelPT.deserialize(dp_large.serialize())
+        pt_expt_small = PropertyModelPTExpt.deserialize(dp_small.serialize())
+        pt_expt_large = PropertyModelPTExpt.deserialize(dp_large.serialize())
+
+        # Extend type map with model_with_new_type_stat at the model level
+        dp_small.change_type_map(large_tm, model_with_new_type_stat=dp_large)
+        pt_small.change_type_map(large_tm, model_with_new_type_stat=pt_large)
+        pt_expt_small.change_type_map(large_tm, model_with_new_type_stat=pt_expt_large)
+
+        # Descriptor stats should be consistent across backends
+        dp_mean, dp_std = dp_small.get_descriptor().get_stat_mean_and_stddev()
+        pt_mean, pt_std = pt_small.get_descriptor().get_stat_mean_and_stddev()
+        pt_expt_mean, pt_expt_std = (
+            pt_expt_small.get_descriptor().get_stat_mean_and_stddev()
+        )
+        np.testing.assert_allclose(
+            to_numpy_array(dp_mean),
+            torch_to_numpy(pt_mean),
+            rtol=1e-10,
+            atol=1e-10,
+        )
+        np.testing.assert_allclose(
+            to_numpy_array(dp_std),
+            torch_to_numpy(pt_std),
+            rtol=1e-10,
+            atol=1e-10,
+        )
+        np.testing.assert_allclose(
+            to_numpy_array(dp_mean),
+            to_numpy_array(pt_expt_mean),
+            rtol=1e-10,
+            atol=1e-10,
+        )
+        np.testing.assert_allclose(
+            to_numpy_array(dp_std),
+            to_numpy_array(pt_expt_std),
+            rtol=1e-10,
+            atol=1e-10,
+        )
+
+    def test_update_sel(self) -> None:
+        """update_sel should return the same result on dp and pt."""
+        from unittest.mock import (
+            patch,
+        )
+
+        from deepmd.dpmodel.model.dp_model import DPModelCommon as DPModelCommonDP
+        from deepmd.pt.model.model.dp_model import DPModelCommon as DPModelCommonPT
+
+        mock_min_nbor_dist = 0.5
+        mock_sel = [10, 20]
+        local_jdata = {
+            "type_map": ["O", "H"],
+            "descriptor": {
+                "type": "se_e2_a",
+                "sel": "auto",
+                "rcut_smth": 0.50,
+                "rcut": 6.00,
+            },
+            "fitting_net": {
+                "type": "property",
+                "neuron": [4, 4, 4],
+                "property_name": "foo",
+            },
+        }
+        type_map = ["O", "H"]
+
+        with patch(
+            "deepmd.dpmodel.utils.update_sel.UpdateSel.get_nbor_stat",
+            return_value=(mock_min_nbor_dist, mock_sel),
+        ):
+            dp_result, dp_min_dist = DPModelCommonDP.update_sel(
+                None, type_map, local_jdata
+            )
+
+        with patch(
+            "deepmd.pt.utils.update_sel.UpdateSel.get_nbor_stat",
+            return_value=(mock_min_nbor_dist, mock_sel),
+        ):
+            pt_result, pt_min_dist = DPModelCommonPT.update_sel(
+                None, type_map, local_jdata
+            )
+
+        self.assertEqual(dp_result, pt_result)
+        self.assertEqual(dp_min_dist, pt_min_dist)
+        # Verify sel was actually updated (not still "auto")
+        self.assertIsInstance(dp_result["descriptor"]["sel"], list)
+        self.assertNotEqual(dp_result["descriptor"]["sel"], "auto")
+
+    def test_get_ntypes(self) -> None:
+        """get_ntypes should return the same value on dp and pt."""
+        self.assertEqual(self.dp_model.get_ntypes(), self.pt_model.get_ntypes())
+        self.assertEqual(self.dp_model.get_ntypes(), 2)
+
+    def test_compute_or_load_out_stat(self) -> None:
+        """compute_or_load_out_stat should produce consistent bias on dp and pt.
+
+        Tests both the compute path (from data) and the load path (from file).
+        PropertyModel's apply_out_stat applies output * std + bias,
+        so the stored bias should be consistent across backends.
+        """
+        import tempfile
+        from pathlib import (
+            Path,
+        )
+
+        import h5py
+
+        from deepmd.utils.path import (
+            DPPath,
+        )
+
+        nframes = 2
+        coords_2f = np.tile(self.coords, (nframes, 1, 1))
+        atype_2f = np.array([[0, 0, 1, 1, 1, 1], [0, 1, 1, 0, 1, 1]], dtype=np.int32)
+        box_2f = np.tile(self.box.reshape(1, 3, 3), (nframes, 1, 1))
+        natoms_data = np.array([[6, 6, 2, 4], [6, 6, 2, 4]], dtype=np.int32)
+        foo_data = (
+            np.random.default_rng(42)
+            .normal(size=(nframes, 1))
+            .astype(GLOBAL_NP_FLOAT_PRECISION)
+        )
+
+        dp_merged = [
+            {
+                "coord": coords_2f,
+                "atype": atype_2f,
+                "atype_ext": atype_2f,
+                "box": box_2f,
+                "natoms": natoms_data,
+                "foo": foo_data,
+                "find_foo": np.float32(1.0),
+            }
+        ]
+        pt_merged = [
+            {
+                "coord": numpy_to_torch(coords_2f),
+                "atype": numpy_to_torch(atype_2f),
+                "atype_ext": numpy_to_torch(atype_2f),
+                "box": numpy_to_torch(box_2f),
+                "natoms": numpy_to_torch(natoms_data),
+                "foo": numpy_to_torch(foo_data),
+                "find_foo": np.float32(1.0),
+            }
+        ]
+
+        # Verify bias is initially identical
+        dp_bias_before = to_numpy_array(self.dp_model.get_out_bias()).copy()
+        pt_bias_before = torch_to_numpy(self.pt_model.get_out_bias()).copy()
+        np.testing.assert_allclose(
+            dp_bias_before, pt_bias_before, rtol=1e-10, atol=1e-10
+        )
+
+        with tempfile.TemporaryDirectory() as tmpdir:
+            # Create separate h5 files for dp and pt
+            dp_h5 = str((Path(tmpdir) / "dp_stat.h5").resolve())
+            pt_h5 = str((Path(tmpdir) / "pt_stat.h5").resolve())
+            with h5py.File(dp_h5, "w"):
+                pass
+            with h5py.File(pt_h5, "w"):
+                pass
+            dp_stat_path = DPPath(dp_h5, "a")
+            pt_stat_path = DPPath(pt_h5, "a")
+
+            # 1. Compute stats and save to file
+            self.dp_model.atomic_model.compute_or_load_out_stat(
+                dp_merged, stat_file_path=dp_stat_path
+            )
+            self.pt_model.atomic_model.compute_or_load_out_stat(
+                pt_merged, stat_file_path=pt_stat_path
+            )
+
+            dp_bias_after = to_numpy_array(self.dp_model.get_out_bias())
+            pt_bias_after = torch_to_numpy(self.pt_model.get_out_bias())
+            np.testing.assert_allclose(
+                dp_bias_after, pt_bias_after, rtol=1e-10, atol=1e-10
+            )
+
+            # 2. Verify both backends saved the same file content
+            with h5py.File(dp_h5, "r") as dp_f, h5py.File(pt_h5, "r") as pt_f:
+                dp_keys = sorted(dp_f.keys())
+                pt_keys = sorted(pt_f.keys())
+                self.assertEqual(dp_keys, pt_keys)
+                for key in dp_keys:
+                    np.testing.assert_allclose(
+                        np.array(dp_f[key]),
+                        np.array(pt_f[key]),
+                        rtol=1e-10,
+                        atol=1e-10,
+                        err_msg=f"Stat file content mismatch for key {key}",
+                    )
+
+            # 3. Reset biases to zero, then load from file
+            zero_bias = np.zeros_like(dp_bias_after)
+            self.dp_model.set_out_bias(zero_bias)
+            self.pt_model.set_out_bias(numpy_to_torch(zero_bias))
+
+            # Use a callable that raises to ensure it loads from file, not recomputes
+            def raise_error():
+                raise RuntimeError("Should not recompute — should load from file")
+
+            self.dp_model.atomic_model.compute_or_load_out_stat(
+                raise_error, stat_file_path=dp_stat_path
+            )
+            self.pt_model.atomic_model.compute_or_load_out_stat(
+                raise_error, stat_file_path=pt_stat_path
+            )
+
+            dp_bias_loaded = to_numpy_array(self.dp_model.get_out_bias())
+            pt_bias_loaded = torch_to_numpy(self.pt_model.get_out_bias())
+
+            # Loaded biases should match between backends
+            np.testing.assert_allclose(
+                dp_bias_loaded, pt_bias_loaded, rtol=1e-10, atol=1e-10
+            )
+            # Loaded biases should match the originally computed biases
+            np.testing.assert_allclose(
+                dp_bias_loaded, dp_bias_after, rtol=1e-10, atol=1e-10
+            )
+
+    def test_get_observed_type_list(self) -> None:
+        """get_observed_type_list should be consistent across dp, pt, pt_expt.
+
+        Uses mock data containing only type 0 ("O") so that type 1 ("H") is
+        unobserved and should be absent from the returned list.
+        """
+        nframes = 2
+        natoms = 6
+        # All atoms are type 0 — type 1 is unobserved
+        atype_2f = np.zeros((nframes, natoms), dtype=np.int32)
+        coords_2f = np.tile(self.coords, (nframes, 1, 1))
+        box_2f = np.tile(self.box.reshape(1, 3, 3), (nframes, 1, 1))
+        natoms_data = np.array([[natoms, natoms, natoms, 0]] * nframes, dtype=np.int32)
+        foo_data = (
+            np.random.default_rng(42)
+            .normal(size=(nframes, 1))
+            .astype(GLOBAL_NP_FLOAT_PRECISION)
+        )
+
+        dp_merged = [
+            {
+                "coord": coords_2f,
+                "atype": atype_2f,
+                "atype_ext": atype_2f,
+                "box": box_2f,
+                "natoms": natoms_data,
+                "foo": foo_data,
+                "find_foo": np.float32(1.0),
+            }
+        ]
+        pt_merged = [
+            {
+                "coord": numpy_to_torch(coords_2f),
+                "atype": numpy_to_torch(atype_2f),
+                "atype_ext": numpy_to_torch(atype_2f),
+                "box": numpy_to_torch(box_2f),
+                "natoms": numpy_to_torch(natoms_data),
+                "foo": numpy_to_torch(foo_data),
+                "find_foo": np.float32(1.0),
+            }
+        ]
+
+        self.dp_model.atomic_model.compute_or_load_out_stat(dp_merged)
+        self.pt_model.atomic_model.compute_or_load_out_stat(pt_merged)
+        self.pt_expt_model.atomic_model.compute_or_load_out_stat(dp_merged)
+
+        dp_observed = self.dp_model.get_observed_type_list()
+        pt_observed = self.pt_model.get_observed_type_list()
+        pe_observed = self.pt_expt_model.get_observed_type_list()
+
+        self.assertEqual(dp_observed, pt_observed)
+        self.assertEqual(dp_observed, pe_observed)
+        # Property model uses stats_distinguish_types=False, so all types
+        # get the same (non-zero) bias — both types appear observed.
+        self.assertEqual(dp_observed, ["O", "H"])
+
+
+def _compare_variables_recursive(
+    d1: dict, d2: dict, path: str = "", rtol: float = 1e-10, atol: float = 1e-10
+) -> None:
+    """Recursively compare ``@variables`` sections in two serialized dicts."""
+    for key in d1:
+        if key not in d2:
+            continue
+        child_path = f"{path}/{key}" if path else key
+        v1, v2 = d1[key], d2[key]
+        if key == "@variables" and isinstance(v1, dict) and isinstance(v2, dict):
+            for vk in v1:
+                if vk not in v2:
+                    continue
+                a1 = np.asarray(v1[vk]) if v1[vk] is not None else None
+                a2 = np.asarray(v2[vk]) if v2[vk] is not None else None
+                if a1 is None and a2 is None:
+                    continue
+                np.testing.assert_allclose(
+                    a1,
+                    a2,
+                    rtol=rtol,
+                    atol=atol,
+                    err_msg=f"@variables mismatch at {child_path}/{vk}",
+                )
+        elif isinstance(v1, dict) and isinstance(v2, dict):
+            _compare_variables_recursive(v1, v2, child_path, rtol, atol)
+
+
+@parameterized(
+    (([], []), ([[0, 1]], [1])),  # (pair_exclude_types, atom_exclude_types)
+    (False, True),  # fparam_in_data
+)
+@unittest.skipUnless(INSTALLED_PT and INSTALLED_PT_EXPT, "PT and PT_EXPT are required")
+class TestPropertyComputeOrLoadStat(unittest.TestCase):
+    """Test that compute_or_load_stat produces identical statistics on dp, pt, and pt_expt.
+
+    Covers descriptor stats (dstd), fitting stats (fparam, aparam), and output bias.
+    Parameterized over exclusion types and whether fparam is explicitly provided or
+    injected via default_fparam.
+    """
+
+    def setUp(self) -> None:
+        (pair_exclude_types, atom_exclude_types), self.fparam_in_data = self.param
+        data = model_args().normalize_value(
+            {
+                "type_map": ["O", "H"],
+                "pair_exclude_types": pair_exclude_types,
+                "atom_exclude_types": atom_exclude_types,
+                "descriptor": {
+                    "type": "dpa3",
+                    "repflow": {
+                        "n_dim": 20,
+                        "e_dim": 10,
+                        "a_dim": 8,
+                        "nlayers": 3,
+                        "e_rcut": 6.0,
+                        "e_rcut_smth": 5.0,
+                        "e_sel": 10,
+                        "a_rcut": 4.0,
+                        "a_rcut_smth": 3.5,
+                        "a_sel": 8,
+                        "axis_neuron": 4,
+                        "update_angle": True,
+                        "update_style": "res_residual",
+                        "update_residual": 0.1,
+                        "update_residual_init": "const",
+                    },
+                    "precision": "float64",
+                    "seed": 1,
+                },
+                "fitting_net": {
+                    "type": "property",
+                    "neuron": [10, 10],
+                    "property_name": "foo",
+                    "precision": "float64",
+                    "seed": 1,
+                    "numb_fparam": 2,
+                    "default_fparam": [0.5, -0.3],
+                    "numb_aparam": 3,
+                },
+            },
+            trim_pattern="_*",
+        )
+
+        # Save data for reuse in load-from-file test
+        self._model_data = data
+
+        # Build dp model, then deserialize into pt and pt_expt to share weights
+        self.dp_model = get_model_dp(data)
+        serialized = self.dp_model.serialize()
+        self.pt_model = PropertyModelPT.deserialize(serialized)
+        self.pt_expt_model = PropertyModelPTExpt.deserialize(serialized)
+
+        # Test coords / atype / box for forward evaluation
+        self.coords = np.array(
+            [
+                12.83,
+                2.56,
+                2.18,
+                12.09,
+                2.87,
+                2.74,
+                0.25,
+                3.32,
+                1.68,
+                3.36,
+                3.00,
+                1.81,
+                3.51,
+                2.51,
+                2.60,
+                4.27,
+                3.22,
+                1.56,
+            ],
+            dtype=GLOBAL_NP_FLOAT_PRECISION,
+        ).reshape(1, -1, 3)
+        self.atype = np.array([0, 1, 1, 0, 1, 1], dtype=np.int32).reshape(1, -1)
+        self.box = np.array(
+            [13.0, 0.0, 0.0, 0.0, 13.0, 0.0, 0.0, 0.0, 13.0],
+            dtype=GLOBAL_NP_FLOAT_PRECISION,
+        ).reshape(1, 9)
+
+        # Mock training data for compute_or_load_stat
+        natoms = 6
+        nframes = 3
+        rng = np.random.default_rng(42)
+        coords_stat = rng.normal(size=(nframes, natoms, 3)).astype(
+            GLOBAL_NP_FLOAT_PRECISION
+        )
+        atype_stat = np.array([[0, 0, 1, 1, 1, 1]] * nframes, dtype=np.int32)
+        box_stat = np.tile(
+            np.eye(3, dtype=GLOBAL_NP_FLOAT_PRECISION).reshape(1, 3, 3) * 13.0,
+            (nframes, 1, 1),
+        )
+        natoms_stat = np.array([[natoms, natoms, 2, 4]] * nframes, dtype=np.int32)
+        foo_stat = rng.normal(size=(nframes, 1)).astype(GLOBAL_NP_FLOAT_PRECISION)
+        aparam_stat = rng.normal(size=(nframes, natoms, 3)).astype(
+            GLOBAL_NP_FLOAT_PRECISION
+        )
+
+        # dp / pt_expt sample (numpy)
+        np_sample = {
+            "coord": coords_stat,
+            "atype": atype_stat,
+            "atype_ext": atype_stat,
+            "box": box_stat,
+            "natoms": natoms_stat,
+            "foo": foo_stat,
+            "find_foo": np.float32(1.0),
+            "aparam": aparam_stat,
+        }
+        # pt sample (torch tensors)
+        pt_sample = {
+            "coord": numpy_to_torch(coords_stat),
+            "atype": numpy_to_torch(atype_stat),
+            "atype_ext": numpy_to_torch(atype_stat),
+            "box": numpy_to_torch(box_stat),
+            "natoms": numpy_to_torch(natoms_stat),
+            "foo": numpy_to_torch(foo_stat),
+            "find_foo": np.float32(1.0),
+            "aparam": numpy_to_torch(aparam_stat),
+        }
+
+        if self.fparam_in_data:
+            fparam_stat = rng.normal(size=(nframes, 2)).astype(
+                GLOBAL_NP_FLOAT_PRECISION
+            )
+            np_sample["fparam"] = fparam_stat
+            pt_sample["fparam"] = numpy_to_torch(fparam_stat)
+            self.expected_fparam_avg = np.mean(fparam_stat, axis=0)
+        else:
+            # No fparam -> _make_wrapped_sampler injects default_fparam
+            self.expected_fparam_avg = np.array([0.5, -0.3])
+
+        self.np_sampled = [np_sample]
+        self.pt_sampled = [pt_sample]
+
+        # aparam for forward evaluation (1 frame, 6 atoms, 3 aparam)
+        self.eval_aparam = rng.normal(size=(1, natoms, 3)).astype(
+            GLOBAL_NP_FLOAT_PRECISION
+        )
+
+    def _eval_dp(self) -> dict:
+        return self.dp_model(
+            self.coords, self.atype, box=self.box, aparam=self.eval_aparam
+        )
+
+    def _eval_pt(self) -> dict:
+        return {
+            kk: torch_to_numpy(vv)
+            for kk, vv in self.pt_model(
+                numpy_to_torch(self.coords),
+                numpy_to_torch(self.atype),
+                box=numpy_to_torch(self.box),
+                aparam=numpy_to_torch(self.eval_aparam),
+                do_atomic_virial=True,
+            ).items()
+        }
+
+    def _eval_pt_expt(self) -> dict:
+        coord_t = pt_expt_numpy_to_torch(self.coords)
+        coord_t.requires_grad_(True)
+        return {
+            k: v.detach().cpu().numpy()
+            for k, v in self.pt_expt_model(
+                coord_t,
+                pt_expt_numpy_to_torch(self.atype),
+                box=pt_expt_numpy_to_torch(self.box),
+                aparam=pt_expt_numpy_to_torch(self.eval_aparam),
+                do_atomic_virial=True,
+            ).items()
+        }
+
+    def test_compute_stat(self) -> None:
+        # 1. Pre-stat forward consistency
+        dp_ret0 = self._eval_dp()
+        pt_ret0 = self._eval_pt()
+        pe_ret0 = self._eval_pt_expt()
+        for key in ("foo", "atom_foo"):
+            np.testing.assert_allclose(
+                dp_ret0[key],
+                pt_ret0[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"Pre-stat dp vs pt mismatch in {key}",
+            )
+            np.testing.assert_allclose(
+                dp_ret0[key],
+                pe_ret0[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"Pre-stat dp vs pt_expt mismatch in {key}",
+            )
+
+        # 2. Run compute_or_load_stat on all three backends
+        self.dp_model.compute_or_load_stat(lambda: self.np_sampled)
+        self.pt_model.compute_or_load_stat(lambda: self.pt_sampled)
+        self.pt_expt_model.compute_or_load_stat(lambda: self.np_sampled)
+
+        # 3. Serialize all three and compare @variables
+        dp_ser = self.dp_model.serialize()
+        pt_ser = self.pt_model.serialize()
+        pe_ser = self.pt_expt_model.serialize()
+        _compare_variables_recursive(dp_ser, pt_ser)
+        _compare_variables_recursive(dp_ser, pe_ser)
+
+        # 4. Post-stat forward consistency
+        # PropertyModel's apply_out_stat applies output * std + bias, so
+        # output values WILL differ from pre-stat after stat computation.
+        dp_ret1 = self._eval_dp()
+        pt_ret1 = self._eval_pt()
+        pe_ret1 = self._eval_pt_expt()
+        for key in ("foo", "atom_foo"):
+            np.testing.assert_allclose(
+                dp_ret1[key],
+                pt_ret1[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"Post-stat dp vs pt mismatch in {key}",
+            )
+            np.testing.assert_allclose(
+                dp_ret1[key],
+                pe_ret1[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"Post-stat dp vs pt_expt mismatch in {key}",
+            )
+
+        # 5. Non-triviality checks
+        fit_vars = dp_ser["fitting"]["@variables"]
+        # fparam stats were computed
+        fparam_avg = np.asarray(fit_vars["fparam_avg"])
+        self.assertFalse(
+            np.allclose(fparam_avg, 0.0),
+            "fparam_avg is still zero — fparam stats were not computed",
+        )
+        np.testing.assert_allclose(
+            fparam_avg,
+            self.expected_fparam_avg,
+            rtol=1e-10,
+            atol=1e-10,
+            err_msg="fparam_avg does not match expected values",
+        )
+        # aparam stats were computed
+        aparam_avg = np.asarray(fit_vars["aparam_avg"])
+        self.assertFalse(
+            np.allclose(aparam_avg, 0.0),
+            "aparam_avg is still zero — aparam stats were not computed",
+        )
+
+    def test_load_stat_from_file(self) -> None:
+        import tempfile
+        from pathlib import (
+            Path,
+        )
+
+        import h5py
+
+        from deepmd.utils.path import (
+            DPPath,
+        )
+
+        with tempfile.TemporaryDirectory() as tmpdir:
+            # Create separate stat files for each backend
+            dp_h5 = str((Path(tmpdir) / "dp_stat.h5").resolve())
+            pt_h5 = str((Path(tmpdir) / "pt_stat.h5").resolve())
+            pe_h5 = str((Path(tmpdir) / "pe_stat.h5").resolve())
+            for p in (dp_h5, pt_h5, pe_h5):
+                with h5py.File(p, "w"):
+                    pass
+
+            # 1. Compute stats and save to file
+            self.dp_model.compute_or_load_stat(
+                lambda: self.np_sampled, stat_file_path=DPPath(dp_h5, "a")
+            )
+            self.pt_model.compute_or_load_stat(
+                lambda: self.pt_sampled, stat_file_path=DPPath(pt_h5, "a")
+            )
+            self.pt_expt_model.compute_or_load_stat(
+                lambda: self.np_sampled, stat_file_path=DPPath(pe_h5, "a")
+            )
+
+            # Save the computed serializations as reference
+            dp_ser_computed = self.dp_model.serialize()
+            pt_ser_computed = self.pt_model.serialize()
+            pe_ser_computed = self.pt_expt_model.serialize()
+
+            # 2. Build fresh models from the same initial weights
+            dp_model2 = get_model_dp(self._model_data)
+            pt_model2 = PropertyModelPT.deserialize(dp_model2.serialize())
+            pe_model2 = PropertyModelPTExpt.deserialize(dp_model2.serialize())
+
+            # 3. Load stats from file (should NOT call the sampled func)
+            def raise_error():
+                raise RuntimeError("Should load from file, not recompute")
+
+            dp_model2.compute_or_load_stat(
+                raise_error, stat_file_path=DPPath(dp_h5, "a")
+            )
+            pt_model2.compute_or_load_stat(
+                raise_error, stat_file_path=DPPath(pt_h5, "a")
+            )
+            pe_model2.compute_or_load_stat(
+                raise_error, stat_file_path=DPPath(pe_h5, "a")
+            )
+
+            # 4. Loaded models should match the computed ones
+            dp_ser_loaded = dp_model2.serialize()
+            pt_ser_loaded = pt_model2.serialize()
+            pe_ser_loaded = pe_model2.serialize()
+            _compare_variables_recursive(dp_ser_computed, dp_ser_loaded)
+            _compare_variables_recursive(pt_ser_computed, pt_ser_loaded)
+            _compare_variables_recursive(pe_ser_computed, pe_ser_loaded)
+
+            # 5. Cross-backend consistency after loading
+            _compare_variables_recursive(dp_ser_loaded, pt_ser_loaded)
+            _compare_variables_recursive(dp_ser_loaded, pe_ser_loaded)

From 11c02012da4bbd5e360e85f33555d17b14f98700 Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Wed, 25 Feb 2026 00:25:27 +0800
Subject: [PATCH 31/63] add dos test, fix bug

---
 deepmd/dpmodel/fitting/dos_fitting.py     |   17 +
 source/tests/consistent/model/test_dos.py | 1262 ++++++++++++++++++++-
 2 files changed, 1277 insertions(+), 2 deletions(-)

diff --git a/deepmd/dpmodel/fitting/dos_fitting.py b/deepmd/dpmodel/fitting/dos_fitting.py
index 803f31b30f..c8f145ce15 100644
--- a/deepmd/dpmodel/fitting/dos_fitting.py
+++ b/deepmd/dpmodel/fitting/dos_fitting.py
@@ -15,6 +15,10 @@
 from deepmd.dpmodel.fitting.invar_fitting import (
     InvarFitting,
 )
+from deepmd.dpmodel.output_def import (
+    FittingOutputDef,
+    OutputVariableDef,
+)
 
 if TYPE_CHECKING:
     from deepmd.dpmodel.fitting.general_fitting import (
@@ -75,6 +79,19 @@ def __init__(
             default_fparam=default_fparam,
         )
 
+    def output_def(self) -> FittingOutputDef:
+        return FittingOutputDef(
+            [
+                OutputVariableDef(
+                    self.var_name,
+                    [self.dim_out],
+                    reducible=True,
+                    r_differentiable=False,
+                    c_differentiable=False,
+                ),
+            ]
+        )
+
     @classmethod
     def deserialize(cls, data: dict) -> "GeneralFitting":
         data = data.copy()
diff --git a/source/tests/consistent/model/test_dos.py b/source/tests/consistent/model/test_dos.py
index 84437693d6..9c5939b03b 100644
--- a/source/tests/consistent/model/test_dos.py
+++ b/source/tests/consistent/model/test_dos.py
@@ -6,8 +6,18 @@
 
 import numpy as np
 
+from deepmd.dpmodel.common import (
+    to_numpy_array,
+)
 from deepmd.dpmodel.model.dos_model import DOSModel as DOSModelDP
 from deepmd.dpmodel.model.model import get_model as get_model_dp
+from deepmd.dpmodel.utils.nlist import (
+    build_neighbor_list,
+    extend_coord_with_ghosts,
+)
+from deepmd.dpmodel.utils.region import (
+    normalize_coord,
+)
 from deepmd.env import (
     GLOBAL_NP_FLOAT_PRECISION,
 )
@@ -18,6 +28,7 @@
     INSTALLED_PT_EXPT,
     INSTALLED_TF,
     CommonTest,
+    parameterized,
 )
 from .common import (
     ModelTest,
@@ -26,6 +37,8 @@
 if INSTALLED_PT:
     from deepmd.pt.model.model import get_model as get_model_pt
     from deepmd.pt.model.model.dos_model import DOSModel as DOSModelPT
+    from deepmd.pt.utils.utils import to_numpy_array as torch_to_numpy
+    from deepmd.pt.utils.utils import to_torch_tensor as numpy_to_torch
 else:
     DOSModelPT = None
 if INSTALLED_TF:
@@ -38,6 +51,7 @@
 else:
     DOSModelJAX = None
 if INSTALLED_PT_EXPT:
+    from deepmd.pt_expt.common import to_torch_array as pt_expt_numpy_to_torch
     from deepmd.pt_expt.model import DOSModel as DOSModelPTExpt
 else:
     DOSModelPTExpt = None
@@ -222,7 +236,12 @@ def extract_ret(self, ret: Any, backend) -> tuple[np.ndarray, ...]:
 
 @unittest.skipUnless(INSTALLED_PT and INSTALLED_PT_EXPT, "PyTorch is not installed")
 class TestDOSModelAPIs(unittest.TestCase):
-    """Test translated_output_def consistency across dp, pt, and pt_expt backends."""
+    """Test consistency of model-level APIs between pt and dpmodel backends.
+
+    Both models are constructed from the same serialized weights
+    (dpmodel -> serialize -> pt deserialize) so that numerical outputs
+    can be compared directly.
+    """
 
     def setUp(self) -> None:
         data = model_args().normalize_value(
@@ -245,18 +264,80 @@ def setUp(self) -> None:
                     "numb_dos": 2,
                     "neuron": [4, 4, 4],
                     "resnet_dt": True,
-                    "numb_fparam": 0,
                     "precision": "float64",
                     "seed": 1,
+                    "numb_fparam": 2,
+                    "numb_aparam": 3,
+                    "default_fparam": [0.5, -0.3],
                 },
             },
             trim_pattern="_*",
         )
+        # Build dpmodel first, then deserialize into pt/pt_expt to share weights
         self.dp_model = get_model_dp(data)
         serialized = self.dp_model.serialize()
         self.pt_model = DOSModelPT.deserialize(serialized)
         self.pt_expt_model = DOSModelPTExpt.deserialize(serialized)
 
+        # Coords / atype / box
+        self.coords = np.array(
+            [
+                12.83,
+                2.56,
+                2.18,
+                12.09,
+                2.87,
+                2.74,
+                00.25,
+                3.32,
+                1.68,
+                3.36,
+                3.00,
+                1.81,
+                3.51,
+                2.51,
+                2.60,
+                4.27,
+                3.22,
+                1.56,
+            ],
+            dtype=GLOBAL_NP_FLOAT_PRECISION,
+        ).reshape(1, -1, 3)
+        self.atype = np.array([0, 1, 1, 0, 1, 1], dtype=np.int32).reshape(1, -1)
+        self.box = np.array(
+            [13.0, 0.0, 0.0, 0.0, 13.0, 0.0, 0.0, 0.0, 13.0],
+            dtype=GLOBAL_NP_FLOAT_PRECISION,
+        ).reshape(1, 9)
+
+        # Build extended coords + nlist for lower-level calls
+        rcut = 6.0
+        nframes, nloc = self.atype.shape[:2]
+        coord_normalized = normalize_coord(
+            self.coords.reshape(nframes, nloc, 3),
+            self.box.reshape(nframes, 3, 3),
+        )
+        extended_coord, extended_atype, mapping = extend_coord_with_ghosts(
+            coord_normalized, self.atype, self.box, rcut
+        )
+        nlist = build_neighbor_list(
+            extended_coord,
+            extended_atype,
+            nloc,
+            rcut,
+            [20, 20],
+            distinguish_types=True,
+        )
+        self.extended_coord = extended_coord.reshape(nframes, -1, 3)
+        self.extended_atype = extended_atype
+        self.mapping = mapping
+        self.nlist = nlist
+
+        # aparam for forward evaluation (1 frame, 6 atoms, 3 aparam)
+        rng = np.random.default_rng(42)
+        self.eval_aparam = rng.normal(size=(1, nloc, 3)).astype(
+            GLOBAL_NP_FLOAT_PRECISION
+        )
+
     def test_translated_output_def(self) -> None:
         """translated_output_def should return the same keys on dp, pt, and pt_expt."""
         dp_def = self.dp_model.translated_output_def()
@@ -267,3 +348,1180 @@ def test_translated_output_def(self) -> None:
         for key in dp_def:
             self.assertEqual(dp_def[key].shape, pt_def[key].shape)
             self.assertEqual(dp_def[key].shape, pt_expt_def[key].shape)
+
+    def test_get_descriptor(self) -> None:
+        """get_descriptor should return a non-None object on both backends."""
+        self.assertIsNotNone(self.dp_model.get_descriptor())
+        self.assertIsNotNone(self.pt_model.get_descriptor())
+
+    def test_get_fitting_net(self) -> None:
+        """get_fitting_net should return a non-None object on both backends."""
+        self.assertIsNotNone(self.dp_model.get_fitting_net())
+        self.assertIsNotNone(self.pt_model.get_fitting_net())
+
+    def test_get_out_bias(self) -> None:
+        """get_out_bias should return numerically equal values on dp and pt.
+
+        DOSModel uses default apply_out_stat (per-atom type bias),
+        so the bias storage should be consistent across backends.
+        """
+        dp_bias = to_numpy_array(self.dp_model.get_out_bias())
+        pt_bias = torch_to_numpy(self.pt_model.get_out_bias())
+        np.testing.assert_allclose(dp_bias, pt_bias, rtol=1e-10, atol=1e-10)
+        # Verify shape: (n_output_keys x ntypes x numb_dos) for dos
+        self.assertEqual(dp_bias.shape[1], 2)  # ntypes
+        self.assertGreater(dp_bias.shape[0], 0)  # at least one output key
+
+    def test_set_out_bias(self) -> None:
+        """set_out_bias should update the bias on both backends."""
+        dp_bias = to_numpy_array(self.dp_model.get_out_bias())
+        new_bias = dp_bias + 1.0
+        # dp
+        self.dp_model.set_out_bias(new_bias)
+        np.testing.assert_allclose(
+            to_numpy_array(self.dp_model.get_out_bias()),
+            new_bias,
+            rtol=1e-10,
+            atol=1e-10,
+        )
+        # pt
+        self.pt_model.set_out_bias(numpy_to_torch(new_bias))
+        np.testing.assert_allclose(
+            torch_to_numpy(self.pt_model.get_out_bias()),
+            new_bias,
+            rtol=1e-10,
+            atol=1e-10,
+        )
+
+    def test_model_output_def(self) -> None:
+        """model_output_def should return the same keys and shapes on dp and pt."""
+        dp_def = self.dp_model.model_output_def().get_data()
+        pt_def = self.pt_model.model_output_def().get_data()
+        self.assertEqual(set(dp_def.keys()), set(pt_def.keys()))
+        for key in dp_def:
+            self.assertEqual(dp_def[key].shape, pt_def[key].shape)
+
+    def test_model_output_type(self) -> None:
+        """model_output_type should return the same list on dp and pt."""
+        self.assertEqual(
+            self.dp_model.model_output_type(),
+            self.pt_model.model_output_type(),
+        )
+
+    def test_do_grad_r(self) -> None:
+        """do_grad_r should return the same value on dp and pt."""
+        self.assertEqual(
+            self.dp_model.do_grad_r("dos"),
+            self.pt_model.do_grad_r("dos"),
+        )
+        self.assertFalse(self.dp_model.do_grad_r("dos"))
+
+    def test_do_grad_c(self) -> None:
+        """do_grad_c should return the same value on dp and pt."""
+        self.assertEqual(
+            self.dp_model.do_grad_c("dos"),
+            self.pt_model.do_grad_c("dos"),
+        )
+        self.assertFalse(self.dp_model.do_grad_c("dos"))
+
+    def test_get_rcut(self) -> None:
+        """get_rcut should return the same value on dp and pt."""
+        self.assertEqual(self.dp_model.get_rcut(), self.pt_model.get_rcut())
+        self.assertAlmostEqual(self.dp_model.get_rcut(), 6.0)
+
+    def test_get_type_map(self) -> None:
+        """get_type_map should return the same list on dp and pt."""
+        self.assertEqual(self.dp_model.get_type_map(), self.pt_model.get_type_map())
+        self.assertEqual(self.dp_model.get_type_map(), ["O", "H"])
+
+    def test_get_sel(self) -> None:
+        """get_sel should return the same list on dp and pt."""
+        self.assertEqual(self.dp_model.get_sel(), self.pt_model.get_sel())
+        self.assertEqual(self.dp_model.get_sel(), [20, 20])
+
+    def test_get_nsel(self) -> None:
+        """get_nsel should return the same value on dp and pt."""
+        self.assertEqual(self.dp_model.get_nsel(), self.pt_model.get_nsel())
+        self.assertEqual(self.dp_model.get_nsel(), 40)
+
+    def test_get_nnei(self) -> None:
+        """get_nnei should return the same value on dp and pt."""
+        self.assertEqual(self.dp_model.get_nnei(), self.pt_model.get_nnei())
+        self.assertEqual(self.dp_model.get_nnei(), 40)
+
+    def test_mixed_types(self) -> None:
+        """mixed_types should return the same value on dp and pt."""
+        self.assertEqual(self.dp_model.mixed_types(), self.pt_model.mixed_types())
+        # se_e2_a is not mixed-types
+        self.assertFalse(self.dp_model.mixed_types())
+
+    def test_has_message_passing(self) -> None:
+        """has_message_passing should return the same value on dp and pt."""
+        self.assertEqual(
+            self.dp_model.has_message_passing(),
+            self.pt_model.has_message_passing(),
+        )
+        self.assertFalse(self.dp_model.has_message_passing())
+
+    def test_need_sorted_nlist_for_lower(self) -> None:
+        """need_sorted_nlist_for_lower should return the same value on dp and pt."""
+        self.assertEqual(
+            self.dp_model.need_sorted_nlist_for_lower(),
+            self.pt_model.need_sorted_nlist_for_lower(),
+        )
+        self.assertFalse(self.dp_model.need_sorted_nlist_for_lower())
+
+    def test_get_dim_fparam(self) -> None:
+        """get_dim_fparam should return the same value on dp and pt."""
+        self.assertEqual(self.dp_model.get_dim_fparam(), self.pt_model.get_dim_fparam())
+        self.assertEqual(self.dp_model.get_dim_fparam(), 2)
+
+    def test_get_dim_aparam(self) -> None:
+        """get_dim_aparam should return the same value on dp and pt."""
+        self.assertEqual(self.dp_model.get_dim_aparam(), self.pt_model.get_dim_aparam())
+        self.assertEqual(self.dp_model.get_dim_aparam(), 3)
+
+    def test_get_sel_type(self) -> None:
+        """get_sel_type should return the same list on dp and pt."""
+        self.assertEqual(self.dp_model.get_sel_type(), self.pt_model.get_sel_type())
+        self.assertEqual(self.dp_model.get_sel_type(), [0, 1])
+
+    def test_is_aparam_nall(self) -> None:
+        """is_aparam_nall should return the same value on dp and pt."""
+        self.assertEqual(self.dp_model.is_aparam_nall(), self.pt_model.is_aparam_nall())
+        self.assertFalse(self.dp_model.is_aparam_nall())
+
+    def test_atomic_output_def(self) -> None:
+        """atomic_output_def should return the same keys and shapes on dp and pt."""
+        dp_def = self.dp_model.atomic_output_def()
+        pt_def = self.pt_model.atomic_output_def()
+        self.assertEqual(set(dp_def.keys()), set(pt_def.keys()))
+        for key in dp_def.keys():
+            self.assertEqual(dp_def[key].shape, pt_def[key].shape)
+
+    def test_format_nlist(self) -> None:
+        """format_nlist should produce the same result on dp and pt."""
+        dp_nlist = self.dp_model.format_nlist(
+            self.extended_coord,
+            self.extended_atype,
+            self.nlist,
+        )
+        pt_nlist = torch_to_numpy(
+            self.pt_model.format_nlist(
+                numpy_to_torch(self.extended_coord),
+                numpy_to_torch(self.extended_atype),
+                numpy_to_torch(self.nlist),
+            )
+        )
+        np.testing.assert_equal(dp_nlist, pt_nlist)
+
+    def test_forward_common_atomic(self) -> None:
+        """forward_common_atomic should produce consistent results on dp and pt.
+
+        Compares at the atomic_model level, where both backends define this method.
+        """
+        dp_ret = self.dp_model.atomic_model.forward_common_atomic(
+            self.extended_coord,
+            self.extended_atype,
+            self.nlist,
+            mapping=self.mapping,
+            aparam=self.eval_aparam,
+        )
+        pt_ret = self.pt_model.atomic_model.forward_common_atomic(
+            numpy_to_torch(self.extended_coord),
+            numpy_to_torch(self.extended_atype),
+            numpy_to_torch(self.nlist),
+            mapping=numpy_to_torch(self.mapping),
+            aparam=numpy_to_torch(self.eval_aparam),
+        )
+        # Compare the common keys
+        common_keys = set(dp_ret.keys()) & set(pt_ret.keys())
+        self.assertTrue(len(common_keys) > 0)
+        for key in common_keys:
+            if dp_ret[key] is not None and pt_ret[key] is not None:
+                np.testing.assert_allclose(
+                    dp_ret[key],
+                    torch_to_numpy(pt_ret[key]),
+                    rtol=1e-10,
+                    atol=1e-10,
+                    err_msg=f"Mismatch in forward_common_atomic key '{key}'",
+                )
+
+    def test_has_default_fparam(self) -> None:
+        """has_default_fparam should return the same value on dp and pt."""
+        self.assertEqual(
+            self.dp_model.has_default_fparam(),
+            self.pt_model.has_default_fparam(),
+        )
+        self.assertTrue(self.dp_model.has_default_fparam())
+
+    def test_get_default_fparam(self) -> None:
+        """get_default_fparam should return consistent values on dp and pt."""
+        dp_val = self.dp_model.get_default_fparam()
+        pt_val = self.pt_model.get_default_fparam()
+        np.testing.assert_allclose(dp_val, pt_val, rtol=1e-10, atol=1e-10)
+        np.testing.assert_allclose(dp_val, [0.5, -0.3], rtol=1e-10, atol=1e-10)
+
+    def _get_fitting_stats(self, model, backend="dp"):
+        """Extract fparam/aparam stats from a model's fitting net."""
+        fitting = model.get_fitting_net()
+        if backend == "pt":
+            return {
+                "fparam_avg": torch_to_numpy(fitting.fparam_avg),
+                "fparam_inv_std": torch_to_numpy(fitting.fparam_inv_std),
+                "aparam_avg": torch_to_numpy(fitting.aparam_avg),
+                "aparam_inv_std": torch_to_numpy(fitting.aparam_inv_std),
+            }
+        else:
+            return {
+                "fparam_avg": to_numpy_array(fitting.fparam_avg),
+                "fparam_inv_std": to_numpy_array(fitting.fparam_inv_std),
+                "aparam_avg": to_numpy_array(fitting.aparam_avg),
+                "aparam_inv_std": to_numpy_array(fitting.aparam_inv_std),
+            }
+
+    def test_change_out_bias(self) -> None:
+        """change_out_bias should produce consistent bias and fitting stats on dp, pt, and pt_expt.
+
+        DOSModel uses default apply_out_stat (per-atom type bias),
+        so set-by-statistic should change the bias from initial values.
+        """
+        nframes = 2
+        nloc = 6
+        numb_fparam = 2
+        numb_aparam = 3
+        rng = np.random.default_rng(123)
+
+        # Use realistic coords (from setUp, tiled for 2 frames)
+        coords_2f = np.tile(self.coords, (nframes, 1, 1))  # (2, 6, 3)
+        atype_2f = np.array([[0, 0, 1, 1, 1, 1], [0, 1, 1, 0, 1, 1]], dtype=np.int32)
+        box_2f = np.tile(self.box.reshape(1, 3, 3), (nframes, 1, 1))
+        natoms_data = np.array([[6, 6, 2, 4], [6, 6, 2, 4]], dtype=np.int32)
+        dos_data = rng.normal(size=(nframes, 2)).astype(GLOBAL_NP_FLOAT_PRECISION)
+        fparam_data = rng.normal(size=(nframes, numb_fparam)).astype(
+            GLOBAL_NP_FLOAT_PRECISION
+        )
+        aparam_data = rng.normal(size=(nframes, nloc, numb_aparam)).astype(
+            GLOBAL_NP_FLOAT_PRECISION
+        )
+
+        # dpmodel stat data (numpy)
+        dp_merged = [
+            {
+                "coord": coords_2f,
+                "atype": atype_2f,
+                "atype_ext": atype_2f,
+                "box": box_2f,
+                "natoms": natoms_data,
+                "dos": dos_data,
+                "find_dos": np.float32(1.0),
+                "fparam": fparam_data,
+                "aparam": aparam_data,
+            }
+        ]
+        # pt stat data (torch tensors)
+        pt_merged = [
+            {
+                "coord": numpy_to_torch(coords_2f),
+                "atype": numpy_to_torch(atype_2f),
+                "atype_ext": numpy_to_torch(atype_2f),
+                "box": numpy_to_torch(box_2f),
+                "natoms": numpy_to_torch(natoms_data),
+                "dos": numpy_to_torch(dos_data),
+                "find_dos": np.float32(1.0),
+                "fparam": numpy_to_torch(fparam_data),
+                "aparam": numpy_to_torch(aparam_data),
+            }
+        ]
+        # pt_expt stat data (numpy, same as dp)
+        pe_merged = dp_merged
+
+        # Save initial fitting stats (all zeros / ones)
+        dp_stats_init = self._get_fitting_stats(self.dp_model, "dp")
+
+        # Save initial (zero) bias
+        dp_bias_init = to_numpy_array(self.dp_model.get_out_bias()).copy()
+
+        # --- Test "set-by-statistic" mode ---
+        self.dp_model.change_out_bias(dp_merged, bias_adjust_mode="set-by-statistic")
+        self.pt_model.change_out_bias(pt_merged, bias_adjust_mode="set-by-statistic")
+        self.pt_expt_model.change_out_bias(
+            pe_merged, bias_adjust_mode="set-by-statistic"
+        )
+
+        # Verify out bias consistency
+        dp_bias = to_numpy_array(self.dp_model.get_out_bias())
+        pt_bias = torch_to_numpy(self.pt_model.get_out_bias())
+        pe_bias = to_numpy_array(self.pt_expt_model.get_out_bias())
+        np.testing.assert_allclose(dp_bias, pt_bias, rtol=1e-10, atol=1e-10)
+        np.testing.assert_allclose(dp_bias, pe_bias, rtol=1e-10, atol=1e-10)
+
+        # Verify fitting input stats were updated (set-by-statistic triggers compute_fitting_input_stat)
+        dp_stats_set = self._get_fitting_stats(self.dp_model, "dp")
+        pt_stats_set = self._get_fitting_stats(self.pt_model, "pt")
+        pe_stats_set = self._get_fitting_stats(self.pt_expt_model, "dp")
+        for stat_key in (
+            "fparam_avg",
+            "fparam_inv_std",
+            "aparam_avg",
+            "aparam_inv_std",
+        ):
+            np.testing.assert_allclose(
+                dp_stats_set[stat_key],
+                pt_stats_set[stat_key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"dp vs pt {stat_key} mismatch after set-by-statistic",
+            )
+            np.testing.assert_allclose(
+                dp_stats_set[stat_key],
+                pe_stats_set[stat_key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"dp vs pt_expt {stat_key} mismatch after set-by-statistic",
+            )
+        # Verify fparam/aparam stats actually changed from initial values
+        self.assertFalse(
+            np.allclose(dp_stats_set["fparam_avg"], dp_stats_init["fparam_avg"]),
+            "set-by-statistic did not update fparam_avg",
+        )
+        self.assertFalse(
+            np.allclose(dp_stats_set["aparam_avg"], dp_stats_init["aparam_avg"]),
+            "set-by-statistic did not update aparam_avg",
+        )
+
+        # --- Test "change-by-statistic" mode ---
+        dp_bias_before = dp_bias.copy()
+        self.dp_model.change_out_bias(dp_merged, bias_adjust_mode="change-by-statistic")
+        self.pt_model.change_out_bias(pt_merged, bias_adjust_mode="change-by-statistic")
+        self.pt_expt_model.change_out_bias(
+            pe_merged, bias_adjust_mode="change-by-statistic"
+        )
+
+        # Verify out bias consistency
+        dp_bias2 = to_numpy_array(self.dp_model.get_out_bias())
+        pt_bias2 = torch_to_numpy(self.pt_model.get_out_bias())
+        pe_bias2 = to_numpy_array(self.pt_expt_model.get_out_bias())
+        np.testing.assert_allclose(dp_bias2, pt_bias2, rtol=1e-10, atol=1e-10)
+        np.testing.assert_allclose(dp_bias2, pe_bias2, rtol=1e-10, atol=1e-10)
+
+        # Verify fitting input stats did NOT change (change-by-statistic should not recompute them)
+        dp_stats_chg = self._get_fitting_stats(self.dp_model, "dp")
+        pt_stats_chg = self._get_fitting_stats(self.pt_model, "pt")
+        pe_stats_chg = self._get_fitting_stats(self.pt_expt_model, "dp")
+        for stat_key in (
+            "fparam_avg",
+            "fparam_inv_std",
+            "aparam_avg",
+            "aparam_inv_std",
+        ):
+            np.testing.assert_allclose(
+                dp_stats_chg[stat_key],
+                dp_stats_set[stat_key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"dp {stat_key} changed after change-by-statistic (should not)",
+            )
+            np.testing.assert_allclose(
+                pt_stats_chg[stat_key],
+                pt_stats_set[stat_key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"pt {stat_key} changed after change-by-statistic (should not)",
+            )
+            np.testing.assert_allclose(
+                pe_stats_chg[stat_key],
+                pe_stats_set[stat_key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"pt_expt {stat_key} changed after change-by-statistic (should not)",
+            )
+
+    def test_change_type_map(self) -> None:
+        """change_type_map should produce consistent results on dp and pt.
+
+        Uses a DPA1 (se_atten) descriptor since se_e2_a does not support
+        change_type_map (non-mixed-types descriptors raise NotImplementedError).
+        """
+        from deepmd.utils.argcheck import model_args as model_args_fn
+
+        data = model_args_fn().normalize_value(
+            {
+                "type_map": ["O", "H"],
+                "descriptor": {
+                    "type": "se_atten",
+                    "sel": 20,
+                    "rcut_smth": 0.50,
+                    "rcut": 6.00,
+                    "neuron": [3, 6],
+                    "resnet_dt": False,
+                    "axis_neuron": 2,
+                    "precision": "float64",
+                    "seed": 1,
+                    "attn": 6,
+                    "attn_layer": 0,
+                },
+                "fitting_net": {
+                    "type": "dos",
+                    "numb_dos": 2,
+                    "neuron": [4, 4, 4],
+                    "resnet_dt": True,
+                    "precision": "float64",
+                    "seed": 1,
+                },
+            },
+            trim_pattern="_*",
+        )
+        dp_model = get_model_dp(data)
+        pt_model = DOSModelPT.deserialize(dp_model.serialize())
+
+        # Set non-zero out_bias so the swap is non-trivial
+        dp_bias_orig = to_numpy_array(dp_model.get_out_bias()).copy()
+        new_bias = dp_bias_orig.copy()
+        new_bias[:, 0, :] = 1.5  # type 0 ("O")
+        new_bias[:, 1, :] = -3.7  # type 1 ("H")
+        dp_model.set_out_bias(new_bias)
+        pt_model.set_out_bias(numpy_to_torch(new_bias))
+
+        new_type_map = ["H", "O"]
+        dp_model.change_type_map(new_type_map)
+        pt_model.change_type_map(new_type_map)
+
+        # Both should have the new type_map
+        self.assertEqual(dp_model.get_type_map(), new_type_map)
+        self.assertEqual(pt_model.get_type_map(), new_type_map)
+
+        # Out_bias should be reordered consistently between backends
+        dp_bias_new = to_numpy_array(dp_model.get_out_bias())
+        pt_bias_new = torch_to_numpy(pt_model.get_out_bias())
+        np.testing.assert_allclose(dp_bias_new, pt_bias_new, rtol=1e-10, atol=1e-10)
+
+        # Verify the reorder is correct: old type 0 -> new type 1, old type 1 -> new type 0
+        np.testing.assert_allclose(
+            dp_bias_new[:, 0, :],
+            new_bias[:, 1, :],
+            rtol=1e-10,
+            atol=1e-10,
+        )
+        np.testing.assert_allclose(
+            dp_bias_new[:, 1, :],
+            new_bias[:, 0, :],
+            rtol=1e-10,
+            atol=1e-10,
+        )
+
+    def test_change_type_map_extend_stat(self) -> None:
+        """change_type_map with model_with_new_type_stat should propagate stats consistently across dp, pt, and pt_expt.
+
+        Verifies that the model-level change_type_map correctly unwraps
+        model_with_new_type_stat.atomic_model before forwarding to the
+        atomic model.
+        """
+        from deepmd.utils.argcheck import model_args as model_args_fn
+
+        small_tm = ["O", "H"]
+        large_tm = ["O", "H", "Li"]
+
+        small_data = model_args_fn().normalize_value(
+            {
+                "type_map": small_tm,
+                "descriptor": {
+                    "type": "se_atten",
+                    "sel": 20,
+                    "rcut_smth": 0.50,
+                    "rcut": 6.00,
+                    "neuron": [3, 6],
+                    "resnet_dt": False,
+                    "axis_neuron": 2,
+                    "precision": "float64",
+                    "seed": 1,
+                    "attn": 6,
+                    "attn_layer": 0,
+                },
+                "fitting_net": {
+                    "type": "dos",
+                    "numb_dos": 2,
+                    "neuron": [4, 4, 4],
+                    "resnet_dt": True,
+                    "precision": "float64",
+                    "seed": 1,
+                },
+            },
+            trim_pattern="_*",
+        )
+        large_data = model_args_fn().normalize_value(
+            {
+                "type_map": large_tm,
+                "descriptor": {
+                    "type": "se_atten",
+                    "sel": 20,
+                    "rcut_smth": 0.50,
+                    "rcut": 6.00,
+                    "neuron": [3, 6],
+                    "resnet_dt": False,
+                    "axis_neuron": 2,
+                    "precision": "float64",
+                    "seed": 2,
+                    "attn": 6,
+                    "attn_layer": 0,
+                },
+                "fitting_net": {
+                    "type": "dos",
+                    "numb_dos": 2,
+                    "neuron": [4, 4, 4],
+                    "resnet_dt": True,
+                    "precision": "float64",
+                    "seed": 2,
+                },
+            },
+            trim_pattern="_*",
+        )
+
+        dp_small = get_model_dp(small_data)
+        dp_large = get_model_dp(large_data)
+
+        # Set distinguishable random stats on the large model's descriptor
+        rng = np.random.default_rng(42)
+        desc_large = dp_large.get_descriptor()
+        mean_large, std_large = desc_large.get_stat_mean_and_stddev()
+        mean_rand = rng.random(size=to_numpy_array(mean_large).shape)
+        std_rand = rng.random(size=to_numpy_array(std_large).shape)
+        desc_large.set_stat_mean_and_stddev(mean_rand, std_rand)
+
+        # Build pt and pt_expt models from dp serialization
+        pt_small = DOSModelPT.deserialize(dp_small.serialize())
+        pt_large = DOSModelPT.deserialize(dp_large.serialize())
+        pt_expt_small = DOSModelPTExpt.deserialize(dp_small.serialize())
+        pt_expt_large = DOSModelPTExpt.deserialize(dp_large.serialize())
+
+        # Extend type map with model_with_new_type_stat at the model level
+        dp_small.change_type_map(large_tm, model_with_new_type_stat=dp_large)
+        pt_small.change_type_map(large_tm, model_with_new_type_stat=pt_large)
+        pt_expt_small.change_type_map(large_tm, model_with_new_type_stat=pt_expt_large)
+
+        # Descriptor stats should be consistent across backends
+        dp_mean, dp_std = dp_small.get_descriptor().get_stat_mean_and_stddev()
+        pt_mean, pt_std = pt_small.get_descriptor().get_stat_mean_and_stddev()
+        pt_expt_mean, pt_expt_std = (
+            pt_expt_small.get_descriptor().get_stat_mean_and_stddev()
+        )
+        np.testing.assert_allclose(
+            to_numpy_array(dp_mean),
+            torch_to_numpy(pt_mean),
+            rtol=1e-10,
+            atol=1e-10,
+        )
+        np.testing.assert_allclose(
+            to_numpy_array(dp_std),
+            torch_to_numpy(pt_std),
+            rtol=1e-10,
+            atol=1e-10,
+        )
+        np.testing.assert_allclose(
+            to_numpy_array(dp_mean),
+            to_numpy_array(pt_expt_mean),
+            rtol=1e-10,
+            atol=1e-10,
+        )
+        np.testing.assert_allclose(
+            to_numpy_array(dp_std),
+            to_numpy_array(pt_expt_std),
+            rtol=1e-10,
+            atol=1e-10,
+        )
+
+    def test_update_sel(self) -> None:
+        """update_sel should return the same result on dp and pt."""
+        from unittest.mock import (
+            patch,
+        )
+
+        from deepmd.dpmodel.model.dp_model import DPModelCommon as DPModelCommonDP
+        from deepmd.pt.model.model.dp_model import DPModelCommon as DPModelCommonPT
+
+        mock_min_nbor_dist = 0.5
+        mock_sel = [10, 20]
+        local_jdata = {
+            "type_map": ["O", "H"],
+            "descriptor": {
+                "type": "se_e2_a",
+                "sel": "auto",
+                "rcut_smth": 0.50,
+                "rcut": 6.00,
+            },
+            "fitting_net": {
+                "type": "dos",
+                "numb_dos": 2,
+                "neuron": [4, 4, 4],
+            },
+        }
+        type_map = ["O", "H"]
+
+        with patch(
+            "deepmd.dpmodel.utils.update_sel.UpdateSel.get_nbor_stat",
+            return_value=(mock_min_nbor_dist, mock_sel),
+        ):
+            dp_result, dp_min_dist = DPModelCommonDP.update_sel(
+                None, type_map, local_jdata
+            )
+
+        with patch(
+            "deepmd.pt.utils.update_sel.UpdateSel.get_nbor_stat",
+            return_value=(mock_min_nbor_dist, mock_sel),
+        ):
+            pt_result, pt_min_dist = DPModelCommonPT.update_sel(
+                None, type_map, local_jdata
+            )
+
+        self.assertEqual(dp_result, pt_result)
+        self.assertEqual(dp_min_dist, pt_min_dist)
+        # Verify sel was actually updated (not still "auto")
+        self.assertIsInstance(dp_result["descriptor"]["sel"], list)
+        self.assertNotEqual(dp_result["descriptor"]["sel"], "auto")
+
+    def test_get_ntypes(self) -> None:
+        """get_ntypes should return the same value on dp and pt."""
+        self.assertEqual(self.dp_model.get_ntypes(), self.pt_model.get_ntypes())
+        self.assertEqual(self.dp_model.get_ntypes(), 2)
+
+    def test_compute_or_load_out_stat(self) -> None:
+        """compute_or_load_out_stat should produce consistent bias on dp and pt.
+
+        Tests both the compute path (from data) and the load path (from file).
+        DOSModel uses default apply_out_stat (per-atom type bias),
+        so the stored bias should be consistent across backends.
+        """
+        import tempfile
+        from pathlib import (
+            Path,
+        )
+
+        import h5py
+
+        from deepmd.utils.path import (
+            DPPath,
+        )
+
+        nframes = 2
+        coords_2f = np.tile(self.coords, (nframes, 1, 1))
+        atype_2f = np.array([[0, 0, 1, 1, 1, 1], [0, 1, 1, 0, 1, 1]], dtype=np.int32)
+        box_2f = np.tile(self.box.reshape(1, 3, 3), (nframes, 1, 1))
+        natoms_data = np.array([[6, 6, 2, 4], [6, 6, 2, 4]], dtype=np.int32)
+        dos_data = (
+            np.random.default_rng(42)
+            .normal(size=(nframes, 2))
+            .astype(GLOBAL_NP_FLOAT_PRECISION)
+        )
+
+        dp_merged = [
+            {
+                "coord": coords_2f,
+                "atype": atype_2f,
+                "atype_ext": atype_2f,
+                "box": box_2f,
+                "natoms": natoms_data,
+                "dos": dos_data,
+                "find_dos": np.float32(1.0),
+            }
+        ]
+        pt_merged = [
+            {
+                "coord": numpy_to_torch(coords_2f),
+                "atype": numpy_to_torch(atype_2f),
+                "atype_ext": numpy_to_torch(atype_2f),
+                "box": numpy_to_torch(box_2f),
+                "natoms": numpy_to_torch(natoms_data),
+                "dos": numpy_to_torch(dos_data),
+                "find_dos": np.float32(1.0),
+            }
+        ]
+
+        # Verify bias is initially identical
+        dp_bias_before = to_numpy_array(self.dp_model.get_out_bias()).copy()
+        pt_bias_before = torch_to_numpy(self.pt_model.get_out_bias()).copy()
+        np.testing.assert_allclose(
+            dp_bias_before, pt_bias_before, rtol=1e-10, atol=1e-10
+        )
+
+        with tempfile.TemporaryDirectory() as tmpdir:
+            # Create separate h5 files for dp and pt
+            dp_h5 = str((Path(tmpdir) / "dp_stat.h5").resolve())
+            pt_h5 = str((Path(tmpdir) / "pt_stat.h5").resolve())
+            with h5py.File(dp_h5, "w"):
+                pass
+            with h5py.File(pt_h5, "w"):
+                pass
+            dp_stat_path = DPPath(dp_h5, "a")
+            pt_stat_path = DPPath(pt_h5, "a")
+
+            # 1. Compute stats and save to file
+            self.dp_model.atomic_model.compute_or_load_out_stat(
+                dp_merged, stat_file_path=dp_stat_path
+            )
+            self.pt_model.atomic_model.compute_or_load_out_stat(
+                pt_merged, stat_file_path=pt_stat_path
+            )
+
+            dp_bias_after = to_numpy_array(self.dp_model.get_out_bias())
+            pt_bias_after = torch_to_numpy(self.pt_model.get_out_bias())
+            np.testing.assert_allclose(
+                dp_bias_after, pt_bias_after, rtol=1e-10, atol=1e-10
+            )
+
+            # 2. Verify both backends saved the same file content
+            with h5py.File(dp_h5, "r") as dp_f, h5py.File(pt_h5, "r") as pt_f:
+                dp_keys = sorted(dp_f.keys())
+                pt_keys = sorted(pt_f.keys())
+                self.assertEqual(dp_keys, pt_keys)
+                for key in dp_keys:
+                    np.testing.assert_allclose(
+                        np.array(dp_f[key]),
+                        np.array(pt_f[key]),
+                        rtol=1e-10,
+                        atol=1e-10,
+                        err_msg=f"Stat file content mismatch for key {key}",
+                    )
+
+            # 3. Reset biases to zero, then load from file
+            zero_bias = np.zeros_like(dp_bias_after)
+            self.dp_model.set_out_bias(zero_bias)
+            self.pt_model.set_out_bias(numpy_to_torch(zero_bias))
+
+            # Use a callable that raises to ensure it loads from file, not recomputes
+            def raise_error():
+                raise RuntimeError("Should not recompute — should load from file")
+
+            self.dp_model.atomic_model.compute_or_load_out_stat(
+                raise_error, stat_file_path=dp_stat_path
+            )
+            self.pt_model.atomic_model.compute_or_load_out_stat(
+                raise_error, stat_file_path=pt_stat_path
+            )
+
+            dp_bias_loaded = to_numpy_array(self.dp_model.get_out_bias())
+            pt_bias_loaded = torch_to_numpy(self.pt_model.get_out_bias())
+
+            # Loaded biases should match between backends
+            np.testing.assert_allclose(
+                dp_bias_loaded, pt_bias_loaded, rtol=1e-10, atol=1e-10
+            )
+            # Loaded biases should match the originally computed biases
+            np.testing.assert_allclose(
+                dp_bias_loaded, dp_bias_after, rtol=1e-10, atol=1e-10
+            )
+
+    def test_get_observed_type_list(self) -> None:
+        """get_observed_type_list should be consistent across dp, pt, pt_expt.
+
+        Uses mock data containing only type 0 ("O") so that type 1 ("H") is
+        unobserved and should be absent from the returned list.
+        """
+        nframes = 2
+        natoms = 6
+        # All atoms are type 0 — type 1 is unobserved
+        atype_2f = np.zeros((nframes, natoms), dtype=np.int32)
+        coords_2f = np.tile(self.coords, (nframes, 1, 1))
+        box_2f = np.tile(self.box.reshape(1, 3, 3), (nframes, 1, 1))
+        natoms_data = np.array([[natoms, natoms, natoms, 0]] * nframes, dtype=np.int32)
+        dos_data = (
+            np.random.default_rng(42)
+            .normal(size=(nframes, 2))
+            .astype(GLOBAL_NP_FLOAT_PRECISION)
+        )
+
+        dp_merged = [
+            {
+                "coord": coords_2f,
+                "atype": atype_2f,
+                "atype_ext": atype_2f,
+                "box": box_2f,
+                "natoms": natoms_data,
+                "dos": dos_data,
+                "find_dos": np.float32(1.0),
+            }
+        ]
+        pt_merged = [
+            {
+                "coord": numpy_to_torch(coords_2f),
+                "atype": numpy_to_torch(atype_2f),
+                "atype_ext": numpy_to_torch(atype_2f),
+                "box": numpy_to_torch(box_2f),
+                "natoms": numpy_to_torch(natoms_data),
+                "dos": numpy_to_torch(dos_data),
+                "find_dos": np.float32(1.0),
+            }
+        ]
+
+        self.dp_model.atomic_model.compute_or_load_out_stat(dp_merged)
+        self.pt_model.atomic_model.compute_or_load_out_stat(pt_merged)
+        self.pt_expt_model.atomic_model.compute_or_load_out_stat(dp_merged)
+
+        dp_observed = self.dp_model.get_observed_type_list()
+        pt_observed = self.pt_model.get_observed_type_list()
+        pe_observed = self.pt_expt_model.get_observed_type_list()
+
+        self.assertEqual(dp_observed, pt_observed)
+        self.assertEqual(dp_observed, pe_observed)
+        # DOS uses get_compute_stats_distinguish_types()=True (default),
+        # so only observed types get non-zero bias — only type 0 ("O").
+        self.assertEqual(dp_observed, ["O"])
+
+
+def _compare_variables_recursive(
+    d1: dict, d2: dict, path: str = "", rtol: float = 1e-10, atol: float = 1e-10
+) -> None:
+    """Recursively compare ``@variables`` sections in two serialized dicts."""
+    for key in d1:
+        if key not in d2:
+            continue
+        child_path = f"{path}/{key}" if path else key
+        v1, v2 = d1[key], d2[key]
+        if key == "@variables" and isinstance(v1, dict) and isinstance(v2, dict):
+            for vk in v1:
+                if vk not in v2:
+                    continue
+                a1 = np.asarray(v1[vk]) if v1[vk] is not None else None
+                a2 = np.asarray(v2[vk]) if v2[vk] is not None else None
+                if a1 is None and a2 is None:
+                    continue
+                np.testing.assert_allclose(
+                    a1,
+                    a2,
+                    rtol=rtol,
+                    atol=atol,
+                    err_msg=f"@variables mismatch at {child_path}/{vk}",
+                )
+        elif isinstance(v1, dict) and isinstance(v2, dict):
+            _compare_variables_recursive(v1, v2, child_path, rtol, atol)
+
+
+@parameterized(
+    (([], []), ([[0, 1]], [1])),  # (pair_exclude_types, atom_exclude_types)
+    (False, True),  # fparam_in_data
+)
+@unittest.skipUnless(INSTALLED_PT and INSTALLED_PT_EXPT, "PT and PT_EXPT are required")
+class TestDOSComputeOrLoadStat(unittest.TestCase):
+    """Test that compute_or_load_stat produces identical statistics on dp, pt, and pt_expt.
+
+    Covers descriptor stats (dstd), fitting stats (fparam, aparam), and output bias.
+    Parameterized over exclusion types and whether fparam is explicitly provided or
+    injected via default_fparam.
+    """
+
+    def setUp(self) -> None:
+        (pair_exclude_types, atom_exclude_types), self.fparam_in_data = self.param
+        data = model_args().normalize_value(
+            {
+                "type_map": ["O", "H"],
+                "pair_exclude_types": pair_exclude_types,
+                "atom_exclude_types": atom_exclude_types,
+                "descriptor": {
+                    "type": "dpa3",
+                    "repflow": {
+                        "n_dim": 20,
+                        "e_dim": 10,
+                        "a_dim": 8,
+                        "nlayers": 3,
+                        "e_rcut": 6.0,
+                        "e_rcut_smth": 5.0,
+                        "e_sel": 10,
+                        "a_rcut": 4.0,
+                        "a_rcut_smth": 3.5,
+                        "a_sel": 8,
+                        "axis_neuron": 4,
+                        "update_angle": True,
+                        "update_style": "res_residual",
+                        "update_residual": 0.1,
+                        "update_residual_init": "const",
+                    },
+                    "precision": "float64",
+                    "seed": 1,
+                },
+                "fitting_net": {
+                    "type": "dos",
+                    "numb_dos": 2,
+                    "neuron": [10, 10],
+                    "precision": "float64",
+                    "seed": 1,
+                    "numb_fparam": 2,
+                    "default_fparam": [0.5, -0.3],
+                    "numb_aparam": 3,
+                },
+            },
+            trim_pattern="_*",
+        )
+
+        # Save data for reuse in load-from-file test
+        self._model_data = data
+
+        # Build dp model, then deserialize into pt and pt_expt to share weights
+        self.dp_model = get_model_dp(data)
+        serialized = self.dp_model.serialize()
+        self.pt_model = DOSModelPT.deserialize(serialized)
+        self.pt_expt_model = DOSModelPTExpt.deserialize(serialized)
+
+        # Test coords / atype / box for forward evaluation
+        self.coords = np.array(
+            [
+                12.83,
+                2.56,
+                2.18,
+                12.09,
+                2.87,
+                2.74,
+                0.25,
+                3.32,
+                1.68,
+                3.36,
+                3.00,
+                1.81,
+                3.51,
+                2.51,
+                2.60,
+                4.27,
+                3.22,
+                1.56,
+            ],
+            dtype=GLOBAL_NP_FLOAT_PRECISION,
+        ).reshape(1, -1, 3)
+        self.atype = np.array([0, 1, 1, 0, 1, 1], dtype=np.int32).reshape(1, -1)
+        self.box = np.array(
+            [13.0, 0.0, 0.0, 0.0, 13.0, 0.0, 0.0, 0.0, 13.0],
+            dtype=GLOBAL_NP_FLOAT_PRECISION,
+        ).reshape(1, 9)
+
+        # Mock training data for compute_or_load_stat
+        natoms = 6
+        nframes = 3
+        rng = np.random.default_rng(42)
+        coords_stat = rng.normal(size=(nframes, natoms, 3)).astype(
+            GLOBAL_NP_FLOAT_PRECISION
+        )
+        atype_stat = np.array([[0, 0, 1, 1, 1, 1]] * nframes, dtype=np.int32)
+        box_stat = np.tile(
+            np.eye(3, dtype=GLOBAL_NP_FLOAT_PRECISION).reshape(1, 3, 3) * 13.0,
+            (nframes, 1, 1),
+        )
+        natoms_stat = np.array([[natoms, natoms, 2, 4]] * nframes, dtype=np.int32)
+        dos_stat = rng.normal(size=(nframes, 2)).astype(GLOBAL_NP_FLOAT_PRECISION)
+        aparam_stat = rng.normal(size=(nframes, natoms, 3)).astype(
+            GLOBAL_NP_FLOAT_PRECISION
+        )
+
+        # dp / pt_expt sample (numpy)
+        np_sample = {
+            "coord": coords_stat,
+            "atype": atype_stat,
+            "atype_ext": atype_stat,
+            "box": box_stat,
+            "natoms": natoms_stat,
+            "dos": dos_stat,
+            "find_dos": np.float32(1.0),
+            "aparam": aparam_stat,
+        }
+        # pt sample (torch tensors)
+        pt_sample = {
+            "coord": numpy_to_torch(coords_stat),
+            "atype": numpy_to_torch(atype_stat),
+            "atype_ext": numpy_to_torch(atype_stat),
+            "box": numpy_to_torch(box_stat),
+            "natoms": numpy_to_torch(natoms_stat),
+            "dos": numpy_to_torch(dos_stat),
+            "find_dos": np.float32(1.0),
+            "aparam": numpy_to_torch(aparam_stat),
+        }
+
+        if self.fparam_in_data:
+            fparam_stat = rng.normal(size=(nframes, 2)).astype(
+                GLOBAL_NP_FLOAT_PRECISION
+            )
+            np_sample["fparam"] = fparam_stat
+            pt_sample["fparam"] = numpy_to_torch(fparam_stat)
+            self.expected_fparam_avg = np.mean(fparam_stat, axis=0)
+        else:
+            # No fparam -> _make_wrapped_sampler injects default_fparam
+            self.expected_fparam_avg = np.array([0.5, -0.3])
+
+        self.np_sampled = [np_sample]
+        self.pt_sampled = [pt_sample]
+
+        # aparam for forward evaluation (1 frame, 6 atoms, 3 aparam)
+        self.eval_aparam = rng.normal(size=(1, natoms, 3)).astype(
+            GLOBAL_NP_FLOAT_PRECISION
+        )
+
+    def _eval_dp(self) -> dict:
+        return self.dp_model(
+            self.coords, self.atype, box=self.box, aparam=self.eval_aparam
+        )
+
+    def _eval_pt(self) -> dict:
+        return {
+            kk: torch_to_numpy(vv)
+            for kk, vv in self.pt_model(
+                numpy_to_torch(self.coords),
+                numpy_to_torch(self.atype),
+                box=numpy_to_torch(self.box),
+                aparam=numpy_to_torch(self.eval_aparam),
+                do_atomic_virial=True,
+            ).items()
+        }
+
+    def _eval_pt_expt(self) -> dict:
+        coord_t = pt_expt_numpy_to_torch(self.coords)
+        coord_t.requires_grad_(True)
+        return {
+            k: v.detach().cpu().numpy()
+            for k, v in self.pt_expt_model(
+                coord_t,
+                pt_expt_numpy_to_torch(self.atype),
+                box=pt_expt_numpy_to_torch(self.box),
+                aparam=pt_expt_numpy_to_torch(self.eval_aparam),
+                do_atomic_virial=True,
+            ).items()
+        }
+
+    def test_compute_stat(self) -> None:
+        # 1. Pre-stat forward consistency
+        dp_ret0 = self._eval_dp()
+        pt_ret0 = self._eval_pt()
+        pe_ret0 = self._eval_pt_expt()
+        for key in ("dos", "atom_dos"):
+            np.testing.assert_allclose(
+                dp_ret0[key],
+                pt_ret0[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"Pre-stat dp vs pt mismatch in {key}",
+            )
+            np.testing.assert_allclose(
+                dp_ret0[key],
+                pe_ret0[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"Pre-stat dp vs pt_expt mismatch in {key}",
+            )
+
+        # 2. Run compute_or_load_stat on all three backends
+        self.dp_model.compute_or_load_stat(lambda: self.np_sampled)
+        self.pt_model.compute_or_load_stat(lambda: self.pt_sampled)
+        self.pt_expt_model.compute_or_load_stat(lambda: self.np_sampled)
+
+        # 3. Serialize all three and compare @variables
+        dp_ser = self.dp_model.serialize()
+        pt_ser = self.pt_model.serialize()
+        pe_ser = self.pt_expt_model.serialize()
+        _compare_variables_recursive(dp_ser, pt_ser)
+        _compare_variables_recursive(dp_ser, pe_ser)
+
+        # 4. Post-stat forward consistency
+        # DOSModel uses default apply_out_stat (per-atom type bias), so
+        # output values WILL differ from pre-stat after stat computation.
+        dp_ret1 = self._eval_dp()
+        pt_ret1 = self._eval_pt()
+        pe_ret1 = self._eval_pt_expt()
+        for key in ("dos", "atom_dos"):
+            np.testing.assert_allclose(
+                dp_ret1[key],
+                pt_ret1[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"Post-stat dp vs pt mismatch in {key}",
+            )
+            np.testing.assert_allclose(
+                dp_ret1[key],
+                pe_ret1[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"Post-stat dp vs pt_expt mismatch in {key}",
+            )
+
+        # 5. Non-triviality checks
+        fit_vars = dp_ser["fitting"]["@variables"]
+        # fparam stats were computed
+        fparam_avg = np.asarray(fit_vars["fparam_avg"])
+        self.assertFalse(
+            np.allclose(fparam_avg, 0.0),
+            "fparam_avg is still zero — fparam stats were not computed",
+        )
+        np.testing.assert_allclose(
+            fparam_avg,
+            self.expected_fparam_avg,
+            rtol=1e-10,
+            atol=1e-10,
+            err_msg="fparam_avg does not match expected values",
+        )
+        # aparam stats were computed
+        aparam_avg = np.asarray(fit_vars["aparam_avg"])
+        self.assertFalse(
+            np.allclose(aparam_avg, 0.0),
+            "aparam_avg is still zero — aparam stats were not computed",
+        )
+
+    def test_load_stat_from_file(self) -> None:
+        import tempfile
+        from pathlib import (
+            Path,
+        )
+
+        import h5py
+
+        from deepmd.utils.path import (
+            DPPath,
+        )
+
+        with tempfile.TemporaryDirectory() as tmpdir:
+            # Create separate stat files for each backend
+            dp_h5 = str((Path(tmpdir) / "dp_stat.h5").resolve())
+            pt_h5 = str((Path(tmpdir) / "pt_stat.h5").resolve())
+            pe_h5 = str((Path(tmpdir) / "pe_stat.h5").resolve())
+            for p in (dp_h5, pt_h5, pe_h5):
+                with h5py.File(p, "w"):
+                    pass
+
+            # 1. Compute stats and save to file
+            self.dp_model.compute_or_load_stat(
+                lambda: self.np_sampled, stat_file_path=DPPath(dp_h5, "a")
+            )
+            self.pt_model.compute_or_load_stat(
+                lambda: self.pt_sampled, stat_file_path=DPPath(pt_h5, "a")
+            )
+            self.pt_expt_model.compute_or_load_stat(
+                lambda: self.np_sampled, stat_file_path=DPPath(pe_h5, "a")
+            )
+
+            # Save the computed serializations as reference
+            dp_ser_computed = self.dp_model.serialize()
+            pt_ser_computed = self.pt_model.serialize()
+            pe_ser_computed = self.pt_expt_model.serialize()
+
+            # 2. Build fresh models from the same initial weights
+            dp_model2 = get_model_dp(self._model_data)
+            pt_model2 = DOSModelPT.deserialize(dp_model2.serialize())
+            pe_model2 = DOSModelPTExpt.deserialize(dp_model2.serialize())
+
+            # 3. Load stats from file (should NOT call the sampled func)
+            def raise_error():
+                raise RuntimeError("Should load from file, not recompute")
+
+            dp_model2.compute_or_load_stat(
+                raise_error, stat_file_path=DPPath(dp_h5, "a")
+            )
+            pt_model2.compute_or_load_stat(
+                raise_error, stat_file_path=DPPath(pt_h5, "a")
+            )
+            pe_model2.compute_or_load_stat(
+                raise_error, stat_file_path=DPPath(pe_h5, "a")
+            )
+
+            # 4. Loaded models should match the computed ones
+            dp_ser_loaded = dp_model2.serialize()
+            pt_ser_loaded = pt_model2.serialize()
+            pe_ser_loaded = pe_model2.serialize()
+            _compare_variables_recursive(dp_ser_computed, dp_ser_loaded)
+            _compare_variables_recursive(pt_ser_computed, pt_ser_loaded)
+            _compare_variables_recursive(pe_ser_computed, pe_ser_loaded)
+
+            # 5. Cross-backend consistency after loading
+            _compare_variables_recursive(dp_ser_loaded, pt_ser_loaded)
+            _compare_variables_recursive(dp_ser_loaded, pe_ser_loaded)

From fbfd042f8f1e00053deb2a5e2d8eecf1a92ca9b4 Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Wed, 25 Feb 2026 12:09:36 +0800
Subject: [PATCH 32/63] add ut for dp-zbl model

---
 deepmd/dpmodel/descriptor/dpa1.py             |   1 +
 deepmd/dpmodel/model/model.py                 |   3 +
 .../tests/consistent/model/test_zbl_ener.py   | 892 +++++++++++++++++-
 3 files changed, 893 insertions(+), 3 deletions(-)

diff --git a/deepmd/dpmodel/descriptor/dpa1.py b/deepmd/dpmodel/descriptor/dpa1.py
index 2f9aa69b62..b43fb87193 100644
--- a/deepmd/dpmodel/descriptor/dpa1.py
+++ b/deepmd/dpmodel/descriptor/dpa1.py
@@ -707,6 +707,7 @@ def __init__(
             sel = [sel]
         self.sel = sel
         self.nnei = sum(sel)
+        self.ndescrpt = self.nnei * 4
         self.ntypes = ntypes
         self.neuron = neuron
         self.filter_neuron = self.neuron
diff --git a/deepmd/dpmodel/model/model.py b/deepmd/dpmodel/model/model.py
index 339998aa89..b560366457 100644
--- a/deepmd/dpmodel/model/model.py
+++ b/deepmd/dpmodel/model/model.py
@@ -115,9 +115,12 @@ def get_standard_model(data: dict) -> EnergyModel:
 
 
 def get_zbl_model(data: dict) -> DPZBLModel:
+    data = copy.deepcopy(data)
     data["descriptor"]["ntypes"] = len(data["type_map"])
+    data["descriptor"]["type_map"] = data["type_map"]
     descriptor = BaseDescriptor(**data["descriptor"])
     fitting_type = data["fitting_net"].pop("type")
+    data["fitting_net"]["type_map"] = data["type_map"]
     if fitting_type == "ener":
         fitting = EnergyFittingNet(
             ntypes=descriptor.get_ntypes(),
diff --git a/source/tests/consistent/model/test_zbl_ener.py b/source/tests/consistent/model/test_zbl_ener.py
index 88bcd86b2e..2bb7fea2dd 100644
--- a/source/tests/consistent/model/test_zbl_ener.py
+++ b/source/tests/consistent/model/test_zbl_ener.py
@@ -1,4 +1,6 @@
 # SPDX-License-Identifier: LGPL-3.0-or-later
+import copy
+import os
 import unittest
 from typing import (
     Any,
@@ -6,8 +8,18 @@
 
 import numpy as np
 
+from deepmd.dpmodel.common import (
+    to_numpy_array,
+)
 from deepmd.dpmodel.model.dp_zbl_model import DPZBLModel as DPZBLModelDP
 from deepmd.dpmodel.model.model import get_model as get_model_dp
+from deepmd.dpmodel.utils.nlist import (
+    build_neighbor_list,
+    extend_coord_with_ghosts,
+)
+from deepmd.dpmodel.utils.region import (
+    normalize_coord,
+)
 from deepmd.env import (
     GLOBAL_NP_FLOAT_PRECISION,
 )
@@ -27,6 +39,8 @@
 if INSTALLED_PT:
     from deepmd.pt.model.model import get_model as get_model_pt
     from deepmd.pt.model.model.dp_zbl_model import DPZBLModel as DPZBLModelPT
+    from deepmd.pt.utils.utils import to_numpy_array as torch_to_numpy
+    from deepmd.pt.utils.utils import to_torch_tensor as numpy_to_torch
 else:
     DPZBLModelPT = None
 if INSTALLED_JAX:
@@ -35,11 +49,10 @@
 else:
     DPZBLModelJAX = None
 if INSTALLED_PT_EXPT:
+    from deepmd.pt_expt.common import to_torch_array as pt_expt_numpy_to_torch
     from deepmd.pt_expt.model import DPZBLModel as DPZBLModelPTExpt
 else:
     DPZBLModelPTExpt = None
-import os
-
 from deepmd.utils.argcheck import (
     model_args,
 )
@@ -252,7 +265,15 @@ def extract_ret(self, ret: Any, backend) -> tuple[np.ndarray, ...]:
 
 @unittest.skipUnless(INSTALLED_PT and INSTALLED_PT_EXPT, "PyTorch is not installed")
 class TestZBLEnerModelAPIs(unittest.TestCase):
-    """Test translated_output_def consistency across dp, pt, and pt_expt backends."""
+    """Test consistency of model-level APIs between pt and dpmodel backends.
+
+    Both models are constructed from the same serialized weights
+    (dpmodel -> serialize -> pt deserialize) so that numerical outputs
+    can be compared directly.
+
+    DPZBLModel is a linear combination model (DP + ZBL) and does NOT
+    support get_descriptor() or get_fitting_net() at the top level.
+    """
 
     def setUp(self) -> None:
         data = model_args().normalize_value(
@@ -284,16 +305,72 @@ def setUp(self) -> None:
                 "fitting_net": {
                     "neuron": [5, 5],
                     "resnet_dt": True,
+                    "precision": "float64",
                     "seed": 1,
                 },
             },
             trim_pattern="_*",
         )
+        # Build dpmodel first, then deserialize into pt/pt_expt to share weights
         self.dp_model = get_model_dp(data)
         serialized = self.dp_model.serialize()
         self.pt_model = DPZBLModelPT.deserialize(serialized)
         self.pt_expt_model = DPZBLModelPTExpt.deserialize(serialized)
 
+        # Coords / atype / box
+        self.coords = np.array(
+            [
+                12.83,
+                2.56,
+                2.18,
+                12.09,
+                2.87,
+                2.74,
+                00.25,
+                3.32,
+                1.68,
+                3.36,
+                3.00,
+                1.81,
+                3.51,
+                2.51,
+                2.60,
+                4.27,
+                3.22,
+                1.56,
+            ],
+            dtype=GLOBAL_NP_FLOAT_PRECISION,
+        ).reshape(1, -1, 3)
+        self.atype = np.array([0, 1, 1, 0, 1, 1], dtype=np.int32).reshape(1, -1)
+        self.box = np.array(
+            [13.0, 0.0, 0.0, 0.0, 13.0, 0.0, 0.0, 0.0, 13.0],
+            dtype=GLOBAL_NP_FLOAT_PRECISION,
+        ).reshape(1, 9)
+
+        # Build extended coords + nlist for lower-level calls
+        rcut = self.dp_model.get_rcut()
+        sel = self.dp_model.get_sel()
+        nframes, nloc = self.atype.shape[:2]
+        coord_normalized = normalize_coord(
+            self.coords.reshape(nframes, nloc, 3),
+            self.box.reshape(nframes, 3, 3),
+        )
+        extended_coord, extended_atype, mapping = extend_coord_with_ghosts(
+            coord_normalized, self.atype, self.box, rcut
+        )
+        nlist = build_neighbor_list(
+            extended_coord,
+            extended_atype,
+            nloc,
+            rcut,
+            sel,
+            distinguish_types=False,
+        )
+        self.extended_coord = extended_coord.reshape(nframes, -1, 3)
+        self.extended_atype = extended_atype
+        self.mapping = mapping
+        self.nlist = nlist
+
     def test_translated_output_def(self) -> None:
         """translated_output_def should return the same keys on dp, pt, and pt_expt."""
         dp_def = self.dp_model.translated_output_def()
@@ -304,3 +381,812 @@ def test_translated_output_def(self) -> None:
         for key in dp_def:
             self.assertEqual(dp_def[key].shape, pt_def[key].shape)
             self.assertEqual(dp_def[key].shape, pt_expt_def[key].shape)
+
+    def test_get_out_bias(self) -> None:
+        """get_out_bias should return numerically equal values on dp and pt."""
+        dp_bias = to_numpy_array(self.dp_model.get_out_bias())
+        pt_bias = torch_to_numpy(self.pt_model.get_out_bias())
+        np.testing.assert_allclose(dp_bias, pt_bias, rtol=1e-10, atol=1e-10)
+        # Verify shape: ntypes=3 for ZBL model
+        self.assertEqual(dp_bias.shape[1], 3)
+        self.assertGreater(dp_bias.shape[0], 0)
+
+    def test_set_out_bias(self) -> None:
+        """set_out_bias should update the bias on both backends."""
+        dp_bias = to_numpy_array(self.dp_model.get_out_bias())
+        new_bias = dp_bias + 1.0
+        # dp
+        self.dp_model.set_out_bias(new_bias)
+        np.testing.assert_allclose(
+            to_numpy_array(self.dp_model.get_out_bias()),
+            new_bias,
+            rtol=1e-10,
+            atol=1e-10,
+        )
+        # pt
+        self.pt_model.set_out_bias(numpy_to_torch(new_bias))
+        np.testing.assert_allclose(
+            torch_to_numpy(self.pt_model.get_out_bias()),
+            new_bias,
+            rtol=1e-10,
+            atol=1e-10,
+        )
+
+    def test_model_output_def(self) -> None:
+        """model_output_def should return the same keys and shapes on dp and pt."""
+        dp_def = self.dp_model.model_output_def().get_data()
+        pt_def = self.pt_model.model_output_def().get_data()
+        self.assertEqual(set(dp_def.keys()), set(pt_def.keys()))
+        for key in dp_def:
+            self.assertEqual(dp_def[key].shape, pt_def[key].shape)
+
+    def test_model_output_type(self) -> None:
+        """model_output_type should return the same list on dp and pt."""
+        self.assertEqual(
+            self.dp_model.model_output_type(),
+            self.pt_model.model_output_type(),
+        )
+
+    def test_do_grad_r(self) -> None:
+        """do_grad_r should return the same value on dp and pt."""
+        self.assertEqual(
+            self.dp_model.do_grad_r("energy"),
+            self.pt_model.do_grad_r("energy"),
+        )
+        self.assertTrue(self.dp_model.do_grad_r("energy"))
+
+    def test_do_grad_c(self) -> None:
+        """do_grad_c should return the same value on dp and pt."""
+        self.assertEqual(
+            self.dp_model.do_grad_c("energy"),
+            self.pt_model.do_grad_c("energy"),
+        )
+        self.assertTrue(self.dp_model.do_grad_c("energy"))
+
+    def test_get_rcut(self) -> None:
+        """get_rcut should return the same value on dp and pt."""
+        self.assertEqual(self.dp_model.get_rcut(), self.pt_model.get_rcut())
+
+    def test_get_type_map(self) -> None:
+        """get_type_map should return the same list on dp and pt."""
+        self.assertEqual(self.dp_model.get_type_map(), self.pt_model.get_type_map())
+        self.assertEqual(self.dp_model.get_type_map(), ["O", "H", "B"])
+
+    def test_get_sel(self) -> None:
+        """get_sel should return the same list on dp and pt."""
+        self.assertEqual(self.dp_model.get_sel(), self.pt_model.get_sel())
+
+    def test_get_nsel(self) -> None:
+        """get_nsel should return the same value on dp and pt."""
+        self.assertEqual(self.dp_model.get_nsel(), self.pt_model.get_nsel())
+
+    def test_get_nnei(self) -> None:
+        """get_nnei should return the same value on dp and pt."""
+        self.assertEqual(self.dp_model.get_nnei(), self.pt_model.get_nnei())
+
+    def test_mixed_types(self) -> None:
+        """mixed_types should return the same value on dp and pt."""
+        self.assertEqual(self.dp_model.mixed_types(), self.pt_model.mixed_types())
+        # DPZBLModel (LinearEnergyAtomicModel) always uses mixed types
+        self.assertTrue(self.dp_model.mixed_types())
+
+    def test_has_message_passing(self) -> None:
+        """has_message_passing should return the same value on dp and pt."""
+        self.assertEqual(
+            self.dp_model.has_message_passing(),
+            self.pt_model.has_message_passing(),
+        )
+        self.assertFalse(self.dp_model.has_message_passing())
+
+    def test_need_sorted_nlist_for_lower(self) -> None:
+        """need_sorted_nlist_for_lower should return the same value on dp and pt."""
+        self.assertEqual(
+            self.dp_model.need_sorted_nlist_for_lower(),
+            self.pt_model.need_sorted_nlist_for_lower(),
+        )
+
+    def test_get_dim_fparam(self) -> None:
+        """get_dim_fparam should return the same value on dp and pt."""
+        self.assertEqual(self.dp_model.get_dim_fparam(), self.pt_model.get_dim_fparam())
+        self.assertEqual(self.dp_model.get_dim_fparam(), 0)
+
+    def test_get_dim_aparam(self) -> None:
+        """get_dim_aparam should return the same value on dp and pt."""
+        self.assertEqual(self.dp_model.get_dim_aparam(), self.pt_model.get_dim_aparam())
+        self.assertEqual(self.dp_model.get_dim_aparam(), 0)
+
+    def test_get_sel_type(self) -> None:
+        """get_sel_type should return the same list on dp and pt."""
+        self.assertEqual(self.dp_model.get_sel_type(), self.pt_model.get_sel_type())
+
+    def test_is_aparam_nall(self) -> None:
+        """is_aparam_nall should return the same value on dp and pt."""
+        self.assertEqual(self.dp_model.is_aparam_nall(), self.pt_model.is_aparam_nall())
+        self.assertFalse(self.dp_model.is_aparam_nall())
+
+    def test_atomic_output_def(self) -> None:
+        """atomic_output_def should return the same keys and shapes on dp and pt."""
+        dp_def = self.dp_model.atomic_output_def()
+        pt_def = self.pt_model.atomic_output_def()
+        self.assertEqual(set(dp_def.keys()), set(pt_def.keys()))
+        for key in dp_def.keys():
+            self.assertEqual(dp_def[key].shape, pt_def[key].shape)
+
+    def test_get_ntypes(self) -> None:
+        """get_ntypes should return the same value on dp and pt."""
+        self.assertEqual(self.dp_model.get_ntypes(), self.pt_model.get_ntypes())
+        self.assertEqual(self.dp_model.get_ntypes(), 3)
+
+    def test_format_nlist(self) -> None:
+        """format_nlist should produce the same result on dp and pt."""
+        dp_nlist = self.dp_model.format_nlist(
+            self.extended_coord,
+            self.extended_atype,
+            self.nlist,
+        )
+        pt_nlist = torch_to_numpy(
+            self.pt_model.format_nlist(
+                numpy_to_torch(self.extended_coord),
+                numpy_to_torch(self.extended_atype),
+                numpy_to_torch(self.nlist),
+            )
+        )
+        np.testing.assert_equal(dp_nlist, pt_nlist)
+
+    def test_forward_common_atomic(self) -> None:
+        """forward_common_atomic should produce consistent results on dp and pt.
+
+        Compares at the atomic_model level, where both backends define this method.
+        DPZBLModel has no aparam, so we don't pass aparam here.
+        """
+        dp_ret = self.dp_model.atomic_model.forward_common_atomic(
+            self.extended_coord,
+            self.extended_atype,
+            self.nlist,
+            mapping=self.mapping,
+        )
+        pt_ret = self.pt_model.atomic_model.forward_common_atomic(
+            numpy_to_torch(self.extended_coord),
+            numpy_to_torch(self.extended_atype),
+            numpy_to_torch(self.nlist),
+            mapping=numpy_to_torch(self.mapping),
+        )
+        # Compare the common keys
+        common_keys = set(dp_ret.keys()) & set(pt_ret.keys())
+        self.assertTrue(len(common_keys) > 0)
+        for key in common_keys:
+            if dp_ret[key] is not None and pt_ret[key] is not None:
+                np.testing.assert_allclose(
+                    dp_ret[key],
+                    torch_to_numpy(pt_ret[key]),
+                    rtol=1e-10,
+                    atol=1e-10,
+                    err_msg=f"Mismatch in forward_common_atomic key '{key}'",
+                )
+
+    def test_change_out_bias(self) -> None:
+        """change_out_bias (change-by-statistic) should produce consistent bias on dp, pt, and pt_expt.
+
+        DPZBLModel (LinearEnergyAtomicModel) does not support set-by-statistic
+        (no compute_fitting_input_stat), so only change-by-statistic is tested.
+        We first compute initial bias via compute_or_load_out_stat, then verify
+        change-by-statistic updates bias consistently.
+        """
+        nframes = 2
+        rng = np.random.default_rng(123)
+
+        # Use realistic coords (from setUp, tiled for 2 frames)
+        coords_2f = np.tile(self.coords, (nframes, 1, 1))  # (2, 6, 3)
+        atype_2f = np.array([[0, 0, 1, 1, 1, 1], [0, 1, 1, 0, 1, 1]], dtype=np.int32)
+        box_2f = np.tile(self.box.reshape(1, 3, 3), (nframes, 1, 1))
+        # natoms: [nloc, nloc, n_type0, n_type1, n_type2] — 3 types
+        natoms_data = np.array([[6, 6, 2, 4, 0], [6, 6, 2, 4, 0]], dtype=np.int32)
+        energy_data = rng.normal(size=(nframes, 1)).astype(GLOBAL_NP_FLOAT_PRECISION)
+
+        # dpmodel stat data (numpy)
+        dp_merged = [
+            {
+                "coord": coords_2f,
+                "atype": atype_2f,
+                "atype_ext": atype_2f,
+                "box": box_2f,
+                "natoms": natoms_data,
+                "energy": energy_data,
+                "find_energy": np.float32(1.0),
+            }
+        ]
+        # pt stat data (torch tensors)
+        pt_merged = [
+            {
+                "coord": numpy_to_torch(coords_2f),
+                "atype": numpy_to_torch(atype_2f),
+                "atype_ext": numpy_to_torch(atype_2f),
+                "box": numpy_to_torch(box_2f),
+                "natoms": numpy_to_torch(natoms_data),
+                "energy": numpy_to_torch(energy_data),
+                "find_energy": np.float32(1.0),
+            }
+        ]
+        # pt_expt stat data (numpy, same as dp)
+        pe_merged = dp_merged
+
+        # First compute initial bias via compute_or_load_out_stat
+        self.dp_model.atomic_model.compute_or_load_out_stat(dp_merged)
+        self.pt_model.atomic_model.compute_or_load_out_stat(pt_merged)
+        self.pt_expt_model.atomic_model.compute_or_load_out_stat(dp_merged)
+
+        dp_bias_before = to_numpy_array(self.dp_model.get_out_bias()).copy()
+        pt_bias_before = torch_to_numpy(self.pt_model.get_out_bias()).copy()
+        pe_bias_before = to_numpy_array(self.pt_expt_model.get_out_bias()).copy()
+        np.testing.assert_allclose(
+            dp_bias_before, pt_bias_before, rtol=1e-10, atol=1e-10
+        )
+        np.testing.assert_allclose(
+            dp_bias_before, pe_bias_before, rtol=1e-10, atol=1e-10
+        )
+
+        # --- Test "change-by-statistic" mode ---
+        self.dp_model.change_out_bias(dp_merged, bias_adjust_mode="change-by-statistic")
+        self.pt_model.change_out_bias(pt_merged, bias_adjust_mode="change-by-statistic")
+        self.pt_expt_model.change_out_bias(
+            pe_merged, bias_adjust_mode="change-by-statistic"
+        )
+
+        # Verify out bias consistency
+        dp_bias = to_numpy_array(self.dp_model.get_out_bias())
+        pt_bias = torch_to_numpy(self.pt_model.get_out_bias())
+        pe_bias = to_numpy_array(self.pt_expt_model.get_out_bias())
+        np.testing.assert_allclose(dp_bias, pt_bias, rtol=1e-10, atol=1e-10)
+        np.testing.assert_allclose(dp_bias, pe_bias, rtol=1e-10, atol=1e-10)
+
+    # test_change_type_map: NOT applicable — PairTabAtomicModel does not
+    # support changing type map (would require rebuilding the tab file),
+    # so LinearEnergyAtomicModel.change_type_map always fails for DPZBLModel
+    # when the new type_map differs from the original.
+
+    # test_change_type_map_extend_stat: NOT applicable — same reason.
+
+    def test_update_sel(self) -> None:
+        """update_sel should return the same result on dp and pt."""
+        from unittest.mock import (
+            patch,
+        )
+
+        from deepmd.dpmodel.model.dp_model import DPModelCommon as DPModelCommonDP
+        from deepmd.pt.model.model.dp_model import DPModelCommon as DPModelCommonPT
+
+        mock_min_nbor_dist = 0.5
+        mock_sel = [30]
+        local_jdata = {
+            "type_map": ["O", "H", "B"],
+            "use_srtab": f"{TESTS_DIR}/pt/water/data/zbl_tab_potential/H2O_tab_potential.txt",
+            "smin_alpha": 0.1,
+            "sw_rmin": 0.2,
+            "sw_rmax": 4.0,
+            "descriptor": {
+                "type": "se_atten",
+                "sel": "auto",
+                "rcut_smth": 0.5,
+                "rcut": 4.0,
+            },
+            "fitting_net": {
+                "neuron": [5, 5],
+            },
+        }
+        type_map = ["O", "H", "B"]
+
+        with patch(
+            "deepmd.dpmodel.utils.update_sel.UpdateSel.get_nbor_stat",
+            return_value=(mock_min_nbor_dist, mock_sel),
+        ):
+            dp_result, dp_min_dist = DPModelCommonDP.update_sel(
+                None, type_map, local_jdata
+            )
+
+        with patch(
+            "deepmd.pt.utils.update_sel.UpdateSel.get_nbor_stat",
+            return_value=(mock_min_nbor_dist, mock_sel),
+        ):
+            pt_result, pt_min_dist = DPModelCommonPT.update_sel(
+                None, type_map, local_jdata
+            )
+
+        self.assertEqual(dp_result, pt_result)
+        self.assertEqual(dp_min_dist, pt_min_dist)
+        # Verify sel was actually updated (not still "auto")
+        self.assertNotEqual(dp_result["descriptor"]["sel"], "auto")
+
+    def test_compute_or_load_out_stat(self) -> None:
+        """compute_or_load_out_stat should produce consistent bias on dp and pt.
+
+        Tests both the compute path (from data) and the load path (from file).
+        """
+        import tempfile
+        from pathlib import (
+            Path,
+        )
+
+        import h5py
+
+        from deepmd.utils.path import (
+            DPPath,
+        )
+
+        nframes = 2
+        coords_2f = np.tile(self.coords, (nframes, 1, 1))
+        atype_2f = np.array([[0, 0, 1, 1, 1, 1], [0, 1, 1, 0, 1, 1]], dtype=np.int32)
+        box_2f = np.tile(self.box.reshape(1, 3, 3), (nframes, 1, 1))
+        # natoms: [nloc, nloc, n_type0, n_type1, n_type2] — 3 types
+        natoms_data = np.array([[6, 6, 2, 4, 0], [6, 6, 2, 4, 0]], dtype=np.int32)
+        energy_data = np.array([10.0, 20.0]).reshape(nframes, 1)
+
+        dp_merged = [
+            {
+                "coord": coords_2f,
+                "atype": atype_2f,
+                "atype_ext": atype_2f,
+                "box": box_2f,
+                "natoms": natoms_data,
+                "energy": energy_data,
+                "find_energy": np.float32(1.0),
+            }
+        ]
+        pt_merged = [
+            {
+                "coord": numpy_to_torch(coords_2f),
+                "atype": numpy_to_torch(atype_2f),
+                "atype_ext": numpy_to_torch(atype_2f),
+                "box": numpy_to_torch(box_2f),
+                "natoms": numpy_to_torch(natoms_data),
+                "energy": numpy_to_torch(energy_data),
+                "find_energy": np.float32(1.0),
+            }
+        ]
+
+        # Verify bias is initially identical
+        dp_bias_before = to_numpy_array(self.dp_model.get_out_bias()).copy()
+        pt_bias_before = torch_to_numpy(self.pt_model.get_out_bias()).copy()
+        np.testing.assert_allclose(
+            dp_bias_before, pt_bias_before, rtol=1e-10, atol=1e-10
+        )
+
+        with tempfile.TemporaryDirectory() as tmpdir:
+            # Create separate h5 files for dp and pt
+            dp_h5 = str((Path(tmpdir) / "dp_stat.h5").resolve())
+            pt_h5 = str((Path(tmpdir) / "pt_stat.h5").resolve())
+            with h5py.File(dp_h5, "w"):
+                pass
+            with h5py.File(pt_h5, "w"):
+                pass
+            dp_stat_path = DPPath(dp_h5, "a")
+            pt_stat_path = DPPath(pt_h5, "a")
+
+            # 1. Compute stats and save to file
+            self.dp_model.atomic_model.compute_or_load_out_stat(
+                dp_merged, stat_file_path=dp_stat_path
+            )
+            self.pt_model.atomic_model.compute_or_load_out_stat(
+                pt_merged, stat_file_path=pt_stat_path
+            )
+
+            dp_bias_after = to_numpy_array(self.dp_model.get_out_bias())
+            pt_bias_after = torch_to_numpy(self.pt_model.get_out_bias())
+            np.testing.assert_allclose(
+                dp_bias_after, pt_bias_after, rtol=1e-10, atol=1e-10
+            )
+
+            # Verify bias actually changed (not still all zeros)
+            self.assertFalse(
+                np.allclose(dp_bias_after, dp_bias_before),
+                "compute_or_load_out_stat did not change the bias",
+            )
+
+            # 2. Verify both backends saved the same file content
+            with h5py.File(dp_h5, "r") as dp_f, h5py.File(pt_h5, "r") as pt_f:
+                dp_keys = sorted(dp_f.keys())
+                pt_keys = sorted(pt_f.keys())
+                self.assertEqual(dp_keys, pt_keys)
+                for key in dp_keys:
+                    np.testing.assert_allclose(
+                        np.array(dp_f[key]),
+                        np.array(pt_f[key]),
+                        rtol=1e-10,
+                        atol=1e-10,
+                        err_msg=f"Stat file content mismatch for key {key}",
+                    )
+
+            # 3. Reset biases to zero, then load from file
+            zero_bias = np.zeros_like(dp_bias_after)
+            self.dp_model.set_out_bias(zero_bias)
+            self.pt_model.set_out_bias(numpy_to_torch(zero_bias))
+
+            # Use a callable that raises to ensure it loads from file, not recomputes
+            def raise_error():
+                raise RuntimeError("Should not recompute — should load from file")
+
+            self.dp_model.atomic_model.compute_or_load_out_stat(
+                raise_error, stat_file_path=dp_stat_path
+            )
+            self.pt_model.atomic_model.compute_or_load_out_stat(
+                raise_error, stat_file_path=pt_stat_path
+            )
+
+            dp_bias_loaded = to_numpy_array(self.dp_model.get_out_bias())
+            pt_bias_loaded = torch_to_numpy(self.pt_model.get_out_bias())
+
+            # Loaded biases should match between backends
+            np.testing.assert_allclose(
+                dp_bias_loaded, pt_bias_loaded, rtol=1e-10, atol=1e-10
+            )
+            # Loaded biases should match the originally computed biases
+            np.testing.assert_allclose(
+                dp_bias_loaded, dp_bias_after, rtol=1e-10, atol=1e-10
+            )
+
+    def test_get_observed_type_list(self) -> None:
+        """get_observed_type_list should be consistent across dp, pt, pt_expt.
+
+        Uses mock data containing only type 0 ("O") so that types 1 ("H")
+        and 2 ("B") are unobserved and should be absent from the returned list.
+        """
+        nframes = 2
+        natoms = 6
+        # All atoms are type 0 — types 1, 2 are unobserved
+        atype_2f = np.zeros((nframes, natoms), dtype=np.int32)
+        coords_2f = np.tile(self.coords, (nframes, 1, 1))
+        box_2f = np.tile(self.box.reshape(1, 3, 3), (nframes, 1, 1))
+        natoms_data = np.array(
+            [[natoms, natoms, natoms, 0, 0]] * nframes, dtype=np.int32
+        )
+        energy_data = np.array([10.0, 20.0]).reshape(nframes, 1)
+
+        dp_merged = [
+            {
+                "coord": coords_2f,
+                "atype": atype_2f,
+                "atype_ext": atype_2f,
+                "box": box_2f,
+                "natoms": natoms_data,
+                "energy": energy_data,
+                "find_energy": np.float32(1.0),
+            }
+        ]
+        pt_merged = [
+            {
+                "coord": numpy_to_torch(coords_2f),
+                "atype": numpy_to_torch(atype_2f),
+                "atype_ext": numpy_to_torch(atype_2f),
+                "box": numpy_to_torch(box_2f),
+                "natoms": numpy_to_torch(natoms_data),
+                "energy": numpy_to_torch(energy_data),
+                "find_energy": np.float32(1.0),
+            }
+        ]
+
+        self.dp_model.atomic_model.compute_or_load_out_stat(dp_merged)
+        self.pt_model.atomic_model.compute_or_load_out_stat(pt_merged)
+        self.pt_expt_model.atomic_model.compute_or_load_out_stat(dp_merged)
+
+        dp_observed = self.dp_model.get_observed_type_list()
+        pt_observed = self.pt_model.get_observed_type_list()
+        pe_observed = self.pt_expt_model.get_observed_type_list()
+
+        self.assertEqual(dp_observed, pt_observed)
+        self.assertEqual(dp_observed, pe_observed)
+        # Only type 0 ("O") should be observed
+        self.assertEqual(dp_observed, ["O"])
+
+
+def _compare_variables_recursive(
+    d1: dict, d2: dict, path: str = "", rtol: float = 1e-10, atol: float = 1e-10
+) -> None:
+    """Recursively compare ``@variables`` sections in two serialized dicts."""
+    for key in d1:
+        if key not in d2:
+            continue
+        child_path = f"{path}/{key}" if path else key
+        v1, v2 = d1[key], d2[key]
+        if key == "@variables" and isinstance(v1, dict) and isinstance(v2, dict):
+            for vk in v1:
+                if vk not in v2:
+                    continue
+                a1 = np.asarray(v1[vk]) if v1[vk] is not None else None
+                a2 = np.asarray(v2[vk]) if v2[vk] is not None else None
+                if a1 is None and a2 is None:
+                    continue
+                np.testing.assert_allclose(
+                    a1,
+                    a2,
+                    rtol=rtol,
+                    atol=atol,
+                    err_msg=f"@variables mismatch at {child_path}/{vk}",
+                )
+        elif isinstance(v1, dict) and isinstance(v2, dict):
+            _compare_variables_recursive(v1, v2, child_path, rtol, atol)
+
+
+@parameterized(
+    (([], []), ([[0, 1]], [1])),  # (pair_exclude_types, atom_exclude_types)
+)
+@unittest.skipUnless(INSTALLED_PT and INSTALLED_PT_EXPT, "PT and PT_EXPT are required")
+class TestZBLComputeOrLoadStat(unittest.TestCase):
+    """Test that compute_or_load_stat produces identical statistics on dp, pt, and pt_expt.
+
+    Covers descriptor stats (dstd) and output bias for DPZBLModel.
+    Parameterized over exclusion types only (no fparam — LinearEnergyAtomicModel
+    does not expose fitting_net for param stats).
+    """
+
+    def setUp(self) -> None:
+        ((pair_exclude_types, atom_exclude_types),) = self.param
+        data = model_args().normalize_value(
+            {
+                "type_map": ["O", "H", "B"],
+                "use_srtab": f"{TESTS_DIR}/pt/water/data/zbl_tab_potential/H2O_tab_potential.txt",
+                "smin_alpha": 0.1,
+                "sw_rmin": 0.2,
+                "sw_rmax": 4.0,
+                "pair_exclude_types": pair_exclude_types,
+                "atom_exclude_types": atom_exclude_types,
+                "descriptor": {
+                    "type": "se_atten",
+                    "sel": 40,
+                    "rcut_smth": 0.5,
+                    "rcut": 4.0,
+                    "neuron": [3, 6],
+                    "axis_neuron": 2,
+                    "attn": 8,
+                    "attn_layer": 2,
+                    "attn_dotr": True,
+                    "attn_mask": False,
+                    "activation_function": "tanh",
+                    "scaling_factor": 1.0,
+                    "normalize": False,
+                    "temperature": 1.0,
+                    "set_davg_zero": True,
+                    "type_one_side": True,
+                    "seed": 1,
+                },
+                "fitting_net": {
+                    "neuron": [5, 5],
+                    "resnet_dt": True,
+                    "precision": "float64",
+                    "seed": 1,
+                },
+            },
+            trim_pattern="_*",
+        )
+
+        # Save data for reuse in load-from-file test
+        self._model_data = data
+
+        # Build dp model, then deserialize into pt and pt_expt to share weights
+        self.dp_model = get_model_dp(data)
+        serialized = self.dp_model.serialize()
+        self.pt_model = DPZBLModelPT.deserialize(serialized)
+        self.pt_expt_model = DPZBLModelPTExpt.deserialize(serialized)
+
+        # Test coords / atype / box for forward evaluation
+        self.coords = np.array(
+            [
+                12.83,
+                2.56,
+                2.18,
+                12.09,
+                2.87,
+                2.74,
+                0.25,
+                3.32,
+                1.68,
+                3.36,
+                3.00,
+                1.81,
+                3.51,
+                2.51,
+                2.60,
+                4.27,
+                3.22,
+                1.56,
+            ],
+            dtype=GLOBAL_NP_FLOAT_PRECISION,
+        ).reshape(1, -1, 3)
+        self.atype = np.array([0, 1, 1, 0, 1, 1], dtype=np.int32).reshape(1, -1)
+        self.box = np.array(
+            [13.0, 0.0, 0.0, 0.0, 13.0, 0.0, 0.0, 0.0, 13.0],
+            dtype=GLOBAL_NP_FLOAT_PRECISION,
+        ).reshape(1, 9)
+
+        # Mock training data for compute_or_load_stat
+        natoms = 6
+        nframes = 3
+        rng = np.random.default_rng(42)
+        coords_stat = rng.normal(size=(nframes, natoms, 3)).astype(
+            GLOBAL_NP_FLOAT_PRECISION
+        )
+        atype_stat = np.array([[0, 0, 1, 1, 1, 1]] * nframes, dtype=np.int32)
+        box_stat = np.tile(
+            np.eye(3, dtype=GLOBAL_NP_FLOAT_PRECISION).reshape(1, 3, 3) * 13.0,
+            (nframes, 1, 1),
+        )
+        natoms_stat = np.array(
+            [[natoms, natoms, 2, 4, 0]] * nframes, dtype=np.int32
+        )  # 3 types: O=2, H=4, B=0
+        energy_stat = rng.normal(size=(nframes, 1)).astype(GLOBAL_NP_FLOAT_PRECISION)
+
+        # dp / pt_expt sample (numpy)
+        np_sample = {
+            "coord": coords_stat,
+            "atype": atype_stat,
+            "atype_ext": atype_stat,
+            "box": box_stat,
+            "natoms": natoms_stat,
+            "energy": energy_stat,
+            "find_energy": np.float32(1.0),
+        }
+        # pt sample (torch tensors)
+        pt_sample = {
+            "coord": numpy_to_torch(coords_stat),
+            "atype": numpy_to_torch(atype_stat),
+            "atype_ext": numpy_to_torch(atype_stat),
+            "box": numpy_to_torch(box_stat),
+            "natoms": numpy_to_torch(natoms_stat),
+            "energy": numpy_to_torch(energy_stat),
+            "find_energy": np.float32(1.0),
+        }
+
+        self.np_sampled = [np_sample]
+        self.pt_sampled = [pt_sample]
+
+    def _eval_dp(self) -> dict:
+        return self.dp_model(self.coords, self.atype, box=self.box)
+
+    def _eval_pt(self) -> dict:
+        return {
+            kk: torch_to_numpy(vv)
+            for kk, vv in self.pt_model(
+                numpy_to_torch(self.coords),
+                numpy_to_torch(self.atype),
+                box=numpy_to_torch(self.box),
+                do_atomic_virial=True,
+            ).items()
+        }
+
+    def _eval_pt_expt(self) -> dict:
+        coord_t = pt_expt_numpy_to_torch(self.coords)
+        coord_t.requires_grad_(True)
+        return {
+            k: v.detach().cpu().numpy()
+            for k, v in self.pt_expt_model(
+                coord_t,
+                pt_expt_numpy_to_torch(self.atype),
+                box=pt_expt_numpy_to_torch(self.box),
+                do_atomic_virial=True,
+            ).items()
+        }
+
+    def test_compute_stat(self) -> None:
+        # 1. Pre-stat forward consistency
+        dp_ret0 = self._eval_dp()
+        pt_ret0 = self._eval_pt()
+        pe_ret0 = self._eval_pt_expt()
+        for key in ("energy", "atom_energy"):
+            np.testing.assert_allclose(
+                dp_ret0[key],
+                pt_ret0[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"Pre-stat dp vs pt mismatch in {key}",
+            )
+            np.testing.assert_allclose(
+                dp_ret0[key],
+                pe_ret0[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"Pre-stat dp vs pt_expt mismatch in {key}",
+            )
+
+        # 2. Run compute_or_load_stat on all three backends
+        # deepcopy samples: the ZBL model's stat path mutates natoms in-place
+        # (stat.py applies atom_exclude_types mask via natoms[:, 2:] *= type_mask),
+        # so each backend must receive its own copy.
+        self.dp_model.compute_or_load_stat(lambda: copy.deepcopy(self.np_sampled))
+        self.pt_model.compute_or_load_stat(lambda: copy.deepcopy(self.pt_sampled))
+        self.pt_expt_model.compute_or_load_stat(lambda: copy.deepcopy(self.np_sampled))
+
+        # 3. Serialize all three and compare @variables
+        dp_ser = self.dp_model.serialize()
+        pt_ser = self.pt_model.serialize()
+        pe_ser = self.pt_expt_model.serialize()
+        _compare_variables_recursive(dp_ser, pt_ser)
+        _compare_variables_recursive(dp_ser, pe_ser)
+
+        # 4. Post-stat forward consistency
+        dp_ret1 = self._eval_dp()
+        pt_ret1 = self._eval_pt()
+        pe_ret1 = self._eval_pt_expt()
+        for key in ("energy", "atom_energy"):
+            np.testing.assert_allclose(
+                dp_ret1[key],
+                pt_ret1[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"Post-stat dp vs pt mismatch in {key}",
+            )
+            np.testing.assert_allclose(
+                dp_ret1[key],
+                pe_ret1[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"Post-stat dp vs pt_expt mismatch in {key}",
+            )
+
+    def test_load_stat_from_file(self) -> None:
+        import tempfile
+        from pathlib import (
+            Path,
+        )
+
+        import h5py
+
+        from deepmd.utils.path import (
+            DPPath,
+        )
+
+        with tempfile.TemporaryDirectory() as tmpdir:
+            # Create separate stat files for each backend
+            dp_h5 = str((Path(tmpdir) / "dp_stat.h5").resolve())
+            pt_h5 = str((Path(tmpdir) / "pt_stat.h5").resolve())
+            pe_h5 = str((Path(tmpdir) / "pe_stat.h5").resolve())
+            for p in (dp_h5, pt_h5, pe_h5):
+                with h5py.File(p, "w"):
+                    pass
+
+            # 1. Compute stats and save to file (deepcopy: stat path mutates natoms)
+            self.dp_model.compute_or_load_stat(
+                lambda: copy.deepcopy(self.np_sampled),
+                stat_file_path=DPPath(dp_h5, "a"),
+            )
+            self.pt_model.compute_or_load_stat(
+                lambda: copy.deepcopy(self.pt_sampled),
+                stat_file_path=DPPath(pt_h5, "a"),
+            )
+            self.pt_expt_model.compute_or_load_stat(
+                lambda: copy.deepcopy(self.np_sampled),
+                stat_file_path=DPPath(pe_h5, "a"),
+            )
+
+            # Save the computed serializations as reference
+            dp_ser_computed = self.dp_model.serialize()
+            pt_ser_computed = self.pt_model.serialize()
+            pe_ser_computed = self.pt_expt_model.serialize()
+
+            # 2. Build fresh models from the same initial weights
+            dp_model2 = get_model_dp(self._model_data)
+            pt_model2 = DPZBLModelPT.deserialize(dp_model2.serialize())
+            pe_model2 = DPZBLModelPTExpt.deserialize(dp_model2.serialize())
+
+            # 3. Load stats from file (should NOT call the sampled func)
+            def raise_error():
+                raise RuntimeError("Should load from file, not recompute")
+
+            dp_model2.compute_or_load_stat(
+                raise_error, stat_file_path=DPPath(dp_h5, "a")
+            )
+            pt_model2.compute_or_load_stat(
+                raise_error, stat_file_path=DPPath(pt_h5, "a")
+            )
+            pe_model2.compute_or_load_stat(
+                raise_error, stat_file_path=DPPath(pe_h5, "a")
+            )
+
+            # 4. Loaded models should match the computed ones
+            dp_ser_loaded = dp_model2.serialize()
+            pt_ser_loaded = pt_model2.serialize()
+            pe_ser_loaded = pe_model2.serialize()
+            _compare_variables_recursive(dp_ser_computed, dp_ser_loaded)
+            _compare_variables_recursive(pt_ser_computed, pt_ser_loaded)
+            _compare_variables_recursive(pe_ser_computed, pe_ser_loaded)
+
+            # 5. Cross-backend consistency after loading
+            _compare_variables_recursive(dp_ser_loaded, pt_ser_loaded)
+            _compare_variables_recursive(dp_ser_loaded, pe_ser_loaded)

From b49a10f6744f0ce8fa6626563d476f387836c481 Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Wed, 25 Feb 2026 12:18:11 +0800
Subject: [PATCH 33/63] add test_get_model_def_script test_get_min_nbor_dist
 test_set_case_embd to model tests

---
 source/tests/consistent/model/test_dipole.py  | 122 ++++++++++++++++
 source/tests/consistent/model/test_dos.py     | 123 ++++++++++++++++
 source/tests/consistent/model/test_polar.py   | 122 ++++++++++++++++
 .../tests/consistent/model/test_property.py   | 123 ++++++++++++++++
 .../tests/consistent/model/test_zbl_ener.py   | 132 ++++++++++++++++++
 5 files changed, 622 insertions(+)

diff --git a/source/tests/consistent/model/test_dipole.py b/source/tests/consistent/model/test_dipole.py
index 03468f9d04..b75101228d 100644
--- a/source/tests/consistent/model/test_dipole.py
+++ b/source/tests/consistent/model/test_dipole.py
@@ -508,6 +508,128 @@ def test_is_aparam_nall(self) -> None:
         self.assertEqual(self.dp_model.is_aparam_nall(), self.pt_model.is_aparam_nall())
         self.assertFalse(self.dp_model.is_aparam_nall())
 
+    def test_get_model_def_script(self) -> None:
+        """get_model_def_script should return the same value on dp, pt, and pt_expt."""
+        dp_val = self.dp_model.get_model_def_script()
+        pt_val = self.pt_model.get_model_def_script()
+        pe_val = self.pt_expt_model.get_model_def_script()
+        self.assertEqual(dp_val, pt_val)
+        self.assertEqual(dp_val, pe_val)
+
+    def test_get_min_nbor_dist(self) -> None:
+        """get_min_nbor_dist should return the same value on dp, pt, and pt_expt."""
+        dp_val = self.dp_model.get_min_nbor_dist()
+        pt_val = self.pt_model.get_min_nbor_dist()
+        pe_val = self.pt_expt_model.get_min_nbor_dist()
+        self.assertEqual(dp_val, pt_val)
+        self.assertEqual(dp_val, pe_val)
+
+    def test_set_case_embd(self) -> None:
+        """set_case_embd should produce consistent results across backends.
+
+        Also verifies that different case indices produce different outputs,
+        confirming the embedding is actually used.
+        """
+        from deepmd.utils.argcheck import (
+            model_args,
+        )
+
+        # Build a model with dim_case_embd > 0
+        data = model_args().normalize_value(
+            {
+                "type_map": ["O", "H"],
+                "descriptor": {
+                    "type": "se_e2_a",
+                    "sel": [20, 20],
+                    "rcut_smth": 0.50,
+                    "rcut": 6.00,
+                    "neuron": [3, 6],
+                    "resnet_dt": False,
+                    "axis_neuron": 2,
+                    "precision": "float64",
+                    "type_one_side": True,
+                    "seed": 1,
+                },
+                "fitting_net": {
+                    "type": "dipole",
+                    "neuron": [5, 5],
+                    "resnet_dt": True,
+                    "precision": "float64",
+                    "seed": 1,
+                    "dim_case_embd": 3,
+                },
+            },
+            trim_pattern="_*",
+        )
+        dp_model = get_model_dp(data)
+        serialized = dp_model.serialize()
+        pt_model = DipoleModelPT.deserialize(serialized)
+        pe_model = DipoleModelPTExpt.deserialize(serialized)
+
+        def _eval(case_idx):
+            dp_model.set_case_embd(case_idx)
+            pt_model.set_case_embd(case_idx)
+            pe_model.set_case_embd(case_idx)
+            dp_ret = dp_model(self.coords, self.atype, box=self.box)
+            pt_ret = {
+                k: torch_to_numpy(v)
+                for k, v in pt_model(
+                    numpy_to_torch(self.coords),
+                    numpy_to_torch(self.atype),
+                    box=numpy_to_torch(self.box),
+                ).items()
+            }
+            coord_t = pt_expt_numpy_to_torch(self.coords)
+            coord_t.requires_grad_(True)
+            pe_ret = {
+                k: v.detach().cpu().numpy()
+                for k, v in pe_model(
+                    coord_t,
+                    pt_expt_numpy_to_torch(self.atype),
+                    box=pt_expt_numpy_to_torch(self.box),
+                ).items()
+            }
+            return dp_ret, pt_ret, pe_ret
+
+        dp0, pt0, pe0 = _eval(0)
+        dp1, pt1, pe1 = _eval(1)
+
+        # Cross-backend consistency for each case index
+        for key in ("dipole", "global_dipole"):
+            np.testing.assert_allclose(
+                dp0[key],
+                pt0[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"case 0: dp vs pt mismatch in {key}",
+            )
+            np.testing.assert_allclose(
+                dp0[key],
+                pe0[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"case 0: dp vs pt_expt mismatch in {key}",
+            )
+            np.testing.assert_allclose(
+                dp1[key],
+                pt1[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"case 1: dp vs pt mismatch in {key}",
+            )
+            np.testing.assert_allclose(
+                dp1[key],
+                pe1[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"case 1: dp vs pt_expt mismatch in {key}",
+            )
+        # Different case indices should produce different outputs
+        self.assertFalse(
+            np.allclose(dp0["global_dipole"], dp1["global_dipole"]),
+            "set_case_embd(0) and set_case_embd(1) produced the same global_dipole",
+        )
+
     def test_atomic_output_def(self) -> None:
         """atomic_output_def should return the same keys and shapes on dp and pt."""
         dp_def = self.dp_model.atomic_output_def()
diff --git a/source/tests/consistent/model/test_dos.py b/source/tests/consistent/model/test_dos.py
index 9c5939b03b..125ba2a5fe 100644
--- a/source/tests/consistent/model/test_dos.py
+++ b/source/tests/consistent/model/test_dos.py
@@ -491,6 +491,129 @@ def test_is_aparam_nall(self) -> None:
         self.assertEqual(self.dp_model.is_aparam_nall(), self.pt_model.is_aparam_nall())
         self.assertFalse(self.dp_model.is_aparam_nall())
 
+    def test_get_model_def_script(self) -> None:
+        """get_model_def_script should return the same value on dp, pt, and pt_expt."""
+        dp_val = self.dp_model.get_model_def_script()
+        pt_val = self.pt_model.get_model_def_script()
+        pe_val = self.pt_expt_model.get_model_def_script()
+        self.assertEqual(dp_val, pt_val)
+        self.assertEqual(dp_val, pe_val)
+
+    def test_get_min_nbor_dist(self) -> None:
+        """get_min_nbor_dist should return the same value on dp, pt, and pt_expt."""
+        dp_val = self.dp_model.get_min_nbor_dist()
+        pt_val = self.pt_model.get_min_nbor_dist()
+        pe_val = self.pt_expt_model.get_min_nbor_dist()
+        self.assertEqual(dp_val, pt_val)
+        self.assertEqual(dp_val, pe_val)
+
+    def test_set_case_embd(self) -> None:
+        """set_case_embd should produce consistent results across backends.
+
+        Also verifies that different case indices produce different outputs,
+        confirming the embedding is actually used.
+        """
+        from deepmd.utils.argcheck import (
+            model_args,
+        )
+
+        # Build a model with dim_case_embd > 0
+        data = model_args().normalize_value(
+            {
+                "type_map": ["O", "H"],
+                "descriptor": {
+                    "type": "se_e2_a",
+                    "sel": [20, 20],
+                    "rcut_smth": 0.50,
+                    "rcut": 6.00,
+                    "neuron": [3, 6],
+                    "resnet_dt": False,
+                    "axis_neuron": 2,
+                    "precision": "float64",
+                    "type_one_side": True,
+                    "seed": 1,
+                },
+                "fitting_net": {
+                    "type": "dos",
+                    "numb_dos": 2,
+                    "neuron": [5, 5],
+                    "resnet_dt": True,
+                    "precision": "float64",
+                    "seed": 1,
+                    "dim_case_embd": 3,
+                },
+            },
+            trim_pattern="_*",
+        )
+        dp_model = get_model_dp(data)
+        serialized = dp_model.serialize()
+        pt_model = DOSModelPT.deserialize(serialized)
+        pe_model = DOSModelPTExpt.deserialize(serialized)
+
+        def _eval(case_idx):
+            dp_model.set_case_embd(case_idx)
+            pt_model.set_case_embd(case_idx)
+            pe_model.set_case_embd(case_idx)
+            dp_ret = dp_model(self.coords, self.atype, box=self.box)
+            pt_ret = {
+                k: torch_to_numpy(v)
+                for k, v in pt_model(
+                    numpy_to_torch(self.coords),
+                    numpy_to_torch(self.atype),
+                    box=numpy_to_torch(self.box),
+                ).items()
+            }
+            coord_t = pt_expt_numpy_to_torch(self.coords)
+            coord_t.requires_grad_(True)
+            pe_ret = {
+                k: v.detach().cpu().numpy()
+                for k, v in pe_model(
+                    coord_t,
+                    pt_expt_numpy_to_torch(self.atype),
+                    box=pt_expt_numpy_to_torch(self.box),
+                ).items()
+            }
+            return dp_ret, pt_ret, pe_ret
+
+        dp0, pt0, pe0 = _eval(0)
+        dp1, pt1, pe1 = _eval(1)
+
+        # Cross-backend consistency for each case index
+        for key in ("dos", "atom_dos"):
+            np.testing.assert_allclose(
+                dp0[key],
+                pt0[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"case 0: dp vs pt mismatch in {key}",
+            )
+            np.testing.assert_allclose(
+                dp0[key],
+                pe0[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"case 0: dp vs pt_expt mismatch in {key}",
+            )
+            np.testing.assert_allclose(
+                dp1[key],
+                pt1[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"case 1: dp vs pt mismatch in {key}",
+            )
+            np.testing.assert_allclose(
+                dp1[key],
+                pe1[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"case 1: dp vs pt_expt mismatch in {key}",
+            )
+        # Different case indices should produce different outputs
+        self.assertFalse(
+            np.allclose(dp0["dos"], dp1["dos"]),
+            "set_case_embd(0) and set_case_embd(1) produced the same dos",
+        )
+
     def test_atomic_output_def(self) -> None:
         """atomic_output_def should return the same keys and shapes on dp and pt."""
         dp_def = self.dp_model.atomic_output_def()
diff --git a/source/tests/consistent/model/test_polar.py b/source/tests/consistent/model/test_polar.py
index 7d2136bac3..46162a39e9 100644
--- a/source/tests/consistent/model/test_polar.py
+++ b/source/tests/consistent/model/test_polar.py
@@ -502,6 +502,128 @@ def test_is_aparam_nall(self) -> None:
         self.assertEqual(self.dp_model.is_aparam_nall(), self.pt_model.is_aparam_nall())
         self.assertFalse(self.dp_model.is_aparam_nall())
 
+    def test_get_model_def_script(self) -> None:
+        """get_model_def_script should return the same value on dp, pt, and pt_expt."""
+        dp_val = self.dp_model.get_model_def_script()
+        pt_val = self.pt_model.get_model_def_script()
+        pe_val = self.pt_expt_model.get_model_def_script()
+        self.assertEqual(dp_val, pt_val)
+        self.assertEqual(dp_val, pe_val)
+
+    def test_get_min_nbor_dist(self) -> None:
+        """get_min_nbor_dist should return the same value on dp, pt, and pt_expt."""
+        dp_val = self.dp_model.get_min_nbor_dist()
+        pt_val = self.pt_model.get_min_nbor_dist()
+        pe_val = self.pt_expt_model.get_min_nbor_dist()
+        self.assertEqual(dp_val, pt_val)
+        self.assertEqual(dp_val, pe_val)
+
+    def test_set_case_embd(self) -> None:
+        """set_case_embd should produce consistent results across backends.
+
+        Also verifies that different case indices produce different outputs,
+        confirming the embedding is actually used.
+        """
+        from deepmd.utils.argcheck import (
+            model_args,
+        )
+
+        # Build a model with dim_case_embd > 0
+        data = model_args().normalize_value(
+            {
+                "type_map": ["O", "H"],
+                "descriptor": {
+                    "type": "se_e2_a",
+                    "sel": [20, 20],
+                    "rcut_smth": 0.50,
+                    "rcut": 6.00,
+                    "neuron": [3, 6],
+                    "resnet_dt": False,
+                    "axis_neuron": 2,
+                    "precision": "float64",
+                    "type_one_side": True,
+                    "seed": 1,
+                },
+                "fitting_net": {
+                    "type": "polar",
+                    "neuron": [5, 5],
+                    "resnet_dt": True,
+                    "precision": "float64",
+                    "seed": 1,
+                    "dim_case_embd": 3,
+                },
+            },
+            trim_pattern="_*",
+        )
+        dp_model = get_model_dp(data)
+        serialized = dp_model.serialize()
+        pt_model = PolarModelPT.deserialize(serialized)
+        pe_model = PolarModelPTExpt.deserialize(serialized)
+
+        def _eval(case_idx):
+            dp_model.set_case_embd(case_idx)
+            pt_model.set_case_embd(case_idx)
+            pe_model.set_case_embd(case_idx)
+            dp_ret = dp_model(self.coords, self.atype, box=self.box)
+            pt_ret = {
+                k: torch_to_numpy(v)
+                for k, v in pt_model(
+                    numpy_to_torch(self.coords),
+                    numpy_to_torch(self.atype),
+                    box=numpy_to_torch(self.box),
+                ).items()
+            }
+            coord_t = pt_expt_numpy_to_torch(self.coords)
+            coord_t.requires_grad_(True)
+            pe_ret = {
+                k: v.detach().cpu().numpy()
+                for k, v in pe_model(
+                    coord_t,
+                    pt_expt_numpy_to_torch(self.atype),
+                    box=pt_expt_numpy_to_torch(self.box),
+                ).items()
+            }
+            return dp_ret, pt_ret, pe_ret
+
+        dp0, pt0, pe0 = _eval(0)
+        dp1, pt1, pe1 = _eval(1)
+
+        # Cross-backend consistency for each case index
+        for key in ("polar", "global_polar"):
+            np.testing.assert_allclose(
+                dp0[key],
+                pt0[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"case 0: dp vs pt mismatch in {key}",
+            )
+            np.testing.assert_allclose(
+                dp0[key],
+                pe0[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"case 0: dp vs pt_expt mismatch in {key}",
+            )
+            np.testing.assert_allclose(
+                dp1[key],
+                pt1[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"case 1: dp vs pt mismatch in {key}",
+            )
+            np.testing.assert_allclose(
+                dp1[key],
+                pe1[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"case 1: dp vs pt_expt mismatch in {key}",
+            )
+        # Different case indices should produce different outputs
+        self.assertFalse(
+            np.allclose(dp0["global_polar"], dp1["global_polar"]),
+            "set_case_embd(0) and set_case_embd(1) produced the same global_polar",
+        )
+
     def test_atomic_output_def(self) -> None:
         """atomic_output_def should return the same keys and shapes on dp and pt."""
         dp_def = self.dp_model.atomic_output_def()
diff --git a/source/tests/consistent/model/test_property.py b/source/tests/consistent/model/test_property.py
index d3829fbad7..47d90eae4b 100644
--- a/source/tests/consistent/model/test_property.py
+++ b/source/tests/consistent/model/test_property.py
@@ -488,6 +488,129 @@ def test_is_aparam_nall(self) -> None:
         self.assertEqual(self.dp_model.is_aparam_nall(), self.pt_model.is_aparam_nall())
         self.assertFalse(self.dp_model.is_aparam_nall())
 
+    def test_get_model_def_script(self) -> None:
+        """get_model_def_script should return the same value on dp, pt, and pt_expt."""
+        dp_val = self.dp_model.get_model_def_script()
+        pt_val = self.pt_model.get_model_def_script()
+        pe_val = self.pt_expt_model.get_model_def_script()
+        self.assertEqual(dp_val, pt_val)
+        self.assertEqual(dp_val, pe_val)
+
+    def test_get_min_nbor_dist(self) -> None:
+        """get_min_nbor_dist should return the same value on dp, pt, and pt_expt."""
+        dp_val = self.dp_model.get_min_nbor_dist()
+        pt_val = self.pt_model.get_min_nbor_dist()
+        pe_val = self.pt_expt_model.get_min_nbor_dist()
+        self.assertEqual(dp_val, pt_val)
+        self.assertEqual(dp_val, pe_val)
+
+    def test_set_case_embd(self) -> None:
+        """set_case_embd should produce consistent results across backends.
+
+        Also verifies that different case indices produce different outputs,
+        confirming the embedding is actually used.
+        """
+        from deepmd.utils.argcheck import (
+            model_args,
+        )
+
+        # Build a model with dim_case_embd > 0
+        data = model_args().normalize_value(
+            {
+                "type_map": ["O", "H"],
+                "descriptor": {
+                    "type": "se_e2_a",
+                    "sel": [20, 20],
+                    "rcut_smth": 0.50,
+                    "rcut": 6.00,
+                    "neuron": [3, 6],
+                    "resnet_dt": False,
+                    "axis_neuron": 2,
+                    "precision": "float64",
+                    "type_one_side": True,
+                    "seed": 1,
+                },
+                "fitting_net": {
+                    "type": "property",
+                    "property_name": "foo",
+                    "neuron": [5, 5],
+                    "resnet_dt": True,
+                    "precision": "float64",
+                    "seed": 1,
+                    "dim_case_embd": 3,
+                },
+            },
+            trim_pattern="_*",
+        )
+        dp_model = get_model_dp(data)
+        serialized = dp_model.serialize()
+        pt_model = PropertyModelPT.deserialize(serialized)
+        pe_model = PropertyModelPTExpt.deserialize(serialized)
+
+        def _eval(case_idx):
+            dp_model.set_case_embd(case_idx)
+            pt_model.set_case_embd(case_idx)
+            pe_model.set_case_embd(case_idx)
+            dp_ret = dp_model(self.coords, self.atype, box=self.box)
+            pt_ret = {
+                k: torch_to_numpy(v)
+                for k, v in pt_model(
+                    numpy_to_torch(self.coords),
+                    numpy_to_torch(self.atype),
+                    box=numpy_to_torch(self.box),
+                ).items()
+            }
+            coord_t = pt_expt_numpy_to_torch(self.coords)
+            coord_t.requires_grad_(True)
+            pe_ret = {
+                k: v.detach().cpu().numpy()
+                for k, v in pe_model(
+                    coord_t,
+                    pt_expt_numpy_to_torch(self.atype),
+                    box=pt_expt_numpy_to_torch(self.box),
+                ).items()
+            }
+            return dp_ret, pt_ret, pe_ret
+
+        dp0, pt0, pe0 = _eval(0)
+        dp1, pt1, pe1 = _eval(1)
+
+        # Cross-backend consistency for each case index
+        for key in ("foo", "atom_foo"):
+            np.testing.assert_allclose(
+                dp0[key],
+                pt0[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"case 0: dp vs pt mismatch in {key}",
+            )
+            np.testing.assert_allclose(
+                dp0[key],
+                pe0[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"case 0: dp vs pt_expt mismatch in {key}",
+            )
+            np.testing.assert_allclose(
+                dp1[key],
+                pt1[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"case 1: dp vs pt mismatch in {key}",
+            )
+            np.testing.assert_allclose(
+                dp1[key],
+                pe1[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"case 1: dp vs pt_expt mismatch in {key}",
+            )
+        # Different case indices should produce different outputs
+        self.assertFalse(
+            np.allclose(dp0["foo"], dp1["foo"]),
+            "set_case_embd(0) and set_case_embd(1) produced the same foo",
+        )
+
     def test_atomic_output_def(self) -> None:
         """atomic_output_def should return the same keys and shapes on dp and pt."""
         dp_def = self.dp_model.atomic_output_def()
diff --git a/source/tests/consistent/model/test_zbl_ener.py b/source/tests/consistent/model/test_zbl_ener.py
index 2bb7fea2dd..3d4327a7db 100644
--- a/source/tests/consistent/model/test_zbl_ener.py
+++ b/source/tests/consistent/model/test_zbl_ener.py
@@ -504,6 +504,138 @@ def test_is_aparam_nall(self) -> None:
         self.assertEqual(self.dp_model.is_aparam_nall(), self.pt_model.is_aparam_nall())
         self.assertFalse(self.dp_model.is_aparam_nall())
 
+    def test_get_model_def_script(self) -> None:
+        """get_model_def_script should return the same value on dp, pt, and pt_expt."""
+        dp_val = self.dp_model.get_model_def_script()
+        pt_val = self.pt_model.get_model_def_script()
+        pe_val = self.pt_expt_model.get_model_def_script()
+        self.assertEqual(dp_val, pt_val)
+        self.assertEqual(dp_val, pe_val)
+
+    def test_get_min_nbor_dist(self) -> None:
+        """get_min_nbor_dist should return the same value on dp, pt, and pt_expt."""
+        dp_val = self.dp_model.get_min_nbor_dist()
+        pt_val = self.pt_model.get_min_nbor_dist()
+        pe_val = self.pt_expt_model.get_min_nbor_dist()
+        self.assertEqual(dp_val, pt_val)
+        self.assertEqual(dp_val, pe_val)
+
+    def test_set_case_embd(self) -> None:
+        """set_case_embd should produce consistent results across backends.
+
+        Also verifies that different case indices produce different outputs,
+        confirming the embedding is actually used.
+        """
+        from deepmd.utils.argcheck import (
+            model_args,
+        )
+
+        # Build a model with dim_case_embd > 0
+        data = model_args().normalize_value(
+            {
+                "type_map": ["O", "H", "B"],
+                "use_srtab": f"{TESTS_DIR}/pt/water/data/zbl_tab_potential/H2O_tab_potential.txt",
+                "smin_alpha": 0.1,
+                "sw_rmin": 0.2,
+                "sw_rmax": 4.0,
+                "descriptor": {
+                    "type": "se_atten",
+                    "sel": 40,
+                    "rcut_smth": 0.5,
+                    "rcut": 4.0,
+                    "neuron": [3, 6],
+                    "axis_neuron": 2,
+                    "attn": 8,
+                    "attn_layer": 2,
+                    "attn_dotr": True,
+                    "attn_mask": False,
+                    "activation_function": "tanh",
+                    "scaling_factor": 1.0,
+                    "normalize": False,
+                    "temperature": 1.0,
+                    "set_davg_zero": True,
+                    "type_one_side": True,
+                    "seed": 1,
+                },
+                "fitting_net": {
+                    "neuron": [5, 5],
+                    "resnet_dt": True,
+                    "precision": "float64",
+                    "seed": 1,
+                    "dim_case_embd": 3,
+                },
+            },
+            trim_pattern="_*",
+        )
+        dp_model = get_model_dp(data)
+        serialized = dp_model.serialize()
+        pt_model = DPZBLModelPT.deserialize(serialized)
+        pe_model = DPZBLModelPTExpt.deserialize(serialized)
+
+        def _eval(case_idx):
+            dp_model.set_case_embd(case_idx)
+            pt_model.set_case_embd(case_idx)
+            pe_model.set_case_embd(case_idx)
+            dp_ret = dp_model(self.coords, self.atype, box=self.box)
+            pt_ret = {
+                k: torch_to_numpy(v)
+                for k, v in pt_model(
+                    numpy_to_torch(self.coords),
+                    numpy_to_torch(self.atype),
+                    box=numpy_to_torch(self.box),
+                ).items()
+            }
+            coord_t = pt_expt_numpy_to_torch(self.coords)
+            coord_t.requires_grad_(True)
+            pe_ret = {
+                k: v.detach().cpu().numpy()
+                for k, v in pe_model(
+                    coord_t,
+                    pt_expt_numpy_to_torch(self.atype),
+                    box=pt_expt_numpy_to_torch(self.box),
+                ).items()
+            }
+            return dp_ret, pt_ret, pe_ret
+
+        dp0, pt0, pe0 = _eval(0)
+        dp1, pt1, pe1 = _eval(1)
+
+        # Cross-backend consistency for each case index
+        for key in ("energy", "atom_energy"):
+            np.testing.assert_allclose(
+                dp0[key],
+                pt0[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"case 0: dp vs pt mismatch in {key}",
+            )
+            np.testing.assert_allclose(
+                dp0[key],
+                pe0[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"case 0: dp vs pt_expt mismatch in {key}",
+            )
+            np.testing.assert_allclose(
+                dp1[key],
+                pt1[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"case 1: dp vs pt mismatch in {key}",
+            )
+            np.testing.assert_allclose(
+                dp1[key],
+                pe1[key],
+                rtol=1e-10,
+                atol=1e-10,
+                err_msg=f"case 1: dp vs pt_expt mismatch in {key}",
+            )
+        # Different case indices should produce different outputs
+        self.assertFalse(
+            np.allclose(dp0["energy"], dp1["energy"]),
+            "set_case_embd(0) and set_case_embd(1) produced the same energy",
+        )
+
     def test_atomic_output_def(self) -> None:
         """atomic_output_def should return the same keys and shapes on dp and pt."""
         dp_def = self.dp_model.atomic_output_def()

From d42c8d8ff8ef5de3a1983e87b6d7a319d6ee0e7c Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Wed, 25 Feb 2026 12:04:05 +0800
Subject: [PATCH 34/63] chore(pt): mv the input stat update to
 model_change_out_bias to keep the logic of change_out_bias clean

---
 deepmd/pt/model/model/make_model.py |   2 -
 deepmd/pt/train/training.py         |   7 ++
 source/tests/pt/test_training.py    | 118 ++++++++++++++++++++++++++++
 3 files changed, 125 insertions(+), 2 deletions(-)

diff --git a/deepmd/pt/model/model/make_model.py b/deepmd/pt/model/model/make_model.py
index 1cd7f3915f..2c08c4f6c5 100644
--- a/deepmd/pt/model/model/make_model.py
+++ b/deepmd/pt/model/model/make_model.py
@@ -233,8 +233,6 @@ def change_out_bias(
                 merged,
                 bias_adjust_mode=bias_adjust_mode,
             )
-            if bias_adjust_mode == "set-by-statistic":
-                self.atomic_model.compute_fitting_input_stat(merged)
 
         def forward_common_lower(
             self,
diff --git a/deepmd/pt/train/training.py b/deepmd/pt/train/training.py
index 9d2298febc..4bab617650 100644
--- a/deepmd/pt/train/training.py
+++ b/deepmd/pt/train/training.py
@@ -1825,6 +1825,13 @@ def model_change_out_bias(
     )
     new_bias = deepcopy(_model.get_out_bias())
 
+    from deepmd.pt.model.model.dp_model import (
+        DPModelCommon,
+    )
+
+    if isinstance(_model, DPModelCommon) and _bias_adjust_mode == "set-by-statistic":
+        _model.get_fitting_net().compute_input_stats(_sample_func)
+
     model_type_map = _model.get_type_map()
     log.info(
         f"Change output bias of {model_type_map!s} from {to_numpy_array(old_bias).reshape(-1)!s} to {to_numpy_array(new_bias).reshape(-1)!s}."
diff --git a/source/tests/pt/test_training.py b/source/tests/pt/test_training.py
index ff4f00f912..7ab37253bd 100644
--- a/source/tests/pt/test_training.py
+++ b/source/tests/pt/test_training.py
@@ -10,6 +10,7 @@
     Path,
 )
 
+import numpy as np
 import torch
 
 from deepmd.pt.entrypoints.main import (
@@ -608,5 +609,122 @@ def tearDown(self) -> None:
         DPTrainTest.tearDown(self)
 
 
+class TestModelChangeOutBiasFittingStat(unittest.TestCase):
+    """Verify model_change_out_bias produces the same fitting stat as the old code path.
+
+    The old code called compute_fitting_input_stat inside change_out_bias (make_model.py).
+    The new code calls get_fitting_net().compute_input_stats() separately in
+    model_change_out_bias (training.py). This test verifies they produce identical
+    out_bias, fparam_avg, and fparam_inv_std.
+    """
+
+    def test_fitting_stat_consistency(self) -> None:
+        from deepmd.pt.model.model import get_model as get_model_pt
+        from deepmd.pt.model.model.ener_model import EnergyModel as EnergyModelPT
+        from deepmd.pt.train.training import (
+            model_change_out_bias,
+        )
+        from deepmd.pt.utils.utils import to_numpy_array as torch_to_numpy
+        from deepmd.pt.utils.utils import to_torch_tensor as numpy_to_torch
+        from deepmd.utils.argcheck import model_args as model_args_fn
+
+        # Build a model with numb_fparam=2 so fitting stat is non-trivial
+        model_params = model_args_fn().normalize_value(
+            {
+                "type_map": ["O", "H"],
+                "descriptor": {
+                    "type": "se_e2_a",
+                    "sel": [20, 20],
+                    "rcut_smth": 0.50,
+                    "rcut": 6.00,
+                    "neuron": [3, 6],
+                    "resnet_dt": False,
+                    "axis_neuron": 2,
+                    "precision": "float64",
+                    "type_one_side": True,
+                    "seed": 1,
+                },
+                "fitting_net": {
+                    "neuron": [5, 5],
+                    "resnet_dt": True,
+                    "precision": "float64",
+                    "seed": 1,
+                    "numb_fparam": 2,
+                },
+            },
+            trim_pattern="_*",
+        )
+
+        # Create two identical models via serialize/deserialize
+        model_orig = get_model_pt(model_params)
+        serialized = model_orig.serialize()
+        model_a = EnergyModelPT.deserialize(deepcopy(serialized))
+        model_b = EnergyModelPT.deserialize(deepcopy(serialized))
+
+        # Build mock stat data with fparam
+        nframes = 4
+        natoms = 6
+        coords = np.random.default_rng(42).random((nframes, natoms, 3)) * 13.0
+        atype = np.array([[0, 0, 1, 1, 1, 1]] * nframes, dtype=np.int32)
+        box = np.tile(
+            np.eye(3, dtype=np.float64).reshape(1, 3, 3) * 13.0, (nframes, 1, 1)
+        )
+        natoms_data = np.array([[6, 6, 2, 4]] * nframes, dtype=np.int32)
+        energy = np.array([10.0, 20.0, 15.0, 25.0]).reshape(nframes, 1)
+        # fparam with varying values so mean != 0 and std != 0
+        fparam = np.array(
+            [[1.0, 3.0], [5.0, 7.0], [2.0, 8.0], [6.0, 4.0]], dtype=np.float64
+        )
+
+        merged = [
+            {
+                "coord": numpy_to_torch(coords),
+                "atype": numpy_to_torch(atype),
+                "atype_ext": numpy_to_torch(atype),
+                "box": numpy_to_torch(box),
+                "natoms": numpy_to_torch(natoms_data),
+                "energy": numpy_to_torch(energy),
+                "find_energy": np.float32(1.0),
+                "fparam": numpy_to_torch(fparam),
+                "find_fparam": np.float32(1.0),
+            }
+        ]
+
+        # Model A: simulate the OLD code path
+        # old change_out_bias called both bias adjustment + compute_fitting_input_stat
+        model_a.change_out_bias(merged, bias_adjust_mode="set-by-statistic")
+        model_a.atomic_model.compute_fitting_input_stat(merged)
+
+        # Model B: use the NEW code path via model_change_out_bias
+        sample_func = lambda: merged  # noqa: E731
+        model_change_out_bias(model_b, sample_func, "set-by-statistic")
+
+        # Compare out_bias
+        bias_a = torch_to_numpy(model_a.get_out_bias())
+        bias_b = torch_to_numpy(model_b.get_out_bias())
+        np.testing.assert_allclose(bias_a, bias_b, rtol=1e-10, atol=1e-10)
+
+        # Compare fparam_avg and fparam_inv_std
+        fit_a = model_a.get_fitting_net()
+        fit_b = model_b.get_fitting_net()
+        fparam_avg_a = torch_to_numpy(fit_a.fparam_avg)
+        fparam_avg_b = torch_to_numpy(fit_b.fparam_avg)
+        fparam_inv_std_a = torch_to_numpy(fit_a.fparam_inv_std)
+        fparam_inv_std_b = torch_to_numpy(fit_b.fparam_inv_std)
+
+        np.testing.assert_allclose(fparam_avg_a, fparam_avg_b, rtol=1e-10, atol=1e-10)
+        np.testing.assert_allclose(
+            fparam_inv_std_a, fparam_inv_std_b, rtol=1e-10, atol=1e-10
+        )
+
+        # Verify non-trivial: avg should not be zeros, inv_std should not be ones
+        assert not np.allclose(fparam_avg_a, 0.0), (
+            "fparam_avg is still zero — stat was not computed"
+        )
+        assert not np.allclose(fparam_inv_std_a, 1.0), (
+            "fparam_inv_std is still ones — stat was not computed"
+        )
+
+
 if __name__ == "__main__":
     unittest.main()

From b7af468e7f2d5a711c16e9a84e071caecc1af685 Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Wed, 25 Feb 2026 12:28:52 +0800
Subject: [PATCH 35/63] chore(pd): update in the same way as pt

---
 deepmd/pd/model/model/make_model.py |   2 -
 deepmd/pd/train/training.py         |   7 ++
 source/tests/pd/test_training.py    | 117 ++++++++++++++++++++++++++++
 3 files changed, 124 insertions(+), 2 deletions(-)

diff --git a/deepmd/pd/model/model/make_model.py b/deepmd/pd/model/model/make_model.py
index 1f46cb98c7..d98bee7ed9 100644
--- a/deepmd/pd/model/model/make_model.py
+++ b/deepmd/pd/model/model/make_model.py
@@ -249,8 +249,6 @@ def change_out_bias(
                 merged,
                 bias_adjust_mode=bias_adjust_mode,
             )
-            if bias_adjust_mode == "set-by-statistic":
-                self.atomic_model.compute_fitting_input_stat(merged)
 
         def forward_common_lower(
             self,
diff --git a/deepmd/pd/train/training.py b/deepmd/pd/train/training.py
index dbcbe8d9f6..4e919454eb 100644
--- a/deepmd/pd/train/training.py
+++ b/deepmd/pd/train/training.py
@@ -1417,6 +1417,13 @@ def model_change_out_bias(
     )
     new_bias = deepcopy(_model.get_out_bias())
 
+    from deepmd.pd.model.model.dp_model import (
+        DPModelCommon,
+    )
+
+    if isinstance(_model, DPModelCommon) and _bias_adjust_mode == "set-by-statistic":
+        _model.get_fitting_net().compute_input_stats(_sample_func)
+
     model_type_map = _model.get_type_map()
     log.info(
         f"Change output bias of {model_type_map!s} "
diff --git a/source/tests/pd/test_training.py b/source/tests/pd/test_training.py
index 692a8fb32f..625d1996de 100644
--- a/source/tests/pd/test_training.py
+++ b/source/tests/pd/test_training.py
@@ -236,5 +236,122 @@ def tearDown(self) -> None:
         DPTrainTest.tearDown(self)
 
 
+class TestModelChangeOutBiasFittingStat(unittest.TestCase):
+    """Verify model_change_out_bias produces the same fitting stat as the old code path.
+
+    The old code called compute_fitting_input_stat inside change_out_bias (make_model.py).
+    The new code calls get_fitting_net().compute_input_stats() separately in
+    model_change_out_bias (training.py). This test verifies they produce identical
+    out_bias, fparam_avg, and fparam_inv_std.
+    """
+
+    def test_fitting_stat_consistency(self) -> None:
+        from deepmd.pd.model.model import get_model as get_model_pd
+        from deepmd.pd.model.model.ener_model import EnergyModel as EnergyModelPD
+        from deepmd.pd.train.training import (
+            model_change_out_bias,
+        )
+        from deepmd.pd.utils.utils import to_numpy_array as paddle_to_numpy
+        from deepmd.pd.utils.utils import to_paddle_tensor as numpy_to_paddle
+        from deepmd.utils.argcheck import model_args as model_args_fn
+
+        # Build a model with numb_fparam=2 so fitting stat is non-trivial
+        model_params = model_args_fn().normalize_value(
+            {
+                "type_map": ["O", "H"],
+                "descriptor": {
+                    "type": "se_e2_a",
+                    "sel": [20, 20],
+                    "rcut_smth": 0.50,
+                    "rcut": 6.00,
+                    "neuron": [3, 6],
+                    "resnet_dt": False,
+                    "axis_neuron": 2,
+                    "precision": "float64",
+                    "type_one_side": True,
+                    "seed": 1,
+                },
+                "fitting_net": {
+                    "neuron": [5, 5],
+                    "resnet_dt": True,
+                    "precision": "float64",
+                    "seed": 1,
+                    "numb_fparam": 2,
+                },
+            },
+            trim_pattern="_*",
+        )
+
+        # Create two identical models via serialize/deserialize
+        model_orig = get_model_pd(model_params)
+        serialized = model_orig.serialize()
+        model_a = EnergyModelPD.deserialize(deepcopy(serialized))
+        model_b = EnergyModelPD.deserialize(deepcopy(serialized))
+
+        # Build mock stat data with fparam
+        nframes = 4
+        natoms = 6
+        coords = np.random.default_rng(42).random((nframes, natoms, 3)) * 13.0
+        atype = np.array([[0, 0, 1, 1, 1, 1]] * nframes, dtype=np.int32)
+        box = np.tile(
+            np.eye(3, dtype=np.float64).reshape(1, 3, 3) * 13.0, (nframes, 1, 1)
+        )
+        natoms_data = np.array([[6, 6, 2, 4]] * nframes, dtype=np.int32)
+        energy = np.array([10.0, 20.0, 15.0, 25.0]).reshape(nframes, 1)
+        # fparam with varying values so mean != 0 and std != 0
+        fparam = np.array(
+            [[1.0, 3.0], [5.0, 7.0], [2.0, 8.0], [6.0, 4.0]], dtype=np.float64
+        )
+
+        merged = [
+            {
+                "coord": numpy_to_paddle(coords),
+                "atype": numpy_to_paddle(atype),
+                "atype_ext": numpy_to_paddle(atype),
+                "box": numpy_to_paddle(box),
+                "natoms": numpy_to_paddle(natoms_data),
+                "energy": numpy_to_paddle(energy),
+                "find_energy": np.float32(1.0),
+                "fparam": numpy_to_paddle(fparam),
+                "find_fparam": np.float32(1.0),
+            }
+        ]
+
+        # Model A: simulate the OLD code path
+        # old change_out_bias called both bias adjustment + compute_fitting_input_stat
+        model_a.change_out_bias(merged, bias_adjust_mode="set-by-statistic")
+        model_a.atomic_model.compute_fitting_input_stat(merged)
+
+        # Model B: use the NEW code path via model_change_out_bias
+        sample_func = lambda: merged  # noqa: E731
+        model_change_out_bias(model_b, sample_func, "set-by-statistic")
+
+        # Compare out_bias
+        bias_a = paddle_to_numpy(model_a.get_out_bias())
+        bias_b = paddle_to_numpy(model_b.get_out_bias())
+        np.testing.assert_allclose(bias_a, bias_b, rtol=1e-10, atol=1e-10)
+
+        # Compare fparam_avg and fparam_inv_std
+        fit_a = model_a.get_fitting_net()
+        fit_b = model_b.get_fitting_net()
+        fparam_avg_a = paddle_to_numpy(fit_a.fparam_avg)
+        fparam_avg_b = paddle_to_numpy(fit_b.fparam_avg)
+        fparam_inv_std_a = paddle_to_numpy(fit_a.fparam_inv_std)
+        fparam_inv_std_b = paddle_to_numpy(fit_b.fparam_inv_std)
+
+        np.testing.assert_allclose(fparam_avg_a, fparam_avg_b, rtol=1e-10, atol=1e-10)
+        np.testing.assert_allclose(
+            fparam_inv_std_a, fparam_inv_std_b, rtol=1e-10, atol=1e-10
+        )
+
+        # Verify non-trivial: avg should not be zeros, inv_std should not be ones
+        assert not np.allclose(fparam_avg_a, 0.0), (
+            "fparam_avg is still zero — stat was not computed"
+        )
+        assert not np.allclose(fparam_inv_std_a, 1.0), (
+            "fparam_inv_std is still ones — stat was not computed"
+        )
+
+
 if __name__ == "__main__":
     unittest.main()

From 0ec574876ab7032a996c52fee5bb8d1e80faec55 Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Wed, 25 Feb 2026 12:46:05 +0800
Subject: [PATCH 36/63] update test for change out bias

---
 deepmd/dpmodel/model/make_model.py            |  2 -
 source/tests/consistent/model/test_dipole.py  | 76 +------------------
 source/tests/consistent/model/test_dos.py     | 76 +------------------
 source/tests/consistent/model/test_ener.py    | 76 ++-----------------
 source/tests/consistent/model/test_polar.py   | 76 +------------------
 .../tests/consistent/model/test_property.py   | 76 +------------------
 .../tests/consistent/model/test_zbl_ener.py   | 54 +++++++------
 7 files changed, 53 insertions(+), 383 deletions(-)

diff --git a/deepmd/dpmodel/model/make_model.py b/deepmd/dpmodel/model/make_model.py
index c427a8e904..f06451b3fa 100644
--- a/deepmd/dpmodel/model/make_model.py
+++ b/deepmd/dpmodel/model/make_model.py
@@ -417,8 +417,6 @@ def change_out_bias(
                 'change-by-statistic' or 'set-by-statistic'.
             """
             self.atomic_model.change_out_bias(merged, bias_adjust_mode=bias_adjust_mode)
-            if bias_adjust_mode == "set-by-statistic":
-                self.atomic_model.compute_fitting_input_stat(merged)
 
         def _input_type_cast(
             self,
diff --git a/source/tests/consistent/model/test_dipole.py b/source/tests/consistent/model/test_dipole.py
index b75101228d..bc4047345e 100644
--- a/source/tests/consistent/model/test_dipole.py
+++ b/source/tests/consistent/model/test_dipole.py
@@ -720,10 +720,11 @@ def _get_fitting_stats(self, model, backend="dp"):
             }
 
     def test_change_out_bias(self) -> None:
-        """change_out_bias should produce consistent bias and fitting stats on dp, pt, and pt_expt.
+        """change_out_bias should produce consistent bias on dp, pt, and pt_expt.
 
-        Note: DipoleModel's apply_out_stat is a no-op, so bias doesn't affect output,
-        but the bias storage and fitting input stats should still be consistent.
+        Tests both set-by-statistic and change-by-statistic modes.
+        Note: change_out_bias only updates the output bias, not fitting input
+        stats (fparam/aparam). Fitting stats are updated by compute_or_load_stat.
         """
         nframes = 2
         nloc = 6
@@ -775,9 +776,6 @@ def test_change_out_bias(self) -> None:
         # pt_expt stat data (numpy, same as dp)
         pe_merged = dp_merged
 
-        # Save initial fitting stats (all zeros / ones)
-        dp_stats_init = self._get_fitting_stats(self.dp_model, "dp")
-
         # Save initial (zero) bias
         dp_bias_init = to_numpy_array(self.dp_model.get_out_bias()).copy()
 
@@ -795,40 +793,6 @@ def test_change_out_bias(self) -> None:
         np.testing.assert_allclose(dp_bias, pt_bias, rtol=1e-10, atol=1e-10)
         np.testing.assert_allclose(dp_bias, pe_bias, rtol=1e-10, atol=1e-10)
 
-        # Verify fitting input stats were updated (set-by-statistic triggers compute_fitting_input_stat)
-        dp_stats_set = self._get_fitting_stats(self.dp_model, "dp")
-        pt_stats_set = self._get_fitting_stats(self.pt_model, "pt")
-        pe_stats_set = self._get_fitting_stats(self.pt_expt_model, "dp")
-        for stat_key in (
-            "fparam_avg",
-            "fparam_inv_std",
-            "aparam_avg",
-            "aparam_inv_std",
-        ):
-            np.testing.assert_allclose(
-                dp_stats_set[stat_key],
-                pt_stats_set[stat_key],
-                rtol=1e-10,
-                atol=1e-10,
-                err_msg=f"dp vs pt {stat_key} mismatch after set-by-statistic",
-            )
-            np.testing.assert_allclose(
-                dp_stats_set[stat_key],
-                pe_stats_set[stat_key],
-                rtol=1e-10,
-                atol=1e-10,
-                err_msg=f"dp vs pt_expt {stat_key} mismatch after set-by-statistic",
-            )
-        # Verify fparam/aparam stats actually changed from initial values
-        self.assertFalse(
-            np.allclose(dp_stats_set["fparam_avg"], dp_stats_init["fparam_avg"]),
-            "set-by-statistic did not update fparam_avg",
-        )
-        self.assertFalse(
-            np.allclose(dp_stats_set["aparam_avg"], dp_stats_init["aparam_avg"]),
-            "set-by-statistic did not update aparam_avg",
-        )
-
         # --- Test "change-by-statistic" mode ---
         dp_bias_before = dp_bias.copy()
         self.dp_model.change_out_bias(dp_merged, bias_adjust_mode="change-by-statistic")
@@ -844,38 +808,6 @@ def test_change_out_bias(self) -> None:
         np.testing.assert_allclose(dp_bias2, pt_bias2, rtol=1e-10, atol=1e-10)
         np.testing.assert_allclose(dp_bias2, pe_bias2, rtol=1e-10, atol=1e-10)
 
-        # Verify fitting input stats did NOT change (change-by-statistic should not recompute them)
-        dp_stats_chg = self._get_fitting_stats(self.dp_model, "dp")
-        pt_stats_chg = self._get_fitting_stats(self.pt_model, "pt")
-        pe_stats_chg = self._get_fitting_stats(self.pt_expt_model, "dp")
-        for stat_key in (
-            "fparam_avg",
-            "fparam_inv_std",
-            "aparam_avg",
-            "aparam_inv_std",
-        ):
-            np.testing.assert_allclose(
-                dp_stats_chg[stat_key],
-                dp_stats_set[stat_key],
-                rtol=1e-10,
-                atol=1e-10,
-                err_msg=f"dp {stat_key} changed after change-by-statistic (should not)",
-            )
-            np.testing.assert_allclose(
-                pt_stats_chg[stat_key],
-                pt_stats_set[stat_key],
-                rtol=1e-10,
-                atol=1e-10,
-                err_msg=f"pt {stat_key} changed after change-by-statistic (should not)",
-            )
-            np.testing.assert_allclose(
-                pe_stats_chg[stat_key],
-                pe_stats_set[stat_key],
-                rtol=1e-10,
-                atol=1e-10,
-                err_msg=f"pt_expt {stat_key} changed after change-by-statistic (should not)",
-            )
-
     def test_change_type_map(self) -> None:
         """change_type_map should produce consistent results on dp and pt.
 
diff --git a/source/tests/consistent/model/test_dos.py b/source/tests/consistent/model/test_dos.py
index 125ba2a5fe..5ca8f193ab 100644
--- a/source/tests/consistent/model/test_dos.py
+++ b/source/tests/consistent/model/test_dos.py
@@ -704,10 +704,11 @@ def _get_fitting_stats(self, model, backend="dp"):
             }
 
     def test_change_out_bias(self) -> None:
-        """change_out_bias should produce consistent bias and fitting stats on dp, pt, and pt_expt.
+        """change_out_bias should produce consistent bias on dp, pt, and pt_expt.
 
-        DOSModel uses default apply_out_stat (per-atom type bias),
-        so set-by-statistic should change the bias from initial values.
+        Tests both set-by-statistic and change-by-statistic modes.
+        Note: change_out_bias only updates the output bias, not fitting input
+        stats (fparam/aparam). Fitting stats are updated by compute_or_load_stat.
         """
         nframes = 2
         nloc = 6
@@ -759,9 +760,6 @@ def test_change_out_bias(self) -> None:
         # pt_expt stat data (numpy, same as dp)
         pe_merged = dp_merged
 
-        # Save initial fitting stats (all zeros / ones)
-        dp_stats_init = self._get_fitting_stats(self.dp_model, "dp")
-
         # Save initial (zero) bias
         dp_bias_init = to_numpy_array(self.dp_model.get_out_bias()).copy()
 
@@ -779,40 +777,6 @@ def test_change_out_bias(self) -> None:
         np.testing.assert_allclose(dp_bias, pt_bias, rtol=1e-10, atol=1e-10)
         np.testing.assert_allclose(dp_bias, pe_bias, rtol=1e-10, atol=1e-10)
 
-        # Verify fitting input stats were updated (set-by-statistic triggers compute_fitting_input_stat)
-        dp_stats_set = self._get_fitting_stats(self.dp_model, "dp")
-        pt_stats_set = self._get_fitting_stats(self.pt_model, "pt")
-        pe_stats_set = self._get_fitting_stats(self.pt_expt_model, "dp")
-        for stat_key in (
-            "fparam_avg",
-            "fparam_inv_std",
-            "aparam_avg",
-            "aparam_inv_std",
-        ):
-            np.testing.assert_allclose(
-                dp_stats_set[stat_key],
-                pt_stats_set[stat_key],
-                rtol=1e-10,
-                atol=1e-10,
-                err_msg=f"dp vs pt {stat_key} mismatch after set-by-statistic",
-            )
-            np.testing.assert_allclose(
-                dp_stats_set[stat_key],
-                pe_stats_set[stat_key],
-                rtol=1e-10,
-                atol=1e-10,
-                err_msg=f"dp vs pt_expt {stat_key} mismatch after set-by-statistic",
-            )
-        # Verify fparam/aparam stats actually changed from initial values
-        self.assertFalse(
-            np.allclose(dp_stats_set["fparam_avg"], dp_stats_init["fparam_avg"]),
-            "set-by-statistic did not update fparam_avg",
-        )
-        self.assertFalse(
-            np.allclose(dp_stats_set["aparam_avg"], dp_stats_init["aparam_avg"]),
-            "set-by-statistic did not update aparam_avg",
-        )
-
         # --- Test "change-by-statistic" mode ---
         dp_bias_before = dp_bias.copy()
         self.dp_model.change_out_bias(dp_merged, bias_adjust_mode="change-by-statistic")
@@ -828,38 +792,6 @@ def test_change_out_bias(self) -> None:
         np.testing.assert_allclose(dp_bias2, pt_bias2, rtol=1e-10, atol=1e-10)
         np.testing.assert_allclose(dp_bias2, pe_bias2, rtol=1e-10, atol=1e-10)
 
-        # Verify fitting input stats did NOT change (change-by-statistic should not recompute them)
-        dp_stats_chg = self._get_fitting_stats(self.dp_model, "dp")
-        pt_stats_chg = self._get_fitting_stats(self.pt_model, "pt")
-        pe_stats_chg = self._get_fitting_stats(self.pt_expt_model, "dp")
-        for stat_key in (
-            "fparam_avg",
-            "fparam_inv_std",
-            "aparam_avg",
-            "aparam_inv_std",
-        ):
-            np.testing.assert_allclose(
-                dp_stats_chg[stat_key],
-                dp_stats_set[stat_key],
-                rtol=1e-10,
-                atol=1e-10,
-                err_msg=f"dp {stat_key} changed after change-by-statistic (should not)",
-            )
-            np.testing.assert_allclose(
-                pt_stats_chg[stat_key],
-                pt_stats_set[stat_key],
-                rtol=1e-10,
-                atol=1e-10,
-                err_msg=f"pt {stat_key} changed after change-by-statistic (should not)",
-            )
-            np.testing.assert_allclose(
-                pe_stats_chg[stat_key],
-                pe_stats_set[stat_key],
-                rtol=1e-10,
-                atol=1e-10,
-                err_msg=f"pt_expt {stat_key} changed after change-by-statistic (should not)",
-            )
-
     def test_change_type_map(self) -> None:
         """change_type_map should produce consistent results on dp and pt.
 
diff --git a/source/tests/consistent/model/test_ener.py b/source/tests/consistent/model/test_ener.py
index 88e34633e2..5bcdc0a7c0 100644
--- a/source/tests/consistent/model/test_ener.py
+++ b/source/tests/consistent/model/test_ener.py
@@ -1017,7 +1017,12 @@ def _get_fitting_stats(self, model, backend="dp"):
             }
 
     def test_change_out_bias(self) -> None:
-        """change_out_bias should produce consistent bias and fitting stats on dp, pt, and pt_expt."""
+        """change_out_bias should produce consistent bias on dp, pt, and pt_expt.
+
+        Tests both set-by-statistic and change-by-statistic modes.
+        Note: change_out_bias only updates the output bias, not fitting input
+        stats (fparam/aparam). Fitting stats are updated by compute_or_load_stat.
+        """
         nframes = 2
         nloc = 6
         numb_fparam = 2
@@ -1068,9 +1073,6 @@ def test_change_out_bias(self) -> None:
         # pt_expt stat data (numpy, same as dp)
         pe_merged = dp_merged
 
-        # Save initial fitting stats (all zeros / ones)
-        dp_stats_init = self._get_fitting_stats(self.dp_model, "dp")
-
         # Save initial (zero) bias
         dp_bias_init = to_numpy_array(self.dp_model.get_out_bias()).copy()
 
@@ -1092,40 +1094,6 @@ def test_change_out_bias(self) -> None:
             "set-by-statistic did not change the bias from initial values",
         )
 
-        # Verify fitting input stats were updated (set-by-statistic triggers compute_fitting_input_stat)
-        dp_stats_set = self._get_fitting_stats(self.dp_model, "dp")
-        pt_stats_set = self._get_fitting_stats(self.pt_model, "pt")
-        pe_stats_set = self._get_fitting_stats(self.pt_expt_model, "dp")
-        for stat_key in (
-            "fparam_avg",
-            "fparam_inv_std",
-            "aparam_avg",
-            "aparam_inv_std",
-        ):
-            np.testing.assert_allclose(
-                dp_stats_set[stat_key],
-                pt_stats_set[stat_key],
-                rtol=1e-10,
-                atol=1e-10,
-                err_msg=f"dp vs pt {stat_key} mismatch after set-by-statistic",
-            )
-            np.testing.assert_allclose(
-                dp_stats_set[stat_key],
-                pe_stats_set[stat_key],
-                rtol=1e-10,
-                atol=1e-10,
-                err_msg=f"dp vs pt_expt {stat_key} mismatch after set-by-statistic",
-            )
-        # Verify fparam/aparam stats actually changed from initial values
-        self.assertFalse(
-            np.allclose(dp_stats_set["fparam_avg"], dp_stats_init["fparam_avg"]),
-            "set-by-statistic did not update fparam_avg",
-        )
-        self.assertFalse(
-            np.allclose(dp_stats_set["aparam_avg"], dp_stats_init["aparam_avg"]),
-            "set-by-statistic did not update aparam_avg",
-        )
-
         # --- Test "change-by-statistic" mode ---
         dp_bias_before = dp_bias.copy()
         self.dp_model.change_out_bias(dp_merged, bias_adjust_mode="change-by-statistic")
@@ -1145,38 +1113,6 @@ def test_change_out_bias(self) -> None:
             "change-by-statistic did not further change the bias",
         )
 
-        # Verify fitting input stats did NOT change (change-by-statistic should not recompute them)
-        dp_stats_chg = self._get_fitting_stats(self.dp_model, "dp")
-        pt_stats_chg = self._get_fitting_stats(self.pt_model, "pt")
-        pe_stats_chg = self._get_fitting_stats(self.pt_expt_model, "dp")
-        for stat_key in (
-            "fparam_avg",
-            "fparam_inv_std",
-            "aparam_avg",
-            "aparam_inv_std",
-        ):
-            np.testing.assert_allclose(
-                dp_stats_chg[stat_key],
-                dp_stats_set[stat_key],
-                rtol=1e-10,
-                atol=1e-10,
-                err_msg=f"dp {stat_key} changed after change-by-statistic (should not)",
-            )
-            np.testing.assert_allclose(
-                pt_stats_chg[stat_key],
-                pt_stats_set[stat_key],
-                rtol=1e-10,
-                atol=1e-10,
-                err_msg=f"pt {stat_key} changed after change-by-statistic (should not)",
-            )
-            np.testing.assert_allclose(
-                pe_stats_chg[stat_key],
-                pe_stats_set[stat_key],
-                rtol=1e-10,
-                atol=1e-10,
-                err_msg=f"pt_expt {stat_key} changed after change-by-statistic (should not)",
-            )
-
     def test_change_type_map(self) -> None:
         """change_type_map should produce consistent results on dp and pt.
 
diff --git a/source/tests/consistent/model/test_polar.py b/source/tests/consistent/model/test_polar.py
index 46162a39e9..902abdd722 100644
--- a/source/tests/consistent/model/test_polar.py
+++ b/source/tests/consistent/model/test_polar.py
@@ -714,10 +714,11 @@ def _get_fitting_stats(self, model, backend="dp"):
             }
 
     def test_change_out_bias(self) -> None:
-        """change_out_bias should produce consistent bias and fitting stats on dp, pt, and pt_expt.
+        """change_out_bias should produce consistent bias on dp, pt, and pt_expt.
 
-        PolarModel's apply_out_stat applies diagonal bias with scale,
-        so set-by-statistic should change the bias from initial values.
+        Tests both set-by-statistic and change-by-statistic modes.
+        Note: change_out_bias only updates the output bias, not fitting input
+        stats (fparam/aparam). Fitting stats are updated by compute_or_load_stat.
         """
         nframes = 2
         nloc = 6
@@ -769,9 +770,6 @@ def test_change_out_bias(self) -> None:
         # pt_expt stat data (numpy, same as dp)
         pe_merged = dp_merged
 
-        # Save initial fitting stats (all zeros / ones)
-        dp_stats_init = self._get_fitting_stats(self.dp_model, "dp")
-
         # Save initial (zero) bias
         dp_bias_init = to_numpy_array(self.dp_model.get_out_bias()).copy()
 
@@ -789,40 +787,6 @@ def test_change_out_bias(self) -> None:
         np.testing.assert_allclose(dp_bias, pt_bias, rtol=1e-10, atol=1e-10)
         np.testing.assert_allclose(dp_bias, pe_bias, rtol=1e-10, atol=1e-10)
 
-        # Verify fitting input stats were updated (set-by-statistic triggers compute_fitting_input_stat)
-        dp_stats_set = self._get_fitting_stats(self.dp_model, "dp")
-        pt_stats_set = self._get_fitting_stats(self.pt_model, "pt")
-        pe_stats_set = self._get_fitting_stats(self.pt_expt_model, "dp")
-        for stat_key in (
-            "fparam_avg",
-            "fparam_inv_std",
-            "aparam_avg",
-            "aparam_inv_std",
-        ):
-            np.testing.assert_allclose(
-                dp_stats_set[stat_key],
-                pt_stats_set[stat_key],
-                rtol=1e-10,
-                atol=1e-10,
-                err_msg=f"dp vs pt {stat_key} mismatch after set-by-statistic",
-            )
-            np.testing.assert_allclose(
-                dp_stats_set[stat_key],
-                pe_stats_set[stat_key],
-                rtol=1e-10,
-                atol=1e-10,
-                err_msg=f"dp vs pt_expt {stat_key} mismatch after set-by-statistic",
-            )
-        # Verify fparam/aparam stats actually changed from initial values
-        self.assertFalse(
-            np.allclose(dp_stats_set["fparam_avg"], dp_stats_init["fparam_avg"]),
-            "set-by-statistic did not update fparam_avg",
-        )
-        self.assertFalse(
-            np.allclose(dp_stats_set["aparam_avg"], dp_stats_init["aparam_avg"]),
-            "set-by-statistic did not update aparam_avg",
-        )
-
         # --- Test "change-by-statistic" mode ---
         dp_bias_before = dp_bias.copy()
         self.dp_model.change_out_bias(dp_merged, bias_adjust_mode="change-by-statistic")
@@ -838,38 +802,6 @@ def test_change_out_bias(self) -> None:
         np.testing.assert_allclose(dp_bias2, pt_bias2, rtol=1e-10, atol=1e-10)
         np.testing.assert_allclose(dp_bias2, pe_bias2, rtol=1e-10, atol=1e-10)
 
-        # Verify fitting input stats did NOT change (change-by-statistic should not recompute them)
-        dp_stats_chg = self._get_fitting_stats(self.dp_model, "dp")
-        pt_stats_chg = self._get_fitting_stats(self.pt_model, "pt")
-        pe_stats_chg = self._get_fitting_stats(self.pt_expt_model, "dp")
-        for stat_key in (
-            "fparam_avg",
-            "fparam_inv_std",
-            "aparam_avg",
-            "aparam_inv_std",
-        ):
-            np.testing.assert_allclose(
-                dp_stats_chg[stat_key],
-                dp_stats_set[stat_key],
-                rtol=1e-10,
-                atol=1e-10,
-                err_msg=f"dp {stat_key} changed after change-by-statistic (should not)",
-            )
-            np.testing.assert_allclose(
-                pt_stats_chg[stat_key],
-                pt_stats_set[stat_key],
-                rtol=1e-10,
-                atol=1e-10,
-                err_msg=f"pt {stat_key} changed after change-by-statistic (should not)",
-            )
-            np.testing.assert_allclose(
-                pe_stats_chg[stat_key],
-                pe_stats_set[stat_key],
-                rtol=1e-10,
-                atol=1e-10,
-                err_msg=f"pt_expt {stat_key} changed after change-by-statistic (should not)",
-            )
-
     def test_change_type_map(self) -> None:
         """change_type_map should produce consistent results on dp and pt.
 
diff --git a/source/tests/consistent/model/test_property.py b/source/tests/consistent/model/test_property.py
index 47d90eae4b..952642f383 100644
--- a/source/tests/consistent/model/test_property.py
+++ b/source/tests/consistent/model/test_property.py
@@ -701,10 +701,11 @@ def _get_fitting_stats(self, model, backend="dp"):
             }
 
     def test_change_out_bias(self) -> None:
-        """change_out_bias should produce consistent bias and fitting stats on dp, pt, and pt_expt.
+        """change_out_bias should produce consistent bias on dp, pt, and pt_expt.
 
-        PropertyModel's apply_out_stat applies output * std + bias,
-        so set-by-statistic should change the bias from initial values.
+        Tests both set-by-statistic and change-by-statistic modes.
+        Note: change_out_bias only updates the output bias, not fitting input
+        stats (fparam/aparam). Fitting stats are updated by compute_or_load_stat.
         """
         nframes = 2
         nloc = 6
@@ -756,9 +757,6 @@ def test_change_out_bias(self) -> None:
         # pt_expt stat data (numpy, same as dp)
         pe_merged = dp_merged
 
-        # Save initial fitting stats (all zeros / ones)
-        dp_stats_init = self._get_fitting_stats(self.dp_model, "dp")
-
         # Save initial (zero) bias
         dp_bias_init = to_numpy_array(self.dp_model.get_out_bias()).copy()
 
@@ -776,40 +774,6 @@ def test_change_out_bias(self) -> None:
         np.testing.assert_allclose(dp_bias, pt_bias, rtol=1e-10, atol=1e-10)
         np.testing.assert_allclose(dp_bias, pe_bias, rtol=1e-10, atol=1e-10)
 
-        # Verify fitting input stats were updated (set-by-statistic triggers compute_fitting_input_stat)
-        dp_stats_set = self._get_fitting_stats(self.dp_model, "dp")
-        pt_stats_set = self._get_fitting_stats(self.pt_model, "pt")
-        pe_stats_set = self._get_fitting_stats(self.pt_expt_model, "dp")
-        for stat_key in (
-            "fparam_avg",
-            "fparam_inv_std",
-            "aparam_avg",
-            "aparam_inv_std",
-        ):
-            np.testing.assert_allclose(
-                dp_stats_set[stat_key],
-                pt_stats_set[stat_key],
-                rtol=1e-10,
-                atol=1e-10,
-                err_msg=f"dp vs pt {stat_key} mismatch after set-by-statistic",
-            )
-            np.testing.assert_allclose(
-                dp_stats_set[stat_key],
-                pe_stats_set[stat_key],
-                rtol=1e-10,
-                atol=1e-10,
-                err_msg=f"dp vs pt_expt {stat_key} mismatch after set-by-statistic",
-            )
-        # Verify fparam/aparam stats actually changed from initial values
-        self.assertFalse(
-            np.allclose(dp_stats_set["fparam_avg"], dp_stats_init["fparam_avg"]),
-            "set-by-statistic did not update fparam_avg",
-        )
-        self.assertFalse(
-            np.allclose(dp_stats_set["aparam_avg"], dp_stats_init["aparam_avg"]),
-            "set-by-statistic did not update aparam_avg",
-        )
-
         # --- Test "change-by-statistic" mode ---
         dp_bias_before = dp_bias.copy()
         self.dp_model.change_out_bias(dp_merged, bias_adjust_mode="change-by-statistic")
@@ -825,38 +789,6 @@ def test_change_out_bias(self) -> None:
         np.testing.assert_allclose(dp_bias2, pt_bias2, rtol=1e-10, atol=1e-10)
         np.testing.assert_allclose(dp_bias2, pe_bias2, rtol=1e-10, atol=1e-10)
 
-        # Verify fitting input stats did NOT change (change-by-statistic should not recompute them)
-        dp_stats_chg = self._get_fitting_stats(self.dp_model, "dp")
-        pt_stats_chg = self._get_fitting_stats(self.pt_model, "pt")
-        pe_stats_chg = self._get_fitting_stats(self.pt_expt_model, "dp")
-        for stat_key in (
-            "fparam_avg",
-            "fparam_inv_std",
-            "aparam_avg",
-            "aparam_inv_std",
-        ):
-            np.testing.assert_allclose(
-                dp_stats_chg[stat_key],
-                dp_stats_set[stat_key],
-                rtol=1e-10,
-                atol=1e-10,
-                err_msg=f"dp {stat_key} changed after change-by-statistic (should not)",
-            )
-            np.testing.assert_allclose(
-                pt_stats_chg[stat_key],
-                pt_stats_set[stat_key],
-                rtol=1e-10,
-                atol=1e-10,
-                err_msg=f"pt {stat_key} changed after change-by-statistic (should not)",
-            )
-            np.testing.assert_allclose(
-                pe_stats_chg[stat_key],
-                pe_stats_set[stat_key],
-                rtol=1e-10,
-                atol=1e-10,
-                err_msg=f"pt_expt {stat_key} changed after change-by-statistic (should not)",
-            )
-
     def test_change_type_map(self) -> None:
         """change_type_map should produce consistent results on dp and pt.
 
diff --git a/source/tests/consistent/model/test_zbl_ener.py b/source/tests/consistent/model/test_zbl_ener.py
index 3d4327a7db..e7e0eb8a27 100644
--- a/source/tests/consistent/model/test_zbl_ener.py
+++ b/source/tests/consistent/model/test_zbl_ener.py
@@ -697,15 +697,12 @@ def test_forward_common_atomic(self) -> None:
                 )
 
     def test_change_out_bias(self) -> None:
-        """change_out_bias (change-by-statistic) should produce consistent bias on dp, pt, and pt_expt.
+        """change_out_bias should produce consistent bias on dp, pt, and pt_expt.
 
-        DPZBLModel (LinearEnergyAtomicModel) does not support set-by-statistic
-        (no compute_fitting_input_stat), so only change-by-statistic is tested.
-        We first compute initial bias via compute_or_load_out_stat, then verify
-        change-by-statistic updates bias consistently.
+        Tests both set-by-statistic and change-by-statistic modes.
+        DPZBLModel has no fparam/aparam, so fitting stats checks are skipped.
         """
         nframes = 2
-        rng = np.random.default_rng(123)
 
         # Use realistic coords (from setUp, tiled for 2 frames)
         coords_2f = np.tile(self.coords, (nframes, 1, 1))  # (2, 6, 3)
@@ -713,7 +710,7 @@ def test_change_out_bias(self) -> None:
         box_2f = np.tile(self.box.reshape(1, 3, 3), (nframes, 1, 1))
         # natoms: [nloc, nloc, n_type0, n_type1, n_type2] — 3 types
         natoms_data = np.array([[6, 6, 2, 4, 0], [6, 6, 2, 4, 0]], dtype=np.int32)
-        energy_data = rng.normal(size=(nframes, 1)).astype(GLOBAL_NP_FLOAT_PRECISION)
+        energy_data = np.array([10.0, 20.0]).reshape(nframes, 1)
 
         # dpmodel stat data (numpy)
         dp_merged = [
@@ -742,22 +739,29 @@ def test_change_out_bias(self) -> None:
         # pt_expt stat data (numpy, same as dp)
         pe_merged = dp_merged
 
-        # First compute initial bias via compute_or_load_out_stat
-        self.dp_model.atomic_model.compute_or_load_out_stat(dp_merged)
-        self.pt_model.atomic_model.compute_or_load_out_stat(pt_merged)
-        self.pt_expt_model.atomic_model.compute_or_load_out_stat(dp_merged)
+        # Save initial (zero) bias
+        dp_bias_init = to_numpy_array(self.dp_model.get_out_bias()).copy()
 
-        dp_bias_before = to_numpy_array(self.dp_model.get_out_bias()).copy()
-        pt_bias_before = torch_to_numpy(self.pt_model.get_out_bias()).copy()
-        pe_bias_before = to_numpy_array(self.pt_expt_model.get_out_bias()).copy()
-        np.testing.assert_allclose(
-            dp_bias_before, pt_bias_before, rtol=1e-10, atol=1e-10
+        # --- Test "set-by-statistic" mode ---
+        self.dp_model.change_out_bias(dp_merged, bias_adjust_mode="set-by-statistic")
+        self.pt_model.change_out_bias(pt_merged, bias_adjust_mode="set-by-statistic")
+        self.pt_expt_model.change_out_bias(
+            pe_merged, bias_adjust_mode="set-by-statistic"
         )
-        np.testing.assert_allclose(
-            dp_bias_before, pe_bias_before, rtol=1e-10, atol=1e-10
+
+        # Verify out bias consistency
+        dp_bias = to_numpy_array(self.dp_model.get_out_bias())
+        pt_bias = torch_to_numpy(self.pt_model.get_out_bias())
+        pe_bias = to_numpy_array(self.pt_expt_model.get_out_bias())
+        np.testing.assert_allclose(dp_bias, pt_bias, rtol=1e-10, atol=1e-10)
+        np.testing.assert_allclose(dp_bias, pe_bias, rtol=1e-10, atol=1e-10)
+        self.assertFalse(
+            np.allclose(dp_bias, dp_bias_init),
+            "set-by-statistic did not change the bias from initial values",
         )
 
         # --- Test "change-by-statistic" mode ---
+        dp_bias_before = dp_bias.copy()
         self.dp_model.change_out_bias(dp_merged, bias_adjust_mode="change-by-statistic")
         self.pt_model.change_out_bias(pt_merged, bias_adjust_mode="change-by-statistic")
         self.pt_expt_model.change_out_bias(
@@ -765,11 +769,15 @@ def test_change_out_bias(self) -> None:
         )
 
         # Verify out bias consistency
-        dp_bias = to_numpy_array(self.dp_model.get_out_bias())
-        pt_bias = torch_to_numpy(self.pt_model.get_out_bias())
-        pe_bias = to_numpy_array(self.pt_expt_model.get_out_bias())
-        np.testing.assert_allclose(dp_bias, pt_bias, rtol=1e-10, atol=1e-10)
-        np.testing.assert_allclose(dp_bias, pe_bias, rtol=1e-10, atol=1e-10)
+        dp_bias2 = to_numpy_array(self.dp_model.get_out_bias())
+        pt_bias2 = torch_to_numpy(self.pt_model.get_out_bias())
+        pe_bias2 = to_numpy_array(self.pt_expt_model.get_out_bias())
+        np.testing.assert_allclose(dp_bias2, pt_bias2, rtol=1e-10, atol=1e-10)
+        np.testing.assert_allclose(dp_bias2, pe_bias2, rtol=1e-10, atol=1e-10)
+        self.assertFalse(
+            np.allclose(dp_bias2, dp_bias_before),
+            "change-by-statistic did not further change the bias",
+        )
 
     # test_change_type_map: NOT applicable — PairTabAtomicModel does not
     # support changing type map (would require rebuilding the tab file),

From 00f83cc4682cabc5b52f8f0196e3dd16f82221c9 Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Wed, 25 Feb 2026 16:23:39 +0800
Subject: [PATCH 37/63] test the stat is changed

---
 source/tests/consistent/model/test_dipole.py   | 8 ++++++++
 source/tests/consistent/model/test_dos.py      | 8 ++++++++
 source/tests/consistent/model/test_polar.py    | 8 ++++++++
 source/tests/consistent/model/test_property.py | 8 ++++++++
 4 files changed, 32 insertions(+)

diff --git a/source/tests/consistent/model/test_dipole.py b/source/tests/consistent/model/test_dipole.py
index bc4047345e..6742dd7f69 100644
--- a/source/tests/consistent/model/test_dipole.py
+++ b/source/tests/consistent/model/test_dipole.py
@@ -792,6 +792,10 @@ def test_change_out_bias(self) -> None:
         pe_bias = to_numpy_array(self.pt_expt_model.get_out_bias())
         np.testing.assert_allclose(dp_bias, pt_bias, rtol=1e-10, atol=1e-10)
         np.testing.assert_allclose(dp_bias, pe_bias, rtol=1e-10, atol=1e-10)
+        self.assertFalse(
+            np.allclose(dp_bias, dp_bias_init),
+            "set-by-statistic did not change the bias from initial values",
+        )
 
         # --- Test "change-by-statistic" mode ---
         dp_bias_before = dp_bias.copy()
@@ -807,6 +811,10 @@ def test_change_out_bias(self) -> None:
         pe_bias2 = to_numpy_array(self.pt_expt_model.get_out_bias())
         np.testing.assert_allclose(dp_bias2, pt_bias2, rtol=1e-10, atol=1e-10)
         np.testing.assert_allclose(dp_bias2, pe_bias2, rtol=1e-10, atol=1e-10)
+        self.assertFalse(
+            np.allclose(dp_bias2, dp_bias_before),
+            "change-by-statistic did not further change the bias",
+        )
 
     def test_change_type_map(self) -> None:
         """change_type_map should produce consistent results on dp and pt.
diff --git a/source/tests/consistent/model/test_dos.py b/source/tests/consistent/model/test_dos.py
index 5ca8f193ab..5cb7d722c8 100644
--- a/source/tests/consistent/model/test_dos.py
+++ b/source/tests/consistent/model/test_dos.py
@@ -776,6 +776,10 @@ def test_change_out_bias(self) -> None:
         pe_bias = to_numpy_array(self.pt_expt_model.get_out_bias())
         np.testing.assert_allclose(dp_bias, pt_bias, rtol=1e-10, atol=1e-10)
         np.testing.assert_allclose(dp_bias, pe_bias, rtol=1e-10, atol=1e-10)
+        self.assertFalse(
+            np.allclose(dp_bias, dp_bias_init),
+            "set-by-statistic did not change the bias from initial values",
+        )
 
         # --- Test "change-by-statistic" mode ---
         dp_bias_before = dp_bias.copy()
@@ -791,6 +795,10 @@ def test_change_out_bias(self) -> None:
         pe_bias2 = to_numpy_array(self.pt_expt_model.get_out_bias())
         np.testing.assert_allclose(dp_bias2, pt_bias2, rtol=1e-10, atol=1e-10)
         np.testing.assert_allclose(dp_bias2, pe_bias2, rtol=1e-10, atol=1e-10)
+        self.assertFalse(
+            np.allclose(dp_bias2, dp_bias_before),
+            "change-by-statistic did not further change the bias",
+        )
 
     def test_change_type_map(self) -> None:
         """change_type_map should produce consistent results on dp and pt.
diff --git a/source/tests/consistent/model/test_polar.py b/source/tests/consistent/model/test_polar.py
index 902abdd722..cba3147c53 100644
--- a/source/tests/consistent/model/test_polar.py
+++ b/source/tests/consistent/model/test_polar.py
@@ -786,6 +786,10 @@ def test_change_out_bias(self) -> None:
         pe_bias = to_numpy_array(self.pt_expt_model.get_out_bias())
         np.testing.assert_allclose(dp_bias, pt_bias, rtol=1e-10, atol=1e-10)
         np.testing.assert_allclose(dp_bias, pe_bias, rtol=1e-10, atol=1e-10)
+        self.assertFalse(
+            np.allclose(dp_bias, dp_bias_init),
+            "set-by-statistic did not change the bias from initial values",
+        )
 
         # --- Test "change-by-statistic" mode ---
         dp_bias_before = dp_bias.copy()
@@ -801,6 +805,10 @@ def test_change_out_bias(self) -> None:
         pe_bias2 = to_numpy_array(self.pt_expt_model.get_out_bias())
         np.testing.assert_allclose(dp_bias2, pt_bias2, rtol=1e-10, atol=1e-10)
         np.testing.assert_allclose(dp_bias2, pe_bias2, rtol=1e-10, atol=1e-10)
+        self.assertFalse(
+            np.allclose(dp_bias2, dp_bias_before),
+            "change-by-statistic did not further change the bias",
+        )
 
     def test_change_type_map(self) -> None:
         """change_type_map should produce consistent results on dp and pt.
diff --git a/source/tests/consistent/model/test_property.py b/source/tests/consistent/model/test_property.py
index 952642f383..65a9d50cc1 100644
--- a/source/tests/consistent/model/test_property.py
+++ b/source/tests/consistent/model/test_property.py
@@ -773,6 +773,10 @@ def test_change_out_bias(self) -> None:
         pe_bias = to_numpy_array(self.pt_expt_model.get_out_bias())
         np.testing.assert_allclose(dp_bias, pt_bias, rtol=1e-10, atol=1e-10)
         np.testing.assert_allclose(dp_bias, pe_bias, rtol=1e-10, atol=1e-10)
+        self.assertFalse(
+            np.allclose(dp_bias, dp_bias_init),
+            "set-by-statistic did not change the bias from initial values",
+        )
 
         # --- Test "change-by-statistic" mode ---
         dp_bias_before = dp_bias.copy()
@@ -788,6 +792,10 @@ def test_change_out_bias(self) -> None:
         pe_bias2 = to_numpy_array(self.pt_expt_model.get_out_bias())
         np.testing.assert_allclose(dp_bias2, pt_bias2, rtol=1e-10, atol=1e-10)
         np.testing.assert_allclose(dp_bias2, pe_bias2, rtol=1e-10, atol=1e-10)
+        self.assertFalse(
+            np.allclose(dp_bias2, dp_bias_before),
+            "change-by-statistic did not further change the bias",
+        )
 
     def test_change_type_map(self) -> None:
         """change_type_map should produce consistent results on dp and pt.

From ff4a27c066a61dfb003177641d45d8f95b1a040f Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Wed, 25 Feb 2026 16:28:49 +0800
Subject: [PATCH 38/63] rm unused methods

---
 source/tests/consistent/model/test_dipole.py   | 18 ------------------
 source/tests/consistent/model/test_dos.py      | 18 ------------------
 source/tests/consistent/model/test_ener.py     | 18 ------------------
 source/tests/consistent/model/test_polar.py    | 18 ------------------
 source/tests/consistent/model/test_property.py | 18 ------------------
 5 files changed, 90 deletions(-)

diff --git a/source/tests/consistent/model/test_dipole.py b/source/tests/consistent/model/test_dipole.py
index 6742dd7f69..c6c2f01697 100644
--- a/source/tests/consistent/model/test_dipole.py
+++ b/source/tests/consistent/model/test_dipole.py
@@ -701,24 +701,6 @@ def test_get_default_fparam(self) -> None:
         np.testing.assert_allclose(dp_val, pt_val, rtol=1e-10, atol=1e-10)
         np.testing.assert_allclose(dp_val, [0.5, -0.3], rtol=1e-10, atol=1e-10)
 
-    def _get_fitting_stats(self, model, backend="dp"):
-        """Extract fparam/aparam stats from a model's fitting net."""
-        fitting = model.get_fitting_net()
-        if backend == "pt":
-            return {
-                "fparam_avg": torch_to_numpy(fitting.fparam_avg),
-                "fparam_inv_std": torch_to_numpy(fitting.fparam_inv_std),
-                "aparam_avg": torch_to_numpy(fitting.aparam_avg),
-                "aparam_inv_std": torch_to_numpy(fitting.aparam_inv_std),
-            }
-        else:
-            return {
-                "fparam_avg": to_numpy_array(fitting.fparam_avg),
-                "fparam_inv_std": to_numpy_array(fitting.fparam_inv_std),
-                "aparam_avg": to_numpy_array(fitting.aparam_avg),
-                "aparam_inv_std": to_numpy_array(fitting.aparam_inv_std),
-            }
-
     def test_change_out_bias(self) -> None:
         """change_out_bias should produce consistent bias on dp, pt, and pt_expt.
 
diff --git a/source/tests/consistent/model/test_dos.py b/source/tests/consistent/model/test_dos.py
index 5cb7d722c8..2068274183 100644
--- a/source/tests/consistent/model/test_dos.py
+++ b/source/tests/consistent/model/test_dos.py
@@ -685,24 +685,6 @@ def test_get_default_fparam(self) -> None:
         np.testing.assert_allclose(dp_val, pt_val, rtol=1e-10, atol=1e-10)
         np.testing.assert_allclose(dp_val, [0.5, -0.3], rtol=1e-10, atol=1e-10)
 
-    def _get_fitting_stats(self, model, backend="dp"):
-        """Extract fparam/aparam stats from a model's fitting net."""
-        fitting = model.get_fitting_net()
-        if backend == "pt":
-            return {
-                "fparam_avg": torch_to_numpy(fitting.fparam_avg),
-                "fparam_inv_std": torch_to_numpy(fitting.fparam_inv_std),
-                "aparam_avg": torch_to_numpy(fitting.aparam_avg),
-                "aparam_inv_std": torch_to_numpy(fitting.aparam_inv_std),
-            }
-        else:
-            return {
-                "fparam_avg": to_numpy_array(fitting.fparam_avg),
-                "fparam_inv_std": to_numpy_array(fitting.fparam_inv_std),
-                "aparam_avg": to_numpy_array(fitting.aparam_avg),
-                "aparam_inv_std": to_numpy_array(fitting.aparam_inv_std),
-            }
-
     def test_change_out_bias(self) -> None:
         """change_out_bias should produce consistent bias on dp, pt, and pt_expt.
 
diff --git a/source/tests/consistent/model/test_ener.py b/source/tests/consistent/model/test_ener.py
index 5bcdc0a7c0..abdbe5fe1c 100644
--- a/source/tests/consistent/model/test_ener.py
+++ b/source/tests/consistent/model/test_ener.py
@@ -998,24 +998,6 @@ def test_get_default_fparam(self) -> None:
         np.testing.assert_allclose(dp_val, pt_val, rtol=1e-10, atol=1e-10)
         np.testing.assert_allclose(dp_val, [0.5, -0.3], rtol=1e-10, atol=1e-10)
 
-    def _get_fitting_stats(self, model, backend="dp"):
-        """Extract fparam/aparam stats from a model's fitting net."""
-        fitting = model.get_fitting_net()
-        if backend == "pt":
-            return {
-                "fparam_avg": torch_to_numpy(fitting.fparam_avg),
-                "fparam_inv_std": torch_to_numpy(fitting.fparam_inv_std),
-                "aparam_avg": torch_to_numpy(fitting.aparam_avg),
-                "aparam_inv_std": torch_to_numpy(fitting.aparam_inv_std),
-            }
-        else:
-            return {
-                "fparam_avg": to_numpy_array(fitting.fparam_avg),
-                "fparam_inv_std": to_numpy_array(fitting.fparam_inv_std),
-                "aparam_avg": to_numpy_array(fitting.aparam_avg),
-                "aparam_inv_std": to_numpy_array(fitting.aparam_inv_std),
-            }
-
     def test_change_out_bias(self) -> None:
         """change_out_bias should produce consistent bias on dp, pt, and pt_expt.
 
diff --git a/source/tests/consistent/model/test_polar.py b/source/tests/consistent/model/test_polar.py
index cba3147c53..7bbd5ce8b5 100644
--- a/source/tests/consistent/model/test_polar.py
+++ b/source/tests/consistent/model/test_polar.py
@@ -695,24 +695,6 @@ def test_get_default_fparam(self) -> None:
         np.testing.assert_allclose(dp_val, pt_val, rtol=1e-10, atol=1e-10)
         np.testing.assert_allclose(dp_val, [0.5, -0.3], rtol=1e-10, atol=1e-10)
 
-    def _get_fitting_stats(self, model, backend="dp"):
-        """Extract fparam/aparam stats from a model's fitting net."""
-        fitting = model.get_fitting_net()
-        if backend == "pt":
-            return {
-                "fparam_avg": torch_to_numpy(fitting.fparam_avg),
-                "fparam_inv_std": torch_to_numpy(fitting.fparam_inv_std),
-                "aparam_avg": torch_to_numpy(fitting.aparam_avg),
-                "aparam_inv_std": torch_to_numpy(fitting.aparam_inv_std),
-            }
-        else:
-            return {
-                "fparam_avg": to_numpy_array(fitting.fparam_avg),
-                "fparam_inv_std": to_numpy_array(fitting.fparam_inv_std),
-                "aparam_avg": to_numpy_array(fitting.aparam_avg),
-                "aparam_inv_std": to_numpy_array(fitting.aparam_inv_std),
-            }
-
     def test_change_out_bias(self) -> None:
         """change_out_bias should produce consistent bias on dp, pt, and pt_expt.
 
diff --git a/source/tests/consistent/model/test_property.py b/source/tests/consistent/model/test_property.py
index 65a9d50cc1..77118af210 100644
--- a/source/tests/consistent/model/test_property.py
+++ b/source/tests/consistent/model/test_property.py
@@ -682,24 +682,6 @@ def test_get_default_fparam(self) -> None:
         np.testing.assert_allclose(dp_val, pt_val, rtol=1e-10, atol=1e-10)
         np.testing.assert_allclose(dp_val, [0.5, -0.3], rtol=1e-10, atol=1e-10)
 
-    def _get_fitting_stats(self, model, backend="dp"):
-        """Extract fparam/aparam stats from a model's fitting net."""
-        fitting = model.get_fitting_net()
-        if backend == "pt":
-            return {
-                "fparam_avg": torch_to_numpy(fitting.fparam_avg),
-                "fparam_inv_std": torch_to_numpy(fitting.fparam_inv_std),
-                "aparam_avg": torch_to_numpy(fitting.aparam_avg),
-                "aparam_inv_std": torch_to_numpy(fitting.aparam_inv_std),
-            }
-        else:
-            return {
-                "fparam_avg": to_numpy_array(fitting.fparam_avg),
-                "fparam_inv_std": to_numpy_array(fitting.fparam_inv_std),
-                "aparam_avg": to_numpy_array(fitting.aparam_avg),
-                "aparam_inv_std": to_numpy_array(fitting.aparam_inv_std),
-            }
-
     def test_change_out_bias(self) -> None:
         """change_out_bias should produce consistent bias on dp, pt, and pt_expt.
 

From 15f2af8abf24cbbaeffe3a7c7647852d11efe3a3 Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Wed, 25 Feb 2026 16:30:56 +0800
Subject: [PATCH 39/63] use deep copy

---
 source/tests/consistent/model/test_ener.py | 12 +++++++++---
 1 file changed, 9 insertions(+), 3 deletions(-)

diff --git a/source/tests/consistent/model/test_ener.py b/source/tests/consistent/model/test_ener.py
index 5bcdc0a7c0..cc4c90c250 100644
--- a/source/tests/consistent/model/test_ener.py
+++ b/source/tests/consistent/model/test_ener.py
@@ -1766,9 +1766,15 @@ def test_compute_stat(self) -> None:
             )
 
         # 2. Run compute_or_load_stat on all three backends
-        self.dp_model.compute_or_load_stat(lambda: self.np_sampled)
-        self.pt_model.compute_or_load_stat(lambda: self.pt_sampled)
-        self.pt_expt_model.compute_or_load_stat(lambda: self.np_sampled)
+        # deepcopy because stat.py mutates natoms in-place when atom_exclude_types
+        # is non-empty (natoms[:, 2:] *= type_mask).
+        from copy import (
+            deepcopy,
+        )
+
+        self.dp_model.compute_or_load_stat(lambda: deepcopy(self.np_sampled))
+        self.pt_model.compute_or_load_stat(lambda: deepcopy(self.pt_sampled))
+        self.pt_expt_model.compute_or_load_stat(lambda: deepcopy(self.np_sampled))
 
         # 3. Serialize all three and compare @variables
         dp_ser = self.dp_model.serialize()

From 45403823294203cfd99ab9a7819d566c4458230a Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Thu, 26 Feb 2026 09:39:40 +0800
Subject: [PATCH 40/63] Extracted compare_variables_recursive to
 source/tests/consistent/model/common.py

---
 source/tests/consistent/model/common.py       | 30 +++++++++++++
 source/tests/consistent/model/test_dipole.py  | 43 ++++---------------
 source/tests/consistent/model/test_dos.py     | 43 ++++---------------
 source/tests/consistent/model/test_ener.py    | 43 ++++---------------
 source/tests/consistent/model/test_polar.py   | 43 ++++---------------
 .../tests/consistent/model/test_property.py   | 43 ++++---------------
 .../tests/consistent/model/test_zbl_ener.py   | 43 ++++---------------
 7 files changed, 78 insertions(+), 210 deletions(-)

diff --git a/source/tests/consistent/model/common.py b/source/tests/consistent/model/common.py
index 04966c02a1..3dff24dcba 100644
--- a/source/tests/consistent/model/common.py
+++ b/source/tests/consistent/model/common.py
@@ -3,6 +3,8 @@
     Any,
 )
 
+import numpy as np
+
 from deepmd.common import (
     make_default_mesh,
 )
@@ -145,3 +147,31 @@ def eval_pd_model(self, pd_obj: Any, natoms, coords, atype, box) -> Any:
                 do_atomic_virial=True,
             ).items()
         }
+
+
+def compare_variables_recursive(
+    d1: dict, d2: dict, path: str = "", rtol: float = 1e-10, atol: float = 1e-10
+) -> None:
+    """Recursively compare ``@variables`` sections in two serialized dicts."""
+    for key in d1:
+        if key not in d2:
+            continue
+        child_path = f"{path}/{key}" if path else key
+        v1, v2 = d1[key], d2[key]
+        if key == "@variables" and isinstance(v1, dict) and isinstance(v2, dict):
+            for vk in v1:
+                if vk not in v2:
+                    continue
+                a1 = np.asarray(v1[vk]) if v1[vk] is not None else None
+                a2 = np.asarray(v2[vk]) if v2[vk] is not None else None
+                if a1 is None and a2 is None:
+                    continue
+                np.testing.assert_allclose(
+                    a1,
+                    a2,
+                    rtol=rtol,
+                    atol=atol,
+                    err_msg=f"@variables mismatch at {child_path}/{vk}",
+                )
+        elif isinstance(v1, dict) and isinstance(v2, dict):
+            compare_variables_recursive(v1, v2, child_path, rtol, atol)
diff --git a/source/tests/consistent/model/test_dipole.py b/source/tests/consistent/model/test_dipole.py
index c6c2f01697..76251af6d2 100644
--- a/source/tests/consistent/model/test_dipole.py
+++ b/source/tests/consistent/model/test_dipole.py
@@ -32,6 +32,7 @@
 )
 from .common import (
     ModelTest,
+    compare_variables_recursive,
 )
 
 if INSTALLED_PT:
@@ -1223,34 +1224,6 @@ def test_get_observed_type_list(self) -> None:
         self.assertEqual(dp_observed, ["O"])
 
 
-def _compare_variables_recursive(
-    d1: dict, d2: dict, path: str = "", rtol: float = 1e-10, atol: float = 1e-10
-) -> None:
-    """Recursively compare ``@variables`` sections in two serialized dicts."""
-    for key in d1:
-        if key not in d2:
-            continue
-        child_path = f"{path}/{key}" if path else key
-        v1, v2 = d1[key], d2[key]
-        if key == "@variables" and isinstance(v1, dict) and isinstance(v2, dict):
-            for vk in v1:
-                if vk not in v2:
-                    continue
-                a1 = np.asarray(v1[vk]) if v1[vk] is not None else None
-                a2 = np.asarray(v2[vk]) if v2[vk] is not None else None
-                if a1 is None and a2 is None:
-                    continue
-                np.testing.assert_allclose(
-                    a1,
-                    a2,
-                    rtol=rtol,
-                    atol=atol,
-                    err_msg=f"@variables mismatch at {child_path}/{vk}",
-                )
-        elif isinstance(v1, dict) and isinstance(v2, dict):
-            _compare_variables_recursive(v1, v2, child_path, rtol, atol)
-
-
 @parameterized(
     (([], []), ([[0, 1]], [1])),  # (pair_exclude_types, atom_exclude_types)
     (False, True),  # fparam_in_data
@@ -1466,8 +1439,8 @@ def test_compute_stat(self) -> None:
         dp_ser = self.dp_model.serialize()
         pt_ser = self.pt_model.serialize()
         pe_ser = self.pt_expt_model.serialize()
-        _compare_variables_recursive(dp_ser, pt_ser)
-        _compare_variables_recursive(dp_ser, pe_ser)
+        compare_variables_recursive(dp_ser, pt_ser)
+        compare_variables_recursive(dp_ser, pe_ser)
 
         # 4. Post-stat forward consistency
         # Note: DipoleModel's apply_out_stat is a no-op, so output won't change
@@ -1573,10 +1546,10 @@ def raise_error():
             dp_ser_loaded = dp_model2.serialize()
             pt_ser_loaded = pt_model2.serialize()
             pe_ser_loaded = pe_model2.serialize()
-            _compare_variables_recursive(dp_ser_computed, dp_ser_loaded)
-            _compare_variables_recursive(pt_ser_computed, pt_ser_loaded)
-            _compare_variables_recursive(pe_ser_computed, pe_ser_loaded)
+            compare_variables_recursive(dp_ser_computed, dp_ser_loaded)
+            compare_variables_recursive(pt_ser_computed, pt_ser_loaded)
+            compare_variables_recursive(pe_ser_computed, pe_ser_loaded)
 
             # 5. Cross-backend consistency after loading
-            _compare_variables_recursive(dp_ser_loaded, pt_ser_loaded)
-            _compare_variables_recursive(dp_ser_loaded, pe_ser_loaded)
+            compare_variables_recursive(dp_ser_loaded, pt_ser_loaded)
+            compare_variables_recursive(dp_ser_loaded, pe_ser_loaded)
diff --git a/source/tests/consistent/model/test_dos.py b/source/tests/consistent/model/test_dos.py
index 2068274183..5f801129d4 100644
--- a/source/tests/consistent/model/test_dos.py
+++ b/source/tests/consistent/model/test_dos.py
@@ -32,6 +32,7 @@
 )
 from .common import (
     ModelTest,
+    compare_variables_recursive,
 )
 
 if INSTALLED_PT:
@@ -1212,34 +1213,6 @@ def test_get_observed_type_list(self) -> None:
         self.assertEqual(dp_observed, ["O"])
 
 
-def _compare_variables_recursive(
-    d1: dict, d2: dict, path: str = "", rtol: float = 1e-10, atol: float = 1e-10
-) -> None:
-    """Recursively compare ``@variables`` sections in two serialized dicts."""
-    for key in d1:
-        if key not in d2:
-            continue
-        child_path = f"{path}/{key}" if path else key
-        v1, v2 = d1[key], d2[key]
-        if key == "@variables" and isinstance(v1, dict) and isinstance(v2, dict):
-            for vk in v1:
-                if vk not in v2:
-                    continue
-                a1 = np.asarray(v1[vk]) if v1[vk] is not None else None
-                a2 = np.asarray(v2[vk]) if v2[vk] is not None else None
-                if a1 is None and a2 is None:
-                    continue
-                np.testing.assert_allclose(
-                    a1,
-                    a2,
-                    rtol=rtol,
-                    atol=atol,
-                    err_msg=f"@variables mismatch at {child_path}/{vk}",
-                )
-        elif isinstance(v1, dict) and isinstance(v2, dict):
-            _compare_variables_recursive(v1, v2, child_path, rtol, atol)
-
-
 @parameterized(
     (([], []), ([[0, 1]], [1])),  # (pair_exclude_types, atom_exclude_types)
     (False, True),  # fparam_in_data
@@ -1456,8 +1429,8 @@ def test_compute_stat(self) -> None:
         dp_ser = self.dp_model.serialize()
         pt_ser = self.pt_model.serialize()
         pe_ser = self.pt_expt_model.serialize()
-        _compare_variables_recursive(dp_ser, pt_ser)
-        _compare_variables_recursive(dp_ser, pe_ser)
+        compare_variables_recursive(dp_ser, pt_ser)
+        compare_variables_recursive(dp_ser, pe_ser)
 
         # 4. Post-stat forward consistency
         # DOSModel uses default apply_out_stat (per-atom type bias), so
@@ -1563,10 +1536,10 @@ def raise_error():
             dp_ser_loaded = dp_model2.serialize()
             pt_ser_loaded = pt_model2.serialize()
             pe_ser_loaded = pe_model2.serialize()
-            _compare_variables_recursive(dp_ser_computed, dp_ser_loaded)
-            _compare_variables_recursive(pt_ser_computed, pt_ser_loaded)
-            _compare_variables_recursive(pe_ser_computed, pe_ser_loaded)
+            compare_variables_recursive(dp_ser_computed, dp_ser_loaded)
+            compare_variables_recursive(pt_ser_computed, pt_ser_loaded)
+            compare_variables_recursive(pe_ser_computed, pe_ser_loaded)
 
             # 5. Cross-backend consistency after loading
-            _compare_variables_recursive(dp_ser_loaded, pt_ser_loaded)
-            _compare_variables_recursive(dp_ser_loaded, pe_ser_loaded)
+            compare_variables_recursive(dp_ser_loaded, pt_ser_loaded)
+            compare_variables_recursive(dp_ser_loaded, pe_ser_loaded)
diff --git a/source/tests/consistent/model/test_ener.py b/source/tests/consistent/model/test_ener.py
index b6d1b4c90b..f47365e2cf 100644
--- a/source/tests/consistent/model/test_ener.py
+++ b/source/tests/consistent/model/test_ener.py
@@ -34,6 +34,7 @@
 )
 from .common import (
     ModelTest,
+    compare_variables_recursive,
 )
 
 if INSTALLED_PT:
@@ -1514,34 +1515,6 @@ def test_get_observed_type_list(self) -> None:
         self.assertEqual(dp_observed, ["O"])
 
 
-def _compare_variables_recursive(
-    d1: dict, d2: dict, path: str = "", rtol: float = 1e-10, atol: float = 1e-10
-) -> None:
-    """Recursively compare ``@variables`` sections in two serialized dicts."""
-    for key in d1:
-        if key not in d2:
-            continue
-        child_path = f"{path}/{key}" if path else key
-        v1, v2 = d1[key], d2[key]
-        if key == "@variables" and isinstance(v1, dict) and isinstance(v2, dict):
-            for vk in v1:
-                if vk not in v2:
-                    continue
-                a1 = np.asarray(v1[vk]) if v1[vk] is not None else None
-                a2 = np.asarray(v2[vk]) if v2[vk] is not None else None
-                if a1 is None and a2 is None:
-                    continue
-                np.testing.assert_allclose(
-                    a1,
-                    a2,
-                    rtol=rtol,
-                    atol=atol,
-                    err_msg=f"@variables mismatch at {child_path}/{vk}",
-                )
-        elif isinstance(v1, dict) and isinstance(v2, dict):
-            _compare_variables_recursive(v1, v2, child_path, rtol, atol)
-
-
 @parameterized(
     (([], []), ([[0, 1]], [1])),  # (pair_exclude_types, atom_exclude_types)
     (False, True),  # fparam_in_data
@@ -1762,8 +1735,8 @@ def test_compute_stat(self) -> None:
         dp_ser = self.dp_model.serialize()
         pt_ser = self.pt_model.serialize()
         pe_ser = self.pt_expt_model.serialize()
-        _compare_variables_recursive(dp_ser, pt_ser)
-        _compare_variables_recursive(dp_ser, pe_ser)
+        compare_variables_recursive(dp_ser, pt_ser)
+        compare_variables_recursive(dp_ser, pe_ser)
 
         # 4. Post-stat forward consistency
         dp_ret1 = self._eval_dp()
@@ -1867,10 +1840,10 @@ def raise_error():
             dp_ser_loaded = dp_model2.serialize()
             pt_ser_loaded = pt_model2.serialize()
             pe_ser_loaded = pe_model2.serialize()
-            _compare_variables_recursive(dp_ser_computed, dp_ser_loaded)
-            _compare_variables_recursive(pt_ser_computed, pt_ser_loaded)
-            _compare_variables_recursive(pe_ser_computed, pe_ser_loaded)
+            compare_variables_recursive(dp_ser_computed, dp_ser_loaded)
+            compare_variables_recursive(pt_ser_computed, pt_ser_loaded)
+            compare_variables_recursive(pe_ser_computed, pe_ser_loaded)
 
             # 5. Cross-backend consistency after loading
-            _compare_variables_recursive(dp_ser_loaded, pt_ser_loaded)
-            _compare_variables_recursive(dp_ser_loaded, pe_ser_loaded)
+            compare_variables_recursive(dp_ser_loaded, pt_ser_loaded)
+            compare_variables_recursive(dp_ser_loaded, pe_ser_loaded)
diff --git a/source/tests/consistent/model/test_polar.py b/source/tests/consistent/model/test_polar.py
index 7bbd5ce8b5..93e696596e 100644
--- a/source/tests/consistent/model/test_polar.py
+++ b/source/tests/consistent/model/test_polar.py
@@ -32,6 +32,7 @@
 )
 from .common import (
     ModelTest,
+    compare_variables_recursive,
 )
 
 if INSTALLED_PT:
@@ -1217,34 +1218,6 @@ def test_get_observed_type_list(self) -> None:
         self.assertEqual(dp_observed, ["O"])
 
 
-def _compare_variables_recursive(
-    d1: dict, d2: dict, path: str = "", rtol: float = 1e-10, atol: float = 1e-10
-) -> None:
-    """Recursively compare ``@variables`` sections in two serialized dicts."""
-    for key in d1:
-        if key not in d2:
-            continue
-        child_path = f"{path}/{key}" if path else key
-        v1, v2 = d1[key], d2[key]
-        if key == "@variables" and isinstance(v1, dict) and isinstance(v2, dict):
-            for vk in v1:
-                if vk not in v2:
-                    continue
-                a1 = np.asarray(v1[vk]) if v1[vk] is not None else None
-                a2 = np.asarray(v2[vk]) if v2[vk] is not None else None
-                if a1 is None and a2 is None:
-                    continue
-                np.testing.assert_allclose(
-                    a1,
-                    a2,
-                    rtol=rtol,
-                    atol=atol,
-                    err_msg=f"@variables mismatch at {child_path}/{vk}",
-                )
-        elif isinstance(v1, dict) and isinstance(v2, dict):
-            _compare_variables_recursive(v1, v2, child_path, rtol, atol)
-
-
 @parameterized(
     (([], []), ([[0, 1]], [1])),  # (pair_exclude_types, atom_exclude_types)
     (False, True),  # fparam_in_data
@@ -1460,8 +1433,8 @@ def test_compute_stat(self) -> None:
         dp_ser = self.dp_model.serialize()
         pt_ser = self.pt_model.serialize()
         pe_ser = self.pt_expt_model.serialize()
-        _compare_variables_recursive(dp_ser, pt_ser)
-        _compare_variables_recursive(dp_ser, pe_ser)
+        compare_variables_recursive(dp_ser, pt_ser)
+        compare_variables_recursive(dp_ser, pe_ser)
 
         # 4. Post-stat forward consistency
         # PolarModel's apply_out_stat applies diagonal bias with scale, so
@@ -1567,10 +1540,10 @@ def raise_error():
             dp_ser_loaded = dp_model2.serialize()
             pt_ser_loaded = pt_model2.serialize()
             pe_ser_loaded = pe_model2.serialize()
-            _compare_variables_recursive(dp_ser_computed, dp_ser_loaded)
-            _compare_variables_recursive(pt_ser_computed, pt_ser_loaded)
-            _compare_variables_recursive(pe_ser_computed, pe_ser_loaded)
+            compare_variables_recursive(dp_ser_computed, dp_ser_loaded)
+            compare_variables_recursive(pt_ser_computed, pt_ser_loaded)
+            compare_variables_recursive(pe_ser_computed, pe_ser_loaded)
 
             # 5. Cross-backend consistency after loading
-            _compare_variables_recursive(dp_ser_loaded, pt_ser_loaded)
-            _compare_variables_recursive(dp_ser_loaded, pe_ser_loaded)
+            compare_variables_recursive(dp_ser_loaded, pt_ser_loaded)
+            compare_variables_recursive(dp_ser_loaded, pe_ser_loaded)
diff --git a/source/tests/consistent/model/test_property.py b/source/tests/consistent/model/test_property.py
index 77118af210..cf4f7f1de9 100644
--- a/source/tests/consistent/model/test_property.py
+++ b/source/tests/consistent/model/test_property.py
@@ -31,6 +31,7 @@
 )
 from .common import (
     ModelTest,
+    compare_variables_recursive,
 )
 
 if INSTALLED_PT:
@@ -1209,34 +1210,6 @@ def test_get_observed_type_list(self) -> None:
         self.assertEqual(dp_observed, ["O", "H"])
 
 
-def _compare_variables_recursive(
-    d1: dict, d2: dict, path: str = "", rtol: float = 1e-10, atol: float = 1e-10
-) -> None:
-    """Recursively compare ``@variables`` sections in two serialized dicts."""
-    for key in d1:
-        if key not in d2:
-            continue
-        child_path = f"{path}/{key}" if path else key
-        v1, v2 = d1[key], d2[key]
-        if key == "@variables" and isinstance(v1, dict) and isinstance(v2, dict):
-            for vk in v1:
-                if vk not in v2:
-                    continue
-                a1 = np.asarray(v1[vk]) if v1[vk] is not None else None
-                a2 = np.asarray(v2[vk]) if v2[vk] is not None else None
-                if a1 is None and a2 is None:
-                    continue
-                np.testing.assert_allclose(
-                    a1,
-                    a2,
-                    rtol=rtol,
-                    atol=atol,
-                    err_msg=f"@variables mismatch at {child_path}/{vk}",
-                )
-        elif isinstance(v1, dict) and isinstance(v2, dict):
-            _compare_variables_recursive(v1, v2, child_path, rtol, atol)
-
-
 @parameterized(
     (([], []), ([[0, 1]], [1])),  # (pair_exclude_types, atom_exclude_types)
     (False, True),  # fparam_in_data
@@ -1453,8 +1426,8 @@ def test_compute_stat(self) -> None:
         dp_ser = self.dp_model.serialize()
         pt_ser = self.pt_model.serialize()
         pe_ser = self.pt_expt_model.serialize()
-        _compare_variables_recursive(dp_ser, pt_ser)
-        _compare_variables_recursive(dp_ser, pe_ser)
+        compare_variables_recursive(dp_ser, pt_ser)
+        compare_variables_recursive(dp_ser, pe_ser)
 
         # 4. Post-stat forward consistency
         # PropertyModel's apply_out_stat applies output * std + bias, so
@@ -1560,10 +1533,10 @@ def raise_error():
             dp_ser_loaded = dp_model2.serialize()
             pt_ser_loaded = pt_model2.serialize()
             pe_ser_loaded = pe_model2.serialize()
-            _compare_variables_recursive(dp_ser_computed, dp_ser_loaded)
-            _compare_variables_recursive(pt_ser_computed, pt_ser_loaded)
-            _compare_variables_recursive(pe_ser_computed, pe_ser_loaded)
+            compare_variables_recursive(dp_ser_computed, dp_ser_loaded)
+            compare_variables_recursive(pt_ser_computed, pt_ser_loaded)
+            compare_variables_recursive(pe_ser_computed, pe_ser_loaded)
 
             # 5. Cross-backend consistency after loading
-            _compare_variables_recursive(dp_ser_loaded, pt_ser_loaded)
-            _compare_variables_recursive(dp_ser_loaded, pe_ser_loaded)
+            compare_variables_recursive(dp_ser_loaded, pt_ser_loaded)
+            compare_variables_recursive(dp_ser_loaded, pe_ser_loaded)
diff --git a/source/tests/consistent/model/test_zbl_ener.py b/source/tests/consistent/model/test_zbl_ener.py
index e7e0eb8a27..0cf907bee2 100644
--- a/source/tests/consistent/model/test_zbl_ener.py
+++ b/source/tests/consistent/model/test_zbl_ener.py
@@ -34,6 +34,7 @@
 )
 from .common import (
     ModelTest,
+    compare_variables_recursive,
 )
 
 if INSTALLED_PT:
@@ -1017,34 +1018,6 @@ def test_get_observed_type_list(self) -> None:
         self.assertEqual(dp_observed, ["O"])
 
 
-def _compare_variables_recursive(
-    d1: dict, d2: dict, path: str = "", rtol: float = 1e-10, atol: float = 1e-10
-) -> None:
-    """Recursively compare ``@variables`` sections in two serialized dicts."""
-    for key in d1:
-        if key not in d2:
-            continue
-        child_path = f"{path}/{key}" if path else key
-        v1, v2 = d1[key], d2[key]
-        if key == "@variables" and isinstance(v1, dict) and isinstance(v2, dict):
-            for vk in v1:
-                if vk not in v2:
-                    continue
-                a1 = np.asarray(v1[vk]) if v1[vk] is not None else None
-                a2 = np.asarray(v2[vk]) if v2[vk] is not None else None
-                if a1 is None and a2 is None:
-                    continue
-                np.testing.assert_allclose(
-                    a1,
-                    a2,
-                    rtol=rtol,
-                    atol=atol,
-                    err_msg=f"@variables mismatch at {child_path}/{vk}",
-                )
-        elif isinstance(v1, dict) and isinstance(v2, dict):
-            _compare_variables_recursive(v1, v2, child_path, rtol, atol)
-
-
 @parameterized(
     (([], []), ([[0, 1]], [1])),  # (pair_exclude_types, atom_exclude_types)
 )
@@ -1237,8 +1210,8 @@ def test_compute_stat(self) -> None:
         dp_ser = self.dp_model.serialize()
         pt_ser = self.pt_model.serialize()
         pe_ser = self.pt_expt_model.serialize()
-        _compare_variables_recursive(dp_ser, pt_ser)
-        _compare_variables_recursive(dp_ser, pe_ser)
+        compare_variables_recursive(dp_ser, pt_ser)
+        compare_variables_recursive(dp_ser, pe_ser)
 
         # 4. Post-stat forward consistency
         dp_ret1 = self._eval_dp()
@@ -1323,10 +1296,10 @@ def raise_error():
             dp_ser_loaded = dp_model2.serialize()
             pt_ser_loaded = pt_model2.serialize()
             pe_ser_loaded = pe_model2.serialize()
-            _compare_variables_recursive(dp_ser_computed, dp_ser_loaded)
-            _compare_variables_recursive(pt_ser_computed, pt_ser_loaded)
-            _compare_variables_recursive(pe_ser_computed, pe_ser_loaded)
+            compare_variables_recursive(dp_ser_computed, dp_ser_loaded)
+            compare_variables_recursive(pt_ser_computed, pt_ser_loaded)
+            compare_variables_recursive(pe_ser_computed, pe_ser_loaded)
 
             # 5. Cross-backend consistency after loading
-            _compare_variables_recursive(dp_ser_loaded, pt_ser_loaded)
-            _compare_variables_recursive(dp_ser_loaded, pe_ser_loaded)
+            compare_variables_recursive(dp_ser_loaded, pt_ser_loaded)
+            compare_variables_recursive(dp_ser_loaded, pe_ser_loaded)

From 9427d25d1cd7c626bb6d430150e0e9de6c3e40af Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Thu, 26 Feb 2026 11:49:46 +0800
Subject: [PATCH 41/63] fix: remove dead code and redundant assignments in
 dpmodel atomic models

  Remove unused  parameter from PairTabAtomicModel and
  redundant  assignments already handled by BaseAtomicModel.__init__.
---
 deepmd/dpmodel/atomic_model/dp_atomic_model.py      | 1 -
 deepmd/dpmodel/atomic_model/pairtab_atomic_model.py | 4 ----
 2 files changed, 5 deletions(-)

diff --git a/deepmd/dpmodel/atomic_model/dp_atomic_model.py b/deepmd/dpmodel/atomic_model/dp_atomic_model.py
index a02536b18b..cdbba4b40e 100644
--- a/deepmd/dpmodel/atomic_model/dp_atomic_model.py
+++ b/deepmd/dpmodel/atomic_model/dp_atomic_model.py
@@ -54,7 +54,6 @@ def __init__(
         **kwargs: Any,
     ) -> None:
         super().__init__(type_map, **kwargs)
-        self.type_map = type_map
         self.descriptor = descriptor
         self.fitting_net = fitting
         if hasattr(self.fitting_net, "reinit_exclude"):
diff --git a/deepmd/dpmodel/atomic_model/pairtab_atomic_model.py b/deepmd/dpmodel/atomic_model/pairtab_atomic_model.py
index 11156e9f93..39797e0532 100644
--- a/deepmd/dpmodel/atomic_model/pairtab_atomic_model.py
+++ b/deepmd/dpmodel/atomic_model/pairtab_atomic_model.py
@@ -71,20 +71,16 @@ def __init__(
         sel: int | list[int],
         type_map: list[str],
         rcond: float | None = None,
-        atom_ener: list[float] | None = None,
         **kwargs: Any,
     ) -> None:
         super().__init__(type_map, **kwargs)
         super().init_out_stat()
         self.tab_file = tab_file
         self.rcut = rcut
-        self.type_map = type_map
 
         self.tab = PairTab(self.tab_file, rcut=rcut)
-        self.type_map = type_map
         self.ntypes = len(type_map)
         self.rcond = rcond
-        self.atom_ener = atom_ener
 
         if self.tab_file is not None:
             tab_info, tab_data = self.tab.get()

From 4af1245e5bb84f65121c6b7f392f336633907300 Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Thu, 26 Feb 2026 16:07:33 +0800
Subject: [PATCH 42/63] feat(pt_expt): add training infrastructure using
 DeepmdDataSystem

  Add training support to the pt_expt backend. The training loop uses
  DeepmdDataSystem (numpy batch provider) instead of pt's DpLoaderSet,
  converting numpy batches to torch tensors at the boundary.

  New files:
  - train/training.py: Trainer class (single-task, single-GPU)
  - train/wrapper.py: ModelWrapper wrapping model + loss
  - utils/stat.py: make_stat_input adaptor for DeepmdDataSystem
  - model/get_model.py: model factory using pt_expt registries
  - entrypoints/main.py: CLI entrypoint (dp --pt-expt train)

  Also fixes:
  - Use object.__new__(cls) in make_base_descriptor/fitting/model
    __new__ to avoid TypeError when pt_expt classes (which inherit
    from dpmodel's BD, not pt_expt's BD) are resolved via the registry.
  - Point pt_expt backend entry_point_hook to its own main, and fix
    backend name to PyTorch-Exportable so lowered name matches
    the registered alias.
---
 deepmd/backend/pt_expt.py                     |   4 +-
 .../descriptor/make_base_descriptor.py        |   2 +-
 deepmd/dpmodel/fitting/make_base_fitting.py   |   2 +-
 deepmd/dpmodel/model/base_model.py            |   2 +-
 deepmd/pt_expt/entrypoints/__init__.py        |   1 +
 deepmd/pt_expt/entrypoints/main.py            | 201 +++++++
 deepmd/pt_expt/model/__init__.py              |   4 +
 deepmd/pt_expt/model/get_model.py             | 119 +++++
 deepmd/pt_expt/train/__init__.py              |   1 +
 deepmd/pt_expt/train/training.py              | 502 ++++++++++++++++++
 deepmd/pt_expt/train/wrapper.py               |  85 +++
 deepmd/pt_expt/utils/stat.py                  |  85 +++
 source/tests/pt_expt/test_training.py         | 212 ++++++++
 13 files changed, 1215 insertions(+), 5 deletions(-)
 create mode 100644 deepmd/pt_expt/entrypoints/__init__.py
 create mode 100644 deepmd/pt_expt/entrypoints/main.py
 create mode 100644 deepmd/pt_expt/model/get_model.py
 create mode 100644 deepmd/pt_expt/train/__init__.py
 create mode 100644 deepmd/pt_expt/train/training.py
 create mode 100644 deepmd/pt_expt/train/wrapper.py
 create mode 100644 deepmd/pt_expt/utils/stat.py
 create mode 100644 source/tests/pt_expt/test_training.py

diff --git a/deepmd/backend/pt_expt.py b/deepmd/backend/pt_expt.py
index ade9eb51f3..61a7151208 100644
--- a/deepmd/backend/pt_expt.py
+++ b/deepmd/backend/pt_expt.py
@@ -32,7 +32,7 @@
 class PyTorchExportableBackend(Backend):
     """PyTorch exportable backend."""
 
-    name = "PyTorch Exportable"
+    name = "PyTorch-Exportable"
     """The formal name of the backend."""
     features: ClassVar[Backend.Feature] = (
         Backend.Feature.ENTRY_POINT
@@ -63,7 +63,7 @@ def entry_point_hook(self) -> Callable[["Namespace"], None]:
         Callable[[Namespace], None]
             The entry point hook of the backend.
         """
-        from deepmd.pt.entrypoints.main import main as deepmd_main
+        from deepmd.pt_expt.entrypoints.main import main as deepmd_main
 
         return deepmd_main
 
diff --git a/deepmd/dpmodel/descriptor/make_base_descriptor.py b/deepmd/dpmodel/descriptor/make_base_descriptor.py
index f87ca2c5b6..cfef017180 100644
--- a/deepmd/dpmodel/descriptor/make_base_descriptor.py
+++ b/deepmd/dpmodel/descriptor/make_base_descriptor.py
@@ -51,7 +51,7 @@ class BD(ABC, PluginVariant, make_plugin_registry("descriptor")):
         def __new__(cls, *args: Any, **kwargs: Any) -> Any:
             if cls is BD:
                 cls = cls.get_class_by_type(j_get_type(kwargs, cls.__name__))
-            return super().__new__(cls)
+            return object.__new__(cls)
 
         @abstractmethod
         def get_rcut(self) -> float:
diff --git a/deepmd/dpmodel/fitting/make_base_fitting.py b/deepmd/dpmodel/fitting/make_base_fitting.py
index 7b65a150b2..cf8172bd03 100644
--- a/deepmd/dpmodel/fitting/make_base_fitting.py
+++ b/deepmd/dpmodel/fitting/make_base_fitting.py
@@ -42,7 +42,7 @@ class BF(ABC, PluginVariant, make_plugin_registry("fitting")):
         def __new__(cls: type, *args: Any, **kwargs: Any) -> Any:
             if cls is BF:
                 cls = cls.get_class_by_type(j_get_type(kwargs, cls.__name__))
-            return super().__new__(cls)
+            return object.__new__(cls)
 
         @abstractmethod
         def output_def(self) -> FittingOutputDef:
diff --git a/deepmd/dpmodel/model/base_model.py b/deepmd/dpmodel/model/base_model.py
index d87c0eb5b7..b89172c4f6 100644
--- a/deepmd/dpmodel/model/base_model.py
+++ b/deepmd/dpmodel/model/base_model.py
@@ -42,7 +42,7 @@ def __new__(cls, *args: Any, **kwargs: Any) -> "BaseModel":
                 if model_type == "standard":
                     model_type = kwargs.get("fitting", {}).get("type", "ener")
                 cls = cls.get_class_by_type(model_type)
-            return super().__new__(cls)
+            return object.__new__(cls)
 
         @abstractmethod
         def __call__(self, *args: Any, **kwds: Any) -> Any:
diff --git a/deepmd/pt_expt/entrypoints/__init__.py b/deepmd/pt_expt/entrypoints/__init__.py
new file mode 100644
index 0000000000..6ceb116d85
--- /dev/null
+++ b/deepmd/pt_expt/entrypoints/__init__.py
@@ -0,0 +1 @@
+# SPDX-License-Identifier: LGPL-3.0-or-later
diff --git a/deepmd/pt_expt/entrypoints/main.py b/deepmd/pt_expt/entrypoints/main.py
new file mode 100644
index 0000000000..a0b814f07a
--- /dev/null
+++ b/deepmd/pt_expt/entrypoints/main.py
@@ -0,0 +1,201 @@
+# SPDX-License-Identifier: LGPL-3.0-or-later
+"""Training entrypoint for the pt_expt backend."""
+
+import argparse
+import json
+import logging
+from pathlib import (
+    Path,
+)
+from typing import (
+    Any,
+)
+
+import h5py
+
+from deepmd.pt_expt.train import (
+    training,
+)
+from deepmd.utils.argcheck import (
+    normalize,
+)
+from deepmd.utils.compat import (
+    update_deepmd_input,
+)
+from deepmd.utils.data_system import (
+    DeepmdDataSystem,
+    get_data,
+    process_systems,
+)
+from deepmd.utils.path import (
+    DPPath,
+)
+
+log = logging.getLogger(__name__)
+
+
+def get_trainer(
+    config: dict[str, Any],
+    init_model: str | None = None,
+    restart_model: str | None = None,
+) -> training.Trainer:
+    """Build a :class:`training.Trainer` from a normalised config."""
+    model_params = config["model"]
+    training_params = config["training"]
+    type_map = model_params["type_map"]
+
+    # ----- training data ------------------------------------------------
+    training_dataset_params = training_params["training_data"]
+    training_systems = process_systems(
+        training_dataset_params["systems"],
+        patterns=training_dataset_params.get("rglob_patterns", None),
+    )
+    train_data = DeepmdDataSystem(
+        systems=training_systems,
+        batch_size=training_dataset_params["batch_size"],
+        test_size=1,
+        type_map=type_map,
+        trn_all_set=True,
+        sys_probs=training_dataset_params.get("sys_probs", None),
+        auto_prob_style=training_dataset_params.get("auto_prob", "prob_sys_size"),
+    )
+
+    # ----- validation data ----------------------------------------------
+    validation_data = None
+    validation_dataset_params = training_params.get("validation_data", None)
+    if validation_dataset_params is not None:
+        val_systems = process_systems(
+            validation_dataset_params["systems"],
+            patterns=validation_dataset_params.get("rglob_patterns", None),
+        )
+        validation_data = DeepmdDataSystem(
+            systems=val_systems,
+            batch_size=validation_dataset_params["batch_size"],
+            test_size=1,
+            type_map=type_map,
+            trn_all_set=True,
+        )
+
+    # ----- stat file path -----------------------------------------------
+    stat_file_path = training_params.get("stat_file", None)
+    if stat_file_path is not None:
+        if not Path(stat_file_path).exists():
+            if stat_file_path.endswith((".h5", ".hdf5")):
+                with h5py.File(stat_file_path, "w"):
+                    pass
+            else:
+                Path(stat_file_path).mkdir()
+        stat_file_path = DPPath(stat_file_path, "a")
+
+    trainer = training.Trainer(
+        config,
+        train_data,
+        stat_file_path=stat_file_path,
+        validation_data=validation_data,
+        init_model=init_model,
+        restart_model=restart_model,
+    )
+    return trainer
+
+
+def train(
+    input_file: str,
+    init_model: str | None = None,
+    restart: str | None = None,
+    skip_neighbor_stat: bool = False,
+    output: str = "out.json",
+) -> None:
+    """Run training with the pt_expt backend.
+
+    Parameters
+    ----------
+    input_file : str
+        Path to the JSON configuration file.
+    init_model : str or None
+        Path to a checkpoint to initialise weights from.
+    restart : str or None
+        Path to a checkpoint to restart training from.
+    skip_neighbor_stat : bool
+        Skip neighbour statistics calculation.
+    output : str
+        Where to dump the normalised config.
+    """
+    from deepmd.common import (
+        j_loader,
+    )
+
+    log.info("Configuration path: %s", input_file)
+    config = j_loader(input_file)
+
+    # suffix fix
+    if init_model is not None and not init_model.endswith(".pt"):
+        init_model += ".pt"
+    if restart is not None and not restart.endswith(".pt"):
+        restart += ".pt"
+
+    # argcheck
+    config = update_deepmd_input(config, warning=True, dump="input_v2_compat.json")
+    config = normalize(config)
+
+    # neighbour stat
+    if not skip_neighbor_stat:
+        log.info(
+            "Calculate neighbor statistics... "
+            "(add --skip-neighbor-stat to skip this step)"
+        )
+        type_map = config["model"].get("type_map")
+        train_data = get_data(config["training"]["training_data"], 0, type_map, None)
+        from deepmd.pt_expt.model import (
+            BaseModel,
+        )
+
+        config["model"], _min_nbor_dist = BaseModel.update_sel(
+            train_data, type_map, config["model"]
+        )
+
+    with open(output, "w") as fp:
+        json.dump(config, fp, indent=4)
+
+    trainer = get_trainer(config, init_model, restart)
+    trainer.run()
+
+
+def main(args: list[str] | argparse.Namespace | None = None) -> None:
+    """Entry point for the pt_expt backend CLI.
+
+    Parameters
+    ----------
+    args : list[str] | argparse.Namespace | None
+        Command-line arguments or pre-parsed namespace.
+    """
+    from deepmd.loggers.loggers import (
+        set_log_handles,
+    )
+    from deepmd.main import (
+        parse_args,
+    )
+
+    if not isinstance(args, argparse.Namespace):
+        FLAGS = parse_args(args=args)
+    else:
+        FLAGS = args
+
+    set_log_handles(
+        FLAGS.log_level,
+        Path(FLAGS.log_path) if FLAGS.log_path else None,
+        mpi_log=None,
+    )
+    log.info("DeePMD-kit backend: pt_expt (PyTorch Exportable)")
+
+    if FLAGS.command == "train":
+        train(
+            input_file=FLAGS.INPUT,
+            init_model=FLAGS.init_model,
+            restart=FLAGS.restart,
+            skip_neighbor_stat=FLAGS.skip_neighbor_stat,
+            output=FLAGS.output,
+        )
+    else:
+        raise RuntimeError(
+            f"Unsupported command '{FLAGS.command}' for the pt_expt backend."
+        )
diff --git a/deepmd/pt_expt/model/__init__.py b/deepmd/pt_expt/model/__init__.py
index da120091e0..7b3f7cdeab 100644
--- a/deepmd/pt_expt/model/__init__.py
+++ b/deepmd/pt_expt/model/__init__.py
@@ -11,6 +11,9 @@
 from .ener_model import (
     EnergyModel,
 )
+from .get_model import (
+    get_model,
+)
 from .model import (
     BaseModel,
 )
@@ -29,4 +32,5 @@
     "EnergyModel",
     "PolarModel",
     "PropertyModel",
+    "get_model",
 ]
diff --git a/deepmd/pt_expt/model/get_model.py b/deepmd/pt_expt/model/get_model.py
new file mode 100644
index 0000000000..9d4296a50b
--- /dev/null
+++ b/deepmd/pt_expt/model/get_model.py
@@ -0,0 +1,119 @@
+# SPDX-License-Identifier: LGPL-3.0-or-later
+"""Model factory for the pt_expt backend.
+
+Mirrors ``deepmd.dpmodel.model.model`` but uses the pt_expt
+``BaseDescriptor`` / ``BaseFitting`` registries so that the
+constructed objects are ``torch.nn.Module`` subclasses.
+"""
+
+import copy
+from typing import (
+    Any,
+)
+
+from deepmd.pt_expt.descriptor import (
+    BaseDescriptor,
+)
+from deepmd.pt_expt.fitting import (
+    BaseFitting,
+)
+
+# Import from submodules directly to avoid circular import via __init__.py
+from deepmd.pt_expt.model.dipole_model import (
+    DipoleModel,
+)
+from deepmd.pt_expt.model.dos_model import (
+    DOSModel,
+)
+from deepmd.pt_expt.model.ener_model import (
+    EnergyModel,
+)
+from deepmd.pt_expt.model.model import (
+    BaseModel,
+)
+from deepmd.pt_expt.model.polar_model import (
+    PolarModel,
+)
+from deepmd.pt_expt.model.property_model import (
+    PropertyModel,
+)
+
+
+def _get_standard_model_components(
+    data: dict[str, Any],
+    ntypes: int,
+) -> tuple:
+    """Build descriptor and fitting from config dict."""
+    # descriptor
+    data["descriptor"]["ntypes"] = ntypes
+    data["descriptor"]["type_map"] = copy.deepcopy(data["type_map"])
+    descriptor = BaseDescriptor(**data["descriptor"])
+
+    # fitting
+    fitting_net = data.get("fitting_net", {})
+    fitting_net["type"] = fitting_net.get("type", "ener")
+    fitting_net["ntypes"] = descriptor.get_ntypes()
+    fitting_net["type_map"] = copy.deepcopy(data["type_map"])
+    fitting_net["mixed_types"] = descriptor.mixed_types()
+    if fitting_net["type"] in ["dipole", "polar"]:
+        fitting_net["embedding_width"] = descriptor.get_dim_emb()
+    fitting_net["dim_descrpt"] = descriptor.get_dim_out()
+    grad_force = "direct" not in fitting_net["type"]
+    if not grad_force:
+        fitting_net["out_dim"] = descriptor.get_dim_emb()
+        if "ener" in fitting_net["type"]:
+            fitting_net["return_energy"] = True
+    fitting = BaseFitting(**fitting_net)
+    return descriptor, fitting, fitting_net["type"]
+
+
+def get_standard_model(data: dict) -> EnergyModel:
+    """Get a standard model from a config dictionary.
+
+    Parameters
+    ----------
+    data : dict
+        The data to construct the model.
+    """
+    data = copy.deepcopy(data)
+    ntypes = len(data["type_map"])
+    descriptor, fitting, fitting_net_type = _get_standard_model_components(data, ntypes)
+    atom_exclude_types = data.get("atom_exclude_types", [])
+    pair_exclude_types = data.get("pair_exclude_types", [])
+
+    if fitting_net_type == "dipole":
+        modelcls = DipoleModel
+    elif fitting_net_type == "polar":
+        modelcls = PolarModel
+    elif fitting_net_type == "dos":
+        modelcls = DOSModel
+    elif fitting_net_type in ["ener", "direct_force_ener"]:
+        modelcls = EnergyModel
+    elif fitting_net_type == "property":
+        modelcls = PropertyModel
+    else:
+        raise RuntimeError(f"Unknown fitting type: {fitting_net_type}")
+
+    model = modelcls(
+        descriptor=descriptor,
+        fitting=fitting,
+        type_map=data["type_map"],
+        atom_exclude_types=atom_exclude_types,
+        pair_exclude_types=pair_exclude_types,
+    )
+    return model
+
+
+def get_model(data: dict) -> BaseModel:
+    """Get a model from a config dictionary.
+
+    Parameters
+    ----------
+    data : dict
+        The data to construct the model.
+    """
+    model_type = data.get("type", "standard")
+    if model_type == "standard":
+        return get_standard_model(data)
+    else:
+        return BaseModel.get_class_by_type(model_type).get_model(data)
diff --git a/deepmd/pt_expt/train/__init__.py b/deepmd/pt_expt/train/__init__.py
new file mode 100644
index 0000000000..6ceb116d85
--- /dev/null
+++ b/deepmd/pt_expt/train/__init__.py
@@ -0,0 +1 @@
+# SPDX-License-Identifier: LGPL-3.0-or-later
diff --git a/deepmd/pt_expt/train/training.py b/deepmd/pt_expt/train/training.py
new file mode 100644
index 0000000000..6628d3e10e
--- /dev/null
+++ b/deepmd/pt_expt/train/training.py
@@ -0,0 +1,502 @@
+# SPDX-License-Identifier: LGPL-3.0-or-later
+"""Training loop for the pt_expt backend.
+
+Uses ``DeepmdDataSystem`` (numpy-based batch provider) instead of the
+pt backend's ``DpLoaderSet`` + ``DataLoader``.  NumPy batches are
+converted to torch tensors at the boundary.
+"""
+
+import functools
+import logging
+import time
+from copy import (
+    deepcopy,
+)
+from pathlib import (
+    Path,
+)
+from typing import (
+    Any,
+)
+
+import numpy as np
+import torch
+
+from deepmd.dpmodel.utils.learning_rate import (
+    LearningRateExp,
+)
+from deepmd.loggers.training import (
+    format_training_message_per_task,
+)
+from deepmd.pt.loss import (
+    EnergyHessianStdLoss,
+    EnergyStdLoss,
+    TaskLoss,
+)
+from deepmd.pt_expt.model import (
+    get_model,
+)
+from deepmd.pt_expt.train.wrapper import (
+    ModelWrapper,
+)
+from deepmd.pt_expt.utils.env import (
+    DEVICE,
+    GLOBAL_PT_FLOAT_PRECISION,
+)
+from deepmd.pt_expt.utils.stat import (
+    make_stat_input,
+)
+from deepmd.utils.data import (
+    DataRequirementItem,
+)
+from deepmd.utils.data_system import (
+    DeepmdDataSystem,
+)
+from deepmd.utils.path import (
+    DPPath,
+)
+
+log = logging.getLogger(__name__)
+
+
+# ---------------------------------------------------------------------------
+# Helper: loss factory (reused from pt)
+# ---------------------------------------------------------------------------
+
+
+def get_loss(
+    loss_params: dict[str, Any],
+    start_lr: float,
+    _ntypes: int,
+    _model: Any,
+) -> TaskLoss:
+    loss_type = loss_params.get("type", "ener")
+    if loss_type == "ener" and loss_params.get("start_pref_h", 0.0) > 0.0:
+        loss_params["starter_learning_rate"] = start_lr
+        return EnergyHessianStdLoss(**loss_params)
+    elif loss_type == "ener":
+        loss_params["starter_learning_rate"] = start_lr
+        return EnergyStdLoss(**loss_params)
+    else:
+        loss_params["starter_learning_rate"] = start_lr
+        return TaskLoss.get_class_by_type(loss_type).get_loss(loss_params)
+
+
+def get_additional_data_requirement(_model: Any) -> list[DataRequirementItem]:
+    additional_data_requirement: list[DataRequirementItem] = []
+    if _model.get_dim_fparam() > 0:
+        additional_data_requirement.append(
+            DataRequirementItem(
+                "fparam",
+                _model.get_dim_fparam(),
+                atomic=False,
+                must=False,
+                default=0.0,
+            )
+        )
+    if _model.get_dim_aparam() > 0:
+        additional_data_requirement.append(
+            DataRequirementItem(
+                "aparam", _model.get_dim_aparam(), atomic=True, must=True
+            )
+        )
+    return additional_data_requirement
+
+
+# ---------------------------------------------------------------------------
+# Trainer
+# ---------------------------------------------------------------------------
+
+
+class Trainer:
+    """Training driver for the pt_expt backend.
+
+    Uses ``DeepmdDataSystem`` for data loading (numpy batches converted
+    to torch tensors at the boundary).  Single-task, single-GPU only.
+
+    Parameters
+    ----------
+    config : dict
+        Full training configuration.
+    training_data : DeepmdDataSystem
+        Training data.
+    stat_file_path : DPPath or None
+        Path for saving / loading statistics.
+    validation_data : DeepmdDataSystem or None
+        Validation data.
+    init_model : str or None
+        Path to a checkpoint to initialise weights from.
+    restart_model : str or None
+        Path to a checkpoint to *restart* training from (restores step + optimiser).
+    """
+
+    def __init__(
+        self,
+        config: dict[str, Any],
+        training_data: DeepmdDataSystem,
+        stat_file_path: DPPath | None = None,
+        validation_data: DeepmdDataSystem | None = None,
+        init_model: str | None = None,
+        restart_model: str | None = None,
+    ) -> None:
+        resume_model = init_model or restart_model
+        resuming = resume_model is not None
+        self.restart_training = restart_model is not None
+
+        model_params = config["model"]
+        training_params = config["training"]
+
+        # Iteration config
+        self.num_steps = training_params["numb_steps"]
+        self.disp_file = training_params.get("disp_file", "lcurve.out")
+        self.disp_freq = training_params.get("disp_freq", 1000)
+        self.save_ckpt = training_params.get("save_ckpt", "model.ckpt")
+        self.save_freq = training_params.get("save_freq", 1000)
+        self.display_in_training = training_params.get("disp_training", True)
+        self.timing_in_training = training_params.get("time_training", True)
+        self.lcurve_should_print_header = True
+
+        # Model ---------------------------------------------------------------
+        self.model = get_model(deepcopy(model_params)).to(DEVICE)
+
+        # Loss ----------------------------------------------------------------
+        self.loss = get_loss(
+            config.get("loss", {}),
+            config["learning_rate"]["start_lr"],
+            len(model_params["type_map"]),
+            self.model,
+        )
+
+        # Data requirements ---------------------------------------------------
+        data_requirement = self.loss.label_requirement
+        data_requirement += get_additional_data_requirement(self.model)
+        training_data.add_data_requirements(data_requirement)
+        if validation_data is not None:
+            validation_data.add_data_requirements(data_requirement)
+
+        self.training_data = training_data
+        self.validation_data = validation_data
+        self.valid_numb_batch = training_params.get("validation_data", {}).get(
+            "numb_btch", 1
+        )
+
+        # Statistics ----------------------------------------------------------
+        data_stat_nbatch = model_params.get("data_stat_nbatch", 10)
+
+        @functools.lru_cache
+        def get_sample() -> list[dict[str, np.ndarray]]:
+            return make_stat_input(training_data, data_stat_nbatch)
+
+        if not resuming:
+            self.model.compute_or_load_stat(
+                sampled_func=get_sample,
+                stat_file_path=stat_file_path,
+            )
+
+        # Learning rate -------------------------------------------------------
+        lr_params = config["learning_rate"].copy()
+        lr_params["stop_steps"] = self.num_steps
+        self.lr_schedule = LearningRateExp(**lr_params)
+
+        # Gradient clipping
+        self.gradient_max_norm = training_params.get("gradient_max_norm", 0.0)
+
+        # Model wrapper -------------------------------------------------------
+        self.wrapper = ModelWrapper(self.model, self.loss, model_params=model_params)
+        self.start_step = 0
+
+        # Optimiser -----------------------------------------------------------
+        opt_type = training_params.get("opt_type", "Adam")
+        initial_lr = float(self.lr_schedule.value(self.start_step))
+
+        if opt_type == "Adam":
+            self.optimizer = torch.optim.Adam(self.wrapper.parameters(), lr=initial_lr)
+        elif opt_type == "AdamW":
+            weight_decay = training_params.get("weight_decay", 0.001)
+            self.optimizer = torch.optim.AdamW(
+                self.wrapper.parameters(),
+                lr=initial_lr,
+                weight_decay=weight_decay,
+            )
+        else:
+            raise ValueError(f"Unsupported optimizer type: {opt_type}")
+
+        self.scheduler = torch.optim.lr_scheduler.LambdaLR(
+            self.optimizer,
+            lambda step: self.lr_schedule.value(step + self.start_step) / initial_lr,
+            last_epoch=self.start_step - 1,
+        )
+
+        # Resume --------------------------------------------------------------
+        if resuming:
+            log.info(f"Resuming from {resume_model}.")
+            state_dict = torch.load(
+                resume_model, map_location=DEVICE, weights_only=True
+            )
+            if "model" in state_dict:
+                optimizer_state_dict = (
+                    state_dict["optimizer"] if self.restart_training else None
+                )
+                state_dict = state_dict["model"]
+            else:
+                optimizer_state_dict = None
+
+            self.start_step = (
+                state_dict["_extra_state"]["train_infos"]["step"]
+                if self.restart_training
+                else 0
+            )
+            self.wrapper.load_state_dict(state_dict)
+            if optimizer_state_dict is not None:
+                self.optimizer.load_state_dict(optimizer_state_dict)
+                # rebuild scheduler from the resumed step
+                self.scheduler = torch.optim.lr_scheduler.LambdaLR(
+                    self.optimizer,
+                    lambda step: (
+                        self.lr_schedule.value(step + self.start_step) / initial_lr
+                    ),
+                    last_epoch=self.start_step - 1,
+                )
+
+    # ------------------------------------------------------------------
+    # Data helpers
+    # ------------------------------------------------------------------
+
+    def get_data(
+        self,
+        is_train: bool = True,
+    ) -> tuple[dict[str, Any], dict[str, Any]]:
+        """Fetch a batch and split into input / label dicts.
+
+        Returns
+        -------
+        input_dict, label_dict
+        """
+        data_sys = self.training_data if is_train else self.validation_data
+        if data_sys is None:
+            return {}, {}
+
+        batch = data_sys.get_batch()  # numpy dict
+
+        input_keys = {"coord", "box", "fparam", "aparam"}
+        input_dict: dict[str, Any] = {}
+        label_dict: dict[str, Any] = {}
+
+        natoms = batch["type"].shape[-1]
+
+        for key, val in batch.items():
+            if key == "type":
+                # rename to atype; convert to int64 tensor
+                input_dict["atype"] = torch.from_numpy(val.astype(np.int64)).to(DEVICE)
+            elif key == "coord":
+                # reshape from [nf, natoms*3] → [nf, natoms, 3]
+                t = torch.from_numpy(val.copy()).to(
+                    dtype=GLOBAL_PT_FLOAT_PRECISION, device=DEVICE
+                )
+                # requires_grad needed for force computation via autograd
+                input_dict["coord"] = t.reshape(-1, natoms, 3).requires_grad_(True)
+            elif key == "box":
+                if val is not None:
+                    t = torch.from_numpy(val).to(
+                        dtype=GLOBAL_PT_FLOAT_PRECISION, device=DEVICE
+                    )
+                    input_dict["box"] = t.reshape(-1, 3, 3)
+                else:
+                    input_dict["box"] = None
+            elif key in input_keys:
+                if val is not None and isinstance(val, np.ndarray):
+                    input_dict[key] = torch.from_numpy(val).to(
+                        dtype=GLOBAL_PT_FLOAT_PRECISION, device=DEVICE
+                    )
+            elif key in ("natoms_vec", "default_mesh", "sid", "fid"):
+                continue
+            elif "find_" in key:
+                # find_energy, find_force, … — keep as float scalar
+                label_dict[key] = float(val) if not isinstance(val, float) else val
+            elif key == "force":
+                # [nf, natoms*3] → [nf, natoms, 3]
+                t = torch.from_numpy(val).to(
+                    dtype=GLOBAL_PT_FLOAT_PRECISION, device=DEVICE
+                )
+                label_dict["force"] = t.reshape(-1, natoms, 3)
+            else:
+                if isinstance(val, np.ndarray):
+                    label_dict[key] = torch.from_numpy(val).to(
+                        dtype=GLOBAL_PT_FLOAT_PRECISION, device=DEVICE
+                    )
+                else:
+                    label_dict[key] = val
+
+        return input_dict, label_dict
+
+    # ------------------------------------------------------------------
+    # Checkpointing
+    # ------------------------------------------------------------------
+
+    def save_checkpoint(self, step: int) -> None:
+        self.wrapper.train_infos["step"] = step
+        state = {
+            "model": self.wrapper.state_dict(),
+            "optimizer": self.optimizer.state_dict(),
+        }
+        ckpt_path = f"{self.save_ckpt}-{step}.pt"
+        torch.save(state, ckpt_path)
+        # symlink latest
+        latest = Path(f"{self.save_ckpt}.pt")
+        if latest.is_symlink() or latest.exists():
+            latest.unlink()
+        latest.symlink_to(ckpt_path)
+        log.info(f"Saved checkpoint to {ckpt_path}")
+
+    # ------------------------------------------------------------------
+    # Training loop
+    # ------------------------------------------------------------------
+
+    def run(self) -> None:
+        fout = open(
+            self.disp_file,
+            mode="w" if not self.restart_training else "a",
+            buffering=1,
+        )
+        log.info("Start to train %d steps.", self.num_steps)
+
+        self.wrapper.train()
+
+        for step_id in range(self.start_step, self.num_steps):
+            cur_lr = float(self.lr_schedule.value(step_id))
+
+            if self.timing_in_training:
+                t_start = time.time()
+
+            # --- forward / backward ---
+            self.optimizer.zero_grad(set_to_none=True)
+            input_dict, label_dict = self.get_data(is_train=True)
+
+            cur_lr_sched = self.scheduler.get_last_lr()[0]
+            model_pred, loss, more_loss = self.wrapper(
+                **input_dict, cur_lr=cur_lr_sched, label=label_dict
+            )
+            loss.backward()
+
+            if self.gradient_max_norm > 0.0:
+                torch.nn.utils.clip_grad_norm_(
+                    self.wrapper.parameters(), self.gradient_max_norm
+                )
+
+            self.optimizer.step()
+            self.scheduler.step()
+
+            if self.timing_in_training:
+                t_end = time.time()
+
+            # --- display ---
+            display_step_id = step_id + 1
+            if self.display_in_training and (
+                display_step_id % self.disp_freq == 0 or display_step_id == 1
+            ):
+                self.wrapper.eval()
+
+                train_results = {k: v for k, v in more_loss.items() if "l2_" not in k}
+
+                # validation
+                valid_results: dict[str, Any] = {}
+                if self.validation_data is not None:
+                    sum_natoms = 0
+                    for _ii in range(self.valid_numb_batch):
+                        val_input, val_label = self.get_data(is_train=False)
+                        if not val_input:
+                            break
+                        _, _vloss, _vmore = self.wrapper(
+                            **val_input, cur_lr=cur_lr_sched, label=val_label
+                        )
+                        natoms = int(val_input["atype"].shape[-1])
+                        sum_natoms += natoms
+                        for k, v in _vmore.items():
+                            if "l2_" not in k:
+                                valid_results[k] = (
+                                    valid_results.get(k, 0.0) + v * natoms
+                                )
+                    if sum_natoms > 0:
+                        valid_results = {
+                            k: v / sum_natoms for k, v in valid_results.items()
+                        }
+
+                # log
+                log.info(
+                    format_training_message_per_task(
+                        batch=display_step_id,
+                        task_name="trn",
+                        rmse=train_results,
+                        learning_rate=cur_lr,
+                    )
+                )
+                if valid_results:
+                    log.info(
+                        format_training_message_per_task(
+                            batch=display_step_id,
+                            task_name="val",
+                            rmse=valid_results,
+                            learning_rate=None,
+                        )
+                    )
+
+                # lcurve file
+                if self.lcurve_should_print_header:
+                    self.print_header(fout, train_results, valid_results)
+                    self.lcurve_should_print_header = False
+                self.print_on_training(
+                    fout, display_step_id, cur_lr, train_results, valid_results
+                )
+
+                self.wrapper.train()
+
+            # --- checkpoint ---
+            if display_step_id % self.save_freq == 0:
+                self.save_checkpoint(display_step_id)
+
+        # final save
+        self.save_checkpoint(self.num_steps)
+        fout.close()
+        log.info("Training finished.")
+
+    # ------------------------------------------------------------------
+    # Printing helpers
+    # ------------------------------------------------------------------
+
+    def print_header(
+        self,
+        fout: Any,
+        train_results: dict[str, Any],
+        valid_results: dict[str, Any],
+    ) -> None:
+        train_keys = sorted(train_results.keys())
+        header = "# {:5s}".format("step")
+        if valid_results:
+            for k in train_keys:
+                header += f"   {k + '_val':>11s} {k + '_trn':>11s}"
+        else:
+            for k in train_keys:
+                header += f"   {k + '_trn':>11s}"
+        header += "   {:8s}\n".format("lr")
+        fout.write(header)
+        fout.flush()
+
+    def print_on_training(
+        self,
+        fout: Any,
+        step_id: int,
+        cur_lr: float,
+        train_results: dict,
+        valid_results: dict,
+    ) -> None:
+        train_keys = sorted(train_results.keys())
+        line = f"{step_id:7d}"
+        if valid_results:
+            for k in train_keys:
+                line += f"   {valid_results.get(k, float('nan')):11.2e} {train_results[k]:11.2e}"
+        else:
+            for k in train_keys:
+                line += f"   {train_results[k]:11.2e}"
+        line += f"   {cur_lr:8.1e}\n"
+        fout.write(line)
+        fout.flush()
diff --git a/deepmd/pt_expt/train/wrapper.py b/deepmd/pt_expt/train/wrapper.py
new file mode 100644
index 0000000000..d646cb79ab
--- /dev/null
+++ b/deepmd/pt_expt/train/wrapper.py
@@ -0,0 +1,85 @@
+# SPDX-License-Identifier: LGPL-3.0-or-later
+import logging
+from typing import (
+    Any,
+)
+
+import torch
+
+log = logging.getLogger(__name__)
+
+
+class ModelWrapper(torch.nn.Module):
+    """Simplified model wrapper that bundles a model and a loss.
+
+    Single-task only for now (no multi-task support).
+
+    Parameters
+    ----------
+    model : torch.nn.Module
+        The model to train.
+    loss : torch.nn.Module
+        The loss module.
+    model_params : dict, optional
+        Model parameters to store as extra state.
+    """
+
+    def __init__(
+        self,
+        model: torch.nn.Module,
+        loss: torch.nn.Module | None = None,
+        model_params: dict[str, Any] | None = None,
+    ) -> None:
+        super().__init__()
+        self.model_params = model_params if model_params is not None else {}
+        self.train_infos: dict[str, Any] = {
+            "lr": 0,
+            "step": 0,
+        }
+        self.model = model
+        self.loss = loss
+        self.inference_only = self.loss is None
+
+    def forward(
+        self,
+        coord: torch.Tensor,
+        atype: torch.Tensor,
+        box: torch.Tensor | None = None,
+        fparam: torch.Tensor | None = None,
+        aparam: torch.Tensor | None = None,
+        cur_lr: float | torch.Tensor | None = None,
+        label: dict[str, torch.Tensor] | None = None,
+        do_atomic_virial: bool = False,
+    ) -> tuple[dict[str, torch.Tensor], torch.Tensor | None, dict | None]:
+        input_dict = {
+            "coord": coord,
+            "atype": atype,
+            "box": box,
+            "do_atomic_virial": do_atomic_virial,
+            "fparam": fparam,
+            "aparam": aparam,
+        }
+
+        if self.inference_only or label is None:
+            model_pred = self.model(**input_dict)
+            return model_pred, None, None
+        else:
+            natoms = atype.shape[-1]
+            model_pred, loss, more_loss = self.loss(
+                input_dict,
+                self.model,
+                label,
+                natoms=natoms,
+                learning_rate=cur_lr,
+            )
+            return model_pred, loss, more_loss
+
+    def set_extra_state(self, state: dict) -> None:
+        self.model_params = state.get("model_params", {})
+        self.train_infos = state.get("train_infos", {"lr": 0, "step": 0})
+
+    def get_extra_state(self) -> dict:
+        return {
+            "model_params": self.model_params,
+            "train_infos": self.train_infos,
+        }
diff --git a/deepmd/pt_expt/utils/stat.py b/deepmd/pt_expt/utils/stat.py
new file mode 100644
index 0000000000..50044f8028
--- /dev/null
+++ b/deepmd/pt_expt/utils/stat.py
@@ -0,0 +1,85 @@
+# SPDX-License-Identifier: LGPL-3.0-or-later
+import logging
+
+import numpy as np
+
+from deepmd.utils.data_system import (
+    DeepmdDataSystem,
+)
+from deepmd.utils.model_stat import make_stat_input as _make_stat_input_raw
+
+log = logging.getLogger(__name__)
+
+
+def make_stat_input(
+    data: DeepmdDataSystem,
+    nbatches: int,
+) -> list[dict[str, np.ndarray]]:
+    """Pack data for statistics using DeepmdDataSystem.
+
+    Collects *nbatches* batches from each system and concatenates them
+    into a single dict per system.  The returned format matches the
+    ``list[dict[str, np.ndarray]]`` expected by
+    ``compute_or_load_stat``.
+
+    Parameters
+    ----------
+    data : DeepmdDataSystem
+        The multi-system data manager.
+    nbatches : int
+        Number of batches to collect per system.
+
+    Returns
+    -------
+    list[dict[str, np.ndarray]]
+        Per-system dicts with concatenated numpy arrays.
+    """
+    # Reuse the shared helper with merge_sys=False so that data is
+    # grouped by system:  all_stat[key][sys_idx] = [batch0, batch1, ...]
+    all_stat = _make_stat_input_raw(data, nbatches, merge_sys=False)
+
+    nsystems = data.get_nsystems()
+    log.info(f"Packing data for statistics from {nsystems} systems")
+
+    # Transpose dict-of-lists-of-lists → list-of-dicts and concatenate
+    # batches within each system.
+    keys = list(all_stat.keys())
+    lst: list[dict[str, np.ndarray]] = []
+    for ii in range(nsystems):
+        merged: dict[str, np.ndarray] = {}
+        for key in keys:
+            vals = all_stat[key][ii]  # list of batch arrays for this system
+            if isinstance(vals[0], np.ndarray):
+                if vals[0].ndim >= 2:
+                    # 2D+ arrays (e.g. coord [nf, natoms*3]) — concat along axis 0
+                    merged[key] = np.concatenate(vals, axis=0)
+                else:
+                    # 1D arrays (e.g. natoms_vec [2+ntypes]) — per-system
+                    # constant, just keep one copy
+                    merged[key] = vals[0]
+            else:
+                # scalar flags like find_*
+                merged[key] = vals[0]
+
+        # DeepmdDataSystem.get_batch() uses "type" but the stat system
+        # (env_mat_stat, compute_output_stats, etc.) expects "atype".
+        if "type" in merged and "atype" not in merged:
+            merged["atype"] = merged.pop("type")
+
+        # Reshape coord from [nf, natoms*3] → [nf, natoms, 3]
+        if "atype" in merged and "coord" in merged:
+            natoms = merged["atype"].shape[-1]
+            merged["coord"] = merged["coord"].reshape(-1, natoms, 3)
+
+        # Provide "natoms" from "natoms_vec" (expected by stat system).
+        # natoms_vec from get_batch() is 1D [2+ntypes], but
+        # compute_output_stats expects 2D [nframes, 2+ntypes].
+        if "natoms_vec" in merged and "natoms" not in merged:
+            nv = merged["natoms_vec"]
+            if nv.ndim == 1:
+                nframes = merged["coord"].shape[0]
+                nv = np.tile(nv, (nframes, 1))
+            merged["natoms"] = nv
+
+        lst.append(merged)
+    return lst
diff --git a/source/tests/pt_expt/test_training.py b/source/tests/pt_expt/test_training.py
new file mode 100644
index 0000000000..4299b10f19
--- /dev/null
+++ b/source/tests/pt_expt/test_training.py
@@ -0,0 +1,212 @@
+# SPDX-License-Identifier: LGPL-3.0-or-later
+"""Smoke test for the pt_expt training infrastructure.
+
+Verifies that:
+1. ``get_model`` constructs a model from config
+2. ``make_stat_input`` + ``compute_or_load_stat`` work
+3. A few training steps run without error
+4. Loss decreases over those steps
+"""
+
+import os
+import shutil
+import tempfile
+import unittest
+
+import torch
+
+from deepmd.utils.argcheck import (
+    normalize,
+)
+from deepmd.utils.compat import (
+    update_deepmd_input,
+)
+
+torch = torch  # ensure torch is imported before pt_expt
+
+from deepmd.pt_expt.entrypoints.main import (
+    get_trainer,
+)
+from deepmd.pt_expt.model import (
+    get_model,
+)
+
+EXAMPLE_DIR = os.path.join(
+    os.path.dirname(__file__),
+    "..",
+    "..",
+    "..",
+    "examples",
+    "water",
+)
+
+
+def _make_config(data_dir: str, numb_steps: int = 20) -> dict:
+    """Build a minimal config dict pointing at *data_dir*."""
+    config = {
+        "model": {
+            "type_map": ["O", "H"],
+            "descriptor": {
+                "type": "se_e2_a",
+                "sel": [46, 92],
+                "rcut_smth": 0.50,
+                "rcut": 6.00,
+                "neuron": [25, 50, 100],
+                "resnet_dt": False,
+                "axis_neuron": 16,
+                "seed": 1,
+            },
+            "fitting_net": {
+                "neuron": [240, 240, 240],
+                "resnet_dt": True,
+                "seed": 1,
+            },
+            "data_stat_nbatch": 2,
+        },
+        "learning_rate": {
+            "type": "exp",
+            "decay_steps": 500,
+            "start_lr": 0.001,
+            "stop_lr": 3.51e-8,
+        },
+        "loss": {
+            "type": "ener",
+            "start_pref_e": 0.02,
+            "limit_pref_e": 1,
+            "start_pref_f": 1000,
+            "limit_pref_f": 1,
+            "start_pref_v": 0,
+            "limit_pref_v": 0,
+        },
+        "training": {
+            "training_data": {
+                "systems": [
+                    os.path.join(data_dir, "data_0"),
+                    os.path.join(data_dir, "data_1"),
+                    os.path.join(data_dir, "data_2"),
+                ],
+                "batch_size": 1,
+            },
+            "validation_data": {
+                "systems": [
+                    os.path.join(data_dir, "data_3"),
+                ],
+                "batch_size": 1,
+                "numb_btch": 1,
+            },
+            "numb_steps": numb_steps,
+            "seed": 10,
+            "disp_file": "lcurve.out",
+            "disp_freq": 5,
+            "save_freq": numb_steps,
+        },
+    }
+    return config
+
+
+class TestTraining(unittest.TestCase):
+    """Basic smoke test for the pt_expt training loop."""
+
+    @classmethod
+    def setUpClass(cls) -> None:
+        data_dir = os.path.join(EXAMPLE_DIR, "data")
+        if not os.path.isdir(data_dir):
+            raise unittest.SkipTest(f"Example data not found: {data_dir}")
+        cls.data_dir = data_dir
+
+    def test_get_model(self) -> None:
+        """Test that get_model constructs a model from config."""
+        config = _make_config(self.data_dir)
+        config = update_deepmd_input(config, warning=False)
+        config = normalize(config)
+        model = get_model(config["model"])
+        # model should be a torch.nn.Module
+        self.assertIsInstance(model, torch.nn.Module)
+        # should have parameters
+        nparams = sum(p.numel() for p in model.parameters())
+        self.assertGreater(nparams, 0)
+
+    def test_training_loop(self) -> None:
+        """Run a few training steps and check loss decreases."""
+        nsteps = 20
+        config = _make_config(self.data_dir, numb_steps=nsteps)
+        config = update_deepmd_input(config, warning=False)
+        config = normalize(config)
+
+        tmpdir = tempfile.mkdtemp(prefix="pt_expt_train_")
+        try:
+            old_cwd = os.getcwd()
+            os.chdir(tmpdir)
+            try:
+                trainer = get_trainer(config)
+
+                # Collect losses over training
+                losses = []
+                orig_step = trainer.run.__code__
+
+                # Instead of monkey-patching, just run and check the lcurve
+                trainer.run()
+
+                # Read lcurve to verify training ran
+                lcurve_path = os.path.join(tmpdir, "lcurve.out")
+                self.assertTrue(os.path.exists(lcurve_path), "lcurve.out not created")
+
+                with open(lcurve_path) as f:
+                    lines = [l for l in f.readlines() if not l.startswith("#")]
+                self.assertGreater(len(lines), 0, "lcurve.out is empty")
+
+                # Verify checkpoint was saved
+                ckpt_files = [f for f in os.listdir(tmpdir) if f.endswith(".pt")]
+                self.assertGreater(len(ckpt_files), 0, "No checkpoint files saved")
+            finally:
+                os.chdir(old_cwd)
+        finally:
+            shutil.rmtree(tmpdir, ignore_errors=True)
+
+
+class TestGetData(unittest.TestCase):
+    """Test the batch data conversion in Trainer.get_data."""
+
+    @classmethod
+    def setUpClass(cls) -> None:
+        data_dir = os.path.join(EXAMPLE_DIR, "data")
+        if not os.path.isdir(data_dir):
+            raise unittest.SkipTest(f"Example data not found: {data_dir}")
+        cls.data_dir = data_dir
+
+    def test_batch_shapes(self) -> None:
+        """Verify input/label shapes from get_data."""
+        config = _make_config(self.data_dir, numb_steps=5)
+        config = update_deepmd_input(config, warning=False)
+        config = normalize(config)
+
+        tmpdir = tempfile.mkdtemp(prefix="pt_expt_getdata_")
+        try:
+            old_cwd = os.getcwd()
+            os.chdir(tmpdir)
+            try:
+                trainer = get_trainer(config)
+                input_dict, label_dict = trainer.get_data(is_train=True)
+
+                # coord should be [nf, natoms, 3]
+                self.assertEqual(len(input_dict["coord"].shape), 3)
+                self.assertEqual(input_dict["coord"].shape[-1], 3)
+
+                # atype should be [nf, natoms]
+                self.assertEqual(len(input_dict["atype"].shape), 2)
+
+                # force label should be [nf, natoms, 3]
+                if "force" in label_dict:
+                    self.assertEqual(len(label_dict["force"].shape), 3)
+                    self.assertEqual(label_dict["force"].shape[-1], 3)
+
+                # energy label should exist
+                self.assertIn("energy", label_dict)
+            finally:
+                os.chdir(old_cwd)
+        finally:
+            shutil.rmtree(tmpdir, ignore_errors=True)
+
+
+if __name__ == "__main__":
+    unittest.main()

From 8be14bf70a16542c6cb552cce1697b6dd666bbf6 Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Thu, 26 Feb 2026 16:15:51 +0800
Subject: [PATCH 43/63] fix bug in test

---
 deepmd/pt_expt/train/training.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/deepmd/pt_expt/train/training.py b/deepmd/pt_expt/train/training.py
index 6628d3e10e..81843383c7 100644
--- a/deepmd/pt_expt/train/training.py
+++ b/deepmd/pt_expt/train/training.py
@@ -195,7 +195,7 @@ def get_sample() -> list[dict[str, np.ndarray]]:
 
         # Learning rate -------------------------------------------------------
         lr_params = config["learning_rate"].copy()
-        lr_params["stop_steps"] = self.num_steps
+        lr_params["num_steps"] = self.num_steps
         self.lr_schedule = LearningRateExp(**lr_params)
 
         # Gradient clipping

From f3e1b905b69a20bd05eac2a46880de1fbe98e733 Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Thu, 26 Feb 2026 18:12:43 +0800
Subject: [PATCH 44/63] enable model compile. print wall-time in stdout

---
 deepmd/pt_expt/train/training.py      | 226 +++++++++++++++++++++++++-
 deepmd/utils/argcheck.py              |  12 ++
 source/tests/pt_expt/test_training.py |  47 +++---
 3 files changed, 262 insertions(+), 23 deletions(-)

diff --git a/deepmd/pt_expt/train/training.py b/deepmd/pt_expt/train/training.py
index 81843383c7..22f3db59e6 100644
--- a/deepmd/pt_expt/train/training.py
+++ b/deepmd/pt_expt/train/training.py
@@ -227,6 +227,20 @@ def get_sample() -> list[dict[str, np.ndarray]]:
             last_epoch=self.start_step - 1,
         )
 
+        # torch.compile -------------------------------------------------------
+        # The model's forward uses torch.autograd.grad (for forces) with
+        # create_graph=True so the loss backward can differentiate through
+        # forces.  torch.compile does not support this "double backward".
+        #
+        # Solution: use make_fx to trace the model forward, which decomposes
+        # torch.autograd.grad into primitive ops.  The resulting traced
+        # module is then compiled by torch.compile — no double backward.
+        self.enable_compile = training_params.get("enable_compile", False)
+        if self.enable_compile:
+            compile_opts = training_params.get("compile_options", {})
+            log.info("Compiling model with torch.compile (%s)", compile_opts)
+            self._compile_model(compile_opts)
+
         # Resume --------------------------------------------------------------
         if resuming:
             log.info(f"Resuming from {resume_model}.")
@@ -258,6 +272,201 @@ def get_sample() -> list[dict[str, np.ndarray]]:
                     last_epoch=self.start_step - 1,
                 )
 
+    # ------------------------------------------------------------------
+    # torch.compile helpers
+    # ------------------------------------------------------------------
+
+    def _compile_model(self, compile_opts: dict[str, Any]) -> None:
+        """Replace ``self.model`` with a compiled version.
+
+        The model's ``forward`` uses ``torch.autograd.grad`` (for force
+        computation) with ``create_graph=True``, which creates a "double
+        backward" that ``torch.compile`` cannot handle.
+
+        Solution: use ``forward_lower_exportable`` (``make_fx`` trace) to
+        decompose ``torch.autograd.grad`` into primitive ops.  The coord
+        extension + nlist build (which contain data-dependent control flow)
+        are kept outside the compiled region.  The traced ``forward_lower``
+        module is then compiled by ``torch.compile``.
+        """
+        from deepmd.dpmodel.utils.nlist import (
+            build_neighbor_list,
+            extend_coord_with_ghosts,
+        )
+        from deepmd.dpmodel.utils.region import (
+            normalize_coord,
+        )
+
+        model = self.model
+
+        # --- Build sample extended inputs for tracing ---
+        sample_input, _ = self.get_data(is_train=True)
+        coord = sample_input["coord"].detach()
+        atype = sample_input["atype"].detach()
+        box = sample_input.get("box")
+        if box is not None:
+            box = box.detach()
+
+        nframes, nloc = atype.shape[:2]
+        coord_np = coord.cpu().numpy().reshape(nframes, nloc, 3)
+        atype_np = atype.cpu().numpy()
+        box_np = box.cpu().numpy().reshape(nframes, 9) if box is not None else None
+
+        if box_np is not None:
+            coord_norm = normalize_coord(coord_np, box_np.reshape(nframes, 3, 3))
+        else:
+            coord_norm = coord_np
+
+        ext_coord_np, ext_atype_np, mapping_np = extend_coord_with_ghosts(
+            coord_norm, atype_np, box_np, model.get_rcut()
+        )
+        nlist_np = build_neighbor_list(
+            ext_coord_np,
+            ext_atype_np,
+            nloc,
+            model.get_rcut(),
+            model.get_sel(),
+            distinguish_types=False,
+        )
+        ext_coord_np = ext_coord_np.reshape(nframes, -1, 3)
+
+        ext_coord = torch.tensor(
+            ext_coord_np, dtype=GLOBAL_PT_FLOAT_PRECISION, device=DEVICE
+        )
+        ext_atype = torch.tensor(ext_atype_np, dtype=torch.int64, device=DEVICE)
+        nlist_t = torch.tensor(nlist_np, dtype=torch.int64, device=DEVICE)
+        mapping_t = torch.tensor(mapping_np, dtype=torch.int64, device=DEVICE)
+        fparam = sample_input.get("fparam")
+        aparam = sample_input.get("aparam")
+
+        # --- Trace forward_lower with make_fx ---
+        # Tracing must happen in eval mode (create_graph=False) to avoid
+        # double-backward complexity that make_fx cannot handle.
+        # The traced module still produces correct force *values*; we just
+        # don't need create_graph=True because torch.compile handles the
+        # backward pass through the traced primitive ops.
+        #
+        # Use tracing_mode="symbolic" so that nall (number of extended
+        # atoms) is treated as a dynamic dimension — different batches may
+        # have different numbers of ghost atoms.
+        from torch.fx.experimental.proxy_tensor import (
+            make_fx,
+        )
+
+        model.eval()
+
+        def fn(
+            extended_coord: torch.Tensor,
+            extended_atype: torch.Tensor,
+            nlist: torch.Tensor,
+            mapping: torch.Tensor | None,
+            fparam: torch.Tensor | None,
+            aparam: torch.Tensor | None,
+        ) -> dict[str, torch.Tensor]:
+            extended_coord = extended_coord.detach().requires_grad_(True)
+            return model.forward_lower(
+                extended_coord,
+                extended_atype,
+                nlist,
+                mapping,
+                fparam=fparam,
+                aparam=aparam,
+            )
+
+        traced_lower = make_fx(
+            fn,
+            tracing_mode="symbolic",
+            _allow_non_fake_inputs=True,
+        )(ext_coord, ext_atype, nlist_t, mapping_t, fparam, aparam)
+        model.train()
+
+        # --- Compile the traced module ---
+        # nall (number of extended atoms) varies per batch, so enable
+        # dynamic shapes to avoid recompilation on every shape change.
+        compile_opts.setdefault("dynamic", True)
+        compiled_lower = torch.compile(traced_lower, **compile_opts)
+
+        # --- Build a wrapper that does coord-extension then compiled lower ---
+        class _CompiledModel(torch.nn.Module):
+            """Thin wrapper: coord extension (untraced) → compiled forward_lower."""
+
+            def __init__(
+                self,
+                original_model: torch.nn.Module,
+                compiled_forward_lower: torch.nn.Module,
+            ) -> None:
+                super().__init__()
+                self.original_model = original_model
+                self.compiled_forward_lower = compiled_forward_lower
+
+            def forward(
+                self,
+                coord: torch.Tensor,
+                atype: torch.Tensor,
+                box: torch.Tensor | None = None,
+                fparam: torch.Tensor | None = None,
+                aparam: torch.Tensor | None = None,
+                do_atomic_virial: bool = False,
+            ) -> dict[str, torch.Tensor]:
+                nframes, nloc = atype.shape[:2]
+                rcut = self.original_model.get_rcut()
+                sel = self.original_model.get_sel()
+
+                # coord extension + nlist (data-dependent, run in eager on device)
+                coord_3d = coord.detach().reshape(nframes, nloc, 3)
+                box_flat = box.detach().reshape(nframes, 9) if box is not None else None
+
+                if box_flat is not None:
+                    coord_norm = normalize_coord(
+                        coord_3d, box_flat.reshape(nframes, 3, 3)
+                    )
+                else:
+                    coord_norm = coord_3d
+
+                ext_coord, ext_atype, mapping = extend_coord_with_ghosts(
+                    coord_norm, atype, box_flat, rcut
+                )
+                nlist = build_neighbor_list(
+                    ext_coord,
+                    ext_atype,
+                    nloc,
+                    rcut,
+                    sel,
+                    distinguish_types=False,
+                )
+                ext_coord = ext_coord.reshape(nframes, -1, 3)
+                ext_coord = ext_coord.detach().requires_grad_(True)
+
+                # compiled forward_lower (autograd decomposed, no double backward)
+                result = self.compiled_forward_lower(
+                    ext_coord,
+                    ext_atype,
+                    nlist,
+                    mapping,
+                    fparam,
+                    aparam,
+                )
+
+                # Translate forward_lower keys → forward keys
+                out: dict[str, torch.Tensor] = {}
+                out["atom_energy"] = result["atom_energy"]
+                out["energy"] = result["energy"]
+                if "extended_force" in result:
+                    # extract local atoms only: [nf, nall, 3] → [nf, nloc, 3]
+                    out["force"] = result["extended_force"][:, :nloc, :]
+                if "virial" in result:
+                    out["virial"] = result["virial"]
+                if "extended_virial" in result:
+                    out["extended_virial"] = result["extended_virial"]
+                if "atom_virial" in result:
+                    out["atom_virial"] = result["atom_virial"]
+                if "mask" in result:
+                    out["mask"] = result["mask"]
+                return out
+
+        self.wrapper.model = _CompiledModel(model, compiled_lower)
+        log.info("Model traced with make_fx and compiled with torch.compile.")
+
     # ------------------------------------------------------------------
     # Data helpers
     # ------------------------------------------------------------------
@@ -361,6 +570,7 @@ def run(self) -> None:
         log.info("Start to train %d steps.", self.num_steps)
 
         self.wrapper.train()
+        wall_start = time.time()
 
         for step_id in range(self.start_step, self.num_steps):
             cur_lr = float(self.lr_schedule.value(step_id))
@@ -421,6 +631,19 @@ def run(self) -> None:
                             k: v / sum_natoms for k, v in valid_results.items()
                         }
 
+                # wall-clock time
+                wall_elapsed = time.time() - wall_start
+                if self.timing_in_training:
+                    step_time = t_end - t_start
+                    log.info(
+                        "step=%d  wall=%.2fs  step_time=%.4fs",
+                        display_step_id,
+                        wall_elapsed,
+                        step_time,
+                    )
+                else:
+                    log.info("step=%d  wall=%.2fs", display_step_id, wall_elapsed)
+
                 # log
                 log.info(
                     format_training_message_per_task(
@@ -456,8 +679,9 @@ def run(self) -> None:
 
         # final save
         self.save_checkpoint(self.num_steps)
+        wall_total = time.time() - wall_start
         fout.close()
-        log.info("Training finished.")
+        log.info("Training finished. Total wall time: %.2fs", wall_total)
 
     # ------------------------------------------------------------------
     # Printing helpers
diff --git a/deepmd/utils/argcheck.py b/deepmd/utils/argcheck.py
index eaa0892369..f227b65175 100644
--- a/deepmd/utils/argcheck.py
+++ b/deepmd/utils/argcheck.py
@@ -41,6 +41,7 @@
 
 doc_only_tf_supported = "(Supported Backend: TensorFlow) "
 doc_only_pt_supported = "(Supported Backend: PyTorch) "
+doc_only_pt_expt_supported = "(Supported Backend: PyTorch Exportable) "
 doc_only_pd_supported = "(Supported Backend: Paddle) "
 # descriptors
 doc_loc_frame = "Defines a local frame at each atom, and the compute the descriptor as local coordinates under this frame."
@@ -3617,6 +3618,17 @@ def training_args(
             default=0,
             doc=doc_only_pt_supported + doc_zero_stage,
         ),
+        Argument(
+            "enable_compile",
+            bool,
+            optional=True,
+            default=False,
+            doc=doc_only_pt_expt_supported
+            + "Enable torch.compile to accelerate training. "
+            "Uses make_fx to decompose autograd into primitive ops, "
+            "then compiles with torch.compile/Inductor for kernel fusion. "
+            "The first training step will be slower due to one-time compilation.",
+        ),
     ]
     variants = [
         Variant(
diff --git a/source/tests/pt_expt/test_training.py b/source/tests/pt_expt/test_training.py
index 4299b10f19..8b3198bf96 100644
--- a/source/tests/pt_expt/test_training.py
+++ b/source/tests/pt_expt/test_training.py
@@ -41,27 +41,28 @@
 )
 
 
-def _make_config(data_dir: str, numb_steps: int = 20) -> dict:
+def _make_config(data_dir: str, numb_steps: int = 5) -> dict:
     """Build a minimal config dict pointing at *data_dir*."""
     config = {
         "model": {
             "type_map": ["O", "H"],
             "descriptor": {
                 "type": "se_e2_a",
-                "sel": [46, 92],
+                "sel": [6, 12],
                 "rcut_smth": 0.50,
-                "rcut": 6.00,
-                "neuron": [25, 50, 100],
+                "rcut": 3.00,
+                "neuron": [8, 16],
                 "resnet_dt": False,
-                "axis_neuron": 16,
+                "axis_neuron": 4,
+                "type_one_side": True,
                 "seed": 1,
             },
             "fitting_net": {
-                "neuron": [240, 240, 240],
+                "neuron": [16, 16],
                 "resnet_dt": True,
                 "seed": 1,
             },
-            "data_stat_nbatch": 2,
+            "data_stat_nbatch": 1,
         },
         "learning_rate": {
             "type": "exp",
@@ -82,8 +83,6 @@ def _make_config(data_dir: str, numb_steps: int = 20) -> dict:
             "training_data": {
                 "systems": [
                     os.path.join(data_dir, "data_0"),
-                    os.path.join(data_dir, "data_1"),
-                    os.path.join(data_dir, "data_2"),
                 ],
                 "batch_size": 1,
             },
@@ -126,25 +125,14 @@ def test_get_model(self) -> None:
         nparams = sum(p.numel() for p in model.parameters())
         self.assertGreater(nparams, 0)
 
-    def test_training_loop(self) -> None:
-        """Run a few training steps and check loss decreases."""
-        nsteps = 20
-        config = _make_config(self.data_dir, numb_steps=nsteps)
-        config = update_deepmd_input(config, warning=False)
-        config = normalize(config)
-
+    def _run_training(self, config: dict) -> None:
+        """Run training and verify lcurve + checkpoint creation."""
         tmpdir = tempfile.mkdtemp(prefix="pt_expt_train_")
         try:
             old_cwd = os.getcwd()
             os.chdir(tmpdir)
             try:
                 trainer = get_trainer(config)
-
-                # Collect losses over training
-                losses = []
-                orig_step = trainer.run.__code__
-
-                # Instead of monkey-patching, just run and check the lcurve
                 trainer.run()
 
                 # Read lcurve to verify training ran
@@ -163,6 +151,21 @@ def test_training_loop(self) -> None:
         finally:
             shutil.rmtree(tmpdir, ignore_errors=True)
 
+    def test_training_loop(self) -> None:
+        """Run a few training steps and verify outputs."""
+        config = _make_config(self.data_dir, numb_steps=5)
+        config = update_deepmd_input(config, warning=False)
+        config = normalize(config)
+        self._run_training(config)
+
+    def test_training_loop_compiled(self) -> None:
+        """Run a few training steps with torch.compile enabled."""
+        config = _make_config(self.data_dir, numb_steps=5)
+        config["training"]["enable_compile"] = True
+        config = update_deepmd_input(config, warning=False)
+        config = normalize(config)
+        self._run_training(config)
+
 
 class TestGetData(unittest.TestCase):
     """Test the batch data conversion in Trainer.get_data."""

From d6cecc2e6d063db31f45594aac6b5ee954a4c79c Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Thu, 26 Feb 2026 18:59:20 +0800
Subject: [PATCH 45/63] padding nall so the model is compiled with mode `real`.
  fix bug in env mat.

---
 deepmd/dpmodel/utils/env_mat.py       |   8 +-
 deepmd/pt_expt/train/training.py      | 466 +++++++++++++++++---------
 source/tests/pt_expt/test_training.py |  68 ++++
 3 files changed, 384 insertions(+), 158 deletions(-)

diff --git a/deepmd/dpmodel/utils/env_mat.py b/deepmd/dpmodel/utils/env_mat.py
index 5af7a9fc3c..b979d6a507 100644
--- a/deepmd/dpmodel/utils/env_mat.py
+++ b/deepmd/dpmodel/utils/env_mat.py
@@ -26,7 +26,10 @@ def compute_smooth_weight(
     if rmin >= rmax:
         raise ValueError("rmin should be less than rmax.")
     xp = array_api_compat.array_namespace(distance)
-    distance = xp.clip(distance, min=rmin, max=rmax)
+    # Use where instead of clip so that make_fx tracing does not
+    # decompose it into boolean-indexed ops with data-dependent sizes.
+    distance = xp.where(distance < rmin, rmin * xp.ones_like(distance), distance)
+    distance = xp.where(distance > rmax, rmax * xp.ones_like(distance), distance)
     uu = (distance - rmin) / (rmax - rmin)
     uu2 = uu * uu
     vv = uu2 * uu * (-6.0 * uu2 + 15.0 * uu - 10.0) + 1.0
@@ -42,7 +45,8 @@ def compute_exp_sw(
     if rmin >= rmax:
         raise ValueError("rmin should be less than rmax.")
     xp = array_api_compat.array_namespace(distance)
-    distance = xp.clip(distance, min=0.0, max=rmax)
+    distance = xp.where(distance < 0.0, xp.zeros_like(distance), distance)
+    distance = xp.where(distance > rmax, rmax * xp.ones_like(distance), distance)
     C = 20
     a = C / rmin
     b = rmin
diff --git a/deepmd/pt_expt/train/training.py b/deepmd/pt_expt/train/training.py
index 22f3db59e6..4c3e902917 100644
--- a/deepmd/pt_expt/train/training.py
+++ b/deepmd/pt_expt/train/training.py
@@ -103,6 +103,221 @@ def get_additional_data_requirement(_model: Any) -> list[DataRequirementItem]:
     return additional_data_requirement
 
 
+# ---------------------------------------------------------------------------
+# torch.compile helpers
+# ---------------------------------------------------------------------------
+
+
+def _trace_and_compile(
+    model: torch.nn.Module,
+    ext_coord: torch.Tensor,
+    ext_atype: torch.Tensor,
+    nlist: torch.Tensor,
+    mapping: torch.Tensor,
+    fparam: torch.Tensor | None,
+    aparam: torch.Tensor | None,
+    compile_opts: dict[str, Any],
+) -> torch.nn.Module:
+    """Trace ``forward_lower`` with ``make_fx`` and compile with ``torch.compile``.
+
+    Parameters
+    ----------
+    model : torch.nn.Module
+        The (uncompiled) model.  Temporarily set to eval mode for tracing.
+    ext_coord, ext_atype, nlist, mapping, fparam, aparam
+        Sample tensors (already padded to the desired max_nall).
+    compile_opts : dict
+        Options forwarded to ``torch.compile`` (excluding ``dynamic``).
+
+    Returns
+    -------
+    torch.nn.Module
+        The compiled ``forward_lower`` callable.
+    """
+    from torch.fx.experimental.proxy_tensor import (
+        make_fx,
+    )
+
+    was_training = model.training
+    model.eval()
+
+    def fn(
+        extended_coord: torch.Tensor,
+        extended_atype: torch.Tensor,
+        nlist: torch.Tensor,
+        mapping: torch.Tensor | None,
+        fparam: torch.Tensor | None,
+        aparam: torch.Tensor | None,
+    ) -> dict[str, torch.Tensor]:
+        extended_coord = extended_coord.detach().requires_grad_(True)
+        return model.forward_lower(
+            extended_coord,
+            extended_atype,
+            nlist,
+            mapping,
+            fparam=fparam,
+            aparam=aparam,
+        )
+
+    # Use default tracing_mode="real" (concrete shapes) for best
+    # runtime performance.  If data-dependent intermediate shapes
+    # change at runtime, the caller catches the error and retraces.
+    traced_lower = make_fx(fn)(ext_coord, ext_atype, nlist, mapping, fparam, aparam)
+
+    if was_training:
+        model.train()
+
+    compiled_lower = torch.compile(traced_lower, dynamic=False, **compile_opts)
+    return compiled_lower
+
+
+class _CompiledModel(torch.nn.Module):
+    """Coord extension (eager) -> pad nall -> compiled forward_lower.
+
+    If a batch's ``nall`` exceeds the current ``max_nall``, the model is
+    automatically re-traced and recompiled with a larger pad size.
+    """
+
+    def __init__(
+        self,
+        original_model: torch.nn.Module,
+        compiled_forward_lower: torch.nn.Module,
+        max_nall: int,
+        compile_opts: dict[str, Any],
+    ) -> None:
+        super().__init__()
+        self.original_model = original_model
+        self.compiled_forward_lower = compiled_forward_lower
+        self._max_nall = max_nall
+        self._compile_opts = compile_opts
+
+    def _recompile(
+        self,
+        ext_coord: torch.Tensor,
+        ext_atype: torch.Tensor,
+        nlist: torch.Tensor,
+        mapping: torch.Tensor,
+        fparam: torch.Tensor | None,
+        aparam: torch.Tensor | None,
+        new_max_nall: int,
+    ) -> None:
+        """Re-trace and recompile for the given inputs.
+
+        If *new_max_nall* differs from the current ``_max_nall``, the
+        inputs are padded (or already padded by the caller).
+        """
+        # Pad if the caller provides unpadded tensors (nall growth case)
+        actual_nall = ext_coord.shape[1]
+        pad_n = new_max_nall - actual_nall
+        if pad_n > 0:
+            ext_coord = torch.nn.functional.pad(ext_coord, (0, 0, 0, pad_n))
+            ext_atype = torch.nn.functional.pad(ext_atype, (0, pad_n))
+            mapping = torch.nn.functional.pad(mapping, (0, pad_n))
+
+        ext_coord = ext_coord.detach()
+
+        self.compiled_forward_lower = _trace_and_compile(
+            self.original_model,
+            ext_coord,
+            ext_atype,
+            nlist,
+            mapping,
+            fparam,
+            aparam,
+            self._compile_opts,
+        )
+        self._max_nall = new_max_nall
+        log.info(
+            "Recompiled model with max_nall=%d.",
+            new_max_nall,
+        )
+
+    def forward(
+        self,
+        coord: torch.Tensor,
+        atype: torch.Tensor,
+        box: torch.Tensor | None = None,
+        fparam: torch.Tensor | None = None,
+        aparam: torch.Tensor | None = None,
+        do_atomic_virial: bool = False,
+    ) -> dict[str, torch.Tensor]:
+        from deepmd.dpmodel.utils.nlist import (
+            build_neighbor_list,
+            extend_coord_with_ghosts,
+        )
+        from deepmd.dpmodel.utils.region import (
+            normalize_coord,
+        )
+
+        nframes, nloc = atype.shape[:2]
+        rcut = self.original_model.get_rcut()
+        sel = self.original_model.get_sel()
+
+        # coord extension + nlist (data-dependent, run in eager)
+        coord_3d = coord.detach().reshape(nframes, nloc, 3)
+        box_flat = box.detach().reshape(nframes, 9) if box is not None else None
+
+        if box_flat is not None:
+            coord_norm = normalize_coord(coord_3d, box_flat.reshape(nframes, 3, 3))
+        else:
+            coord_norm = coord_3d
+
+        ext_coord, ext_atype, mapping = extend_coord_with_ghosts(
+            coord_norm, atype, box_flat, rcut
+        )
+        nlist = build_neighbor_list(
+            ext_coord,
+            ext_atype,
+            nloc,
+            rcut,
+            sel,
+            distinguish_types=False,
+        )
+        ext_coord = ext_coord.reshape(nframes, -1, 3)
+
+        # Grow max_nall if needed (retrace + recompile)
+        actual_nall = ext_coord.shape[1]
+        if actual_nall > self._max_nall:
+            new_max_nall = ((int(actual_nall * 1.2) + 7) // 8) * 8
+            log.info(
+                "nall=%d exceeds max_nall=%d; recompiling with max_nall=%d.",
+                actual_nall,
+                self._max_nall,
+                new_max_nall,
+            )
+            self._recompile(
+                ext_coord, ext_atype, nlist, mapping, fparam, aparam, new_max_nall
+            )
+
+        # Pad to max_nall so compiled graph sees a fixed shape
+        pad_n = self._max_nall - actual_nall
+        if pad_n > 0:
+            ext_coord = torch.nn.functional.pad(ext_coord, (0, 0, 0, pad_n))
+            ext_atype = torch.nn.functional.pad(ext_atype, (0, pad_n))
+            mapping = torch.nn.functional.pad(mapping, (0, pad_n))
+        ext_coord = ext_coord.detach().requires_grad_(True)
+
+        result = self.compiled_forward_lower(
+            ext_coord, ext_atype, nlist, mapping, fparam, aparam
+        )
+
+        # Translate forward_lower keys -> forward keys
+        out: dict[str, torch.Tensor] = {}
+        out["atom_energy"] = result["atom_energy"]
+        out["energy"] = result["energy"]
+        if "extended_force" in result:
+            out["force"] = result["extended_force"][:, :nloc, :]
+        if "virial" in result:
+            out["virial"] = result["virial"]
+        if "extended_virial" in result:
+            out["extended_virial"] = result["extended_virial"]
+        if "atom_virial" in result:
+            out["atom_virial"] = result["atom_virial"]
+        if "mask" in result:
+            out["mask"] = result["mask"]
+        return out
+
+
 # ---------------------------------------------------------------------------
 # Trainer
 # ---------------------------------------------------------------------------
@@ -283,11 +498,17 @@ def _compile_model(self, compile_opts: dict[str, Any]) -> None:
         computation) with ``create_graph=True``, which creates a "double
         backward" that ``torch.compile`` cannot handle.
 
-        Solution: use ``forward_lower_exportable`` (``make_fx`` trace) to
-        decompose ``torch.autograd.grad`` into primitive ops.  The coord
-        extension + nlist build (which contain data-dependent control flow)
-        are kept outside the compiled region.  The traced ``forward_lower``
-        module is then compiled by ``torch.compile``.
+        Solution: use ``make_fx`` to trace ``forward_lower``, decomposing
+        ``torch.autograd.grad`` into primitive ops.  The coord extension +
+        nlist build (data-dependent control flow) are kept outside the
+        compiled region.
+
+        To avoid the overhead of symbolic tracing and dynamic shapes, the
+        extended-atom dimension (nall) is padded to a fixed maximum
+        estimated from the training data.  This allows concrete-shape
+        tracing and ``dynamic=False``.  If a batch exceeds the current
+        max_nall at runtime, the model is automatically re-traced and
+        recompiled with a larger pad size.
         """
         from deepmd.dpmodel.utils.nlist import (
             build_neighbor_list,
@@ -299,36 +520,76 @@ def _compile_model(self, compile_opts: dict[str, Any]) -> None:
 
         model = self.model
 
-        # --- Build sample extended inputs for tracing ---
-        sample_input, _ = self.get_data(is_train=True)
-        coord = sample_input["coord"].detach()
-        atype = sample_input["atype"].detach()
-        box = sample_input.get("box")
-        if box is not None:
-            box = box.detach()
-
-        nframes, nloc = atype.shape[:2]
-        coord_np = coord.cpu().numpy().reshape(nframes, nloc, 3)
-        atype_np = atype.cpu().numpy()
-        box_np = box.cpu().numpy().reshape(nframes, 9) if box is not None else None
+        # --- Estimate max_nall by sampling multiple batches ---
+        n_sample = 20
+        max_nall = 0
+        best_sample: (
+            tuple[np.ndarray, np.ndarray, np.ndarray, np.ndarray, int, dict] | None
+        ) = None
+
+        for _ii in range(n_sample):
+            inp, _ = self.get_data(is_train=True)
+            coord = inp["coord"].detach()
+            atype = inp["atype"].detach()
+            box = inp.get("box")
+            if box is not None:
+                box = box.detach()
+
+            nframes, nloc = atype.shape[:2]
+            coord_np = coord.cpu().numpy().reshape(nframes, nloc, 3)
+            atype_np = atype.cpu().numpy()
+            box_np = box.cpu().numpy().reshape(nframes, 9) if box is not None else None
+
+            if box_np is not None:
+                coord_norm = normalize_coord(coord_np, box_np.reshape(nframes, 3, 3))
+            else:
+                coord_norm = coord_np
 
-        if box_np is not None:
-            coord_norm = normalize_coord(coord_np, box_np.reshape(nframes, 3, 3))
-        else:
-            coord_norm = coord_np
+            ext_coord_np, ext_atype_np, mapping_np = extend_coord_with_ghosts(
+                coord_norm, atype_np, box_np, model.get_rcut()
+            )
+            nlist_np = build_neighbor_list(
+                ext_coord_np,
+                ext_atype_np,
+                nloc,
+                model.get_rcut(),
+                model.get_sel(),
+                distinguish_types=False,
+            )
+            ext_coord_np = ext_coord_np.reshape(nframes, -1, 3)
+            nall = ext_coord_np.shape[1]
+            if nall > max_nall:
+                max_nall = nall
+                best_sample = (
+                    ext_coord_np,
+                    ext_atype_np,
+                    mapping_np,
+                    nlist_np,
+                    nloc,
+                    inp,
+                )
 
-        ext_coord_np, ext_atype_np, mapping_np = extend_coord_with_ghosts(
-            coord_norm, atype_np, box_np, model.get_rcut()
+        # Add 20 % margin and round up to a multiple of 8.
+        max_nall = ((int(max_nall * 1.2) + 7) // 8) * 8
+        log.info(
+            "Estimated max_nall=%d for compiled model (sampled %d batches).",
+            max_nall,
+            n_sample,
         )
-        nlist_np = build_neighbor_list(
-            ext_coord_np,
-            ext_atype_np,
-            nloc,
-            model.get_rcut(),
-            model.get_sel(),
-            distinguish_types=False,
+
+        # --- Pad the largest sample to max_nall and trace ---
+        assert best_sample is not None
+        ext_coord_np, ext_atype_np, mapping_np, nlist_np, nloc, sample_input = (
+            best_sample
         )
-        ext_coord_np = ext_coord_np.reshape(nframes, -1, 3)
+        nframes = ext_coord_np.shape[0]
+        actual_nall = ext_coord_np.shape[1]
+        pad_n = max_nall - actual_nall
+
+        if pad_n > 0:
+            ext_coord_np = np.pad(ext_coord_np, ((0, 0), (0, pad_n), (0, 0)))
+            ext_atype_np = np.pad(ext_atype_np, ((0, 0), (0, pad_n)))
+            mapping_np = np.pad(mapping_np, ((0, 0), (0, pad_n)))
 
         ext_coord = torch.tensor(
             ext_coord_np, dtype=GLOBAL_PT_FLOAT_PRECISION, device=DEVICE
@@ -339,133 +600,26 @@ def _compile_model(self, compile_opts: dict[str, Any]) -> None:
         fparam = sample_input.get("fparam")
         aparam = sample_input.get("aparam")
 
-        # --- Trace forward_lower with make_fx ---
-        # Tracing must happen in eval mode (create_graph=False) to avoid
-        # double-backward complexity that make_fx cannot handle.
-        # The traced module still produces correct force *values*; we just
-        # don't need create_graph=True because torch.compile handles the
-        # backward pass through the traced primitive ops.
-        #
-        # Use tracing_mode="symbolic" so that nall (number of extended
-        # atoms) is treated as a dynamic dimension — different batches may
-        # have different numbers of ghost atoms.
-        from torch.fx.experimental.proxy_tensor import (
-            make_fx,
+        compile_opts.pop("dynamic", None)  # always False for padded approach
+
+        compiled_lower = _trace_and_compile(
+            model,
+            ext_coord,
+            ext_atype,
+            nlist_t,
+            mapping_t,
+            fparam,
+            aparam,
+            compile_opts,
         )
 
-        model.eval()
-
-        def fn(
-            extended_coord: torch.Tensor,
-            extended_atype: torch.Tensor,
-            nlist: torch.Tensor,
-            mapping: torch.Tensor | None,
-            fparam: torch.Tensor | None,
-            aparam: torch.Tensor | None,
-        ) -> dict[str, torch.Tensor]:
-            extended_coord = extended_coord.detach().requires_grad_(True)
-            return model.forward_lower(
-                extended_coord,
-                extended_atype,
-                nlist,
-                mapping,
-                fparam=fparam,
-                aparam=aparam,
-            )
-
-        traced_lower = make_fx(
-            fn,
-            tracing_mode="symbolic",
-            _allow_non_fake_inputs=True,
-        )(ext_coord, ext_atype, nlist_t, mapping_t, fparam, aparam)
-        model.train()
-
-        # --- Compile the traced module ---
-        # nall (number of extended atoms) varies per batch, so enable
-        # dynamic shapes to avoid recompilation on every shape change.
-        compile_opts.setdefault("dynamic", True)
-        compiled_lower = torch.compile(traced_lower, **compile_opts)
-
-        # --- Build a wrapper that does coord-extension then compiled lower ---
-        class _CompiledModel(torch.nn.Module):
-            """Thin wrapper: coord extension (untraced) → compiled forward_lower."""
-
-            def __init__(
-                self,
-                original_model: torch.nn.Module,
-                compiled_forward_lower: torch.nn.Module,
-            ) -> None:
-                super().__init__()
-                self.original_model = original_model
-                self.compiled_forward_lower = compiled_forward_lower
-
-            def forward(
-                self,
-                coord: torch.Tensor,
-                atype: torch.Tensor,
-                box: torch.Tensor | None = None,
-                fparam: torch.Tensor | None = None,
-                aparam: torch.Tensor | None = None,
-                do_atomic_virial: bool = False,
-            ) -> dict[str, torch.Tensor]:
-                nframes, nloc = atype.shape[:2]
-                rcut = self.original_model.get_rcut()
-                sel = self.original_model.get_sel()
-
-                # coord extension + nlist (data-dependent, run in eager on device)
-                coord_3d = coord.detach().reshape(nframes, nloc, 3)
-                box_flat = box.detach().reshape(nframes, 9) if box is not None else None
-
-                if box_flat is not None:
-                    coord_norm = normalize_coord(
-                        coord_3d, box_flat.reshape(nframes, 3, 3)
-                    )
-                else:
-                    coord_norm = coord_3d
-
-                ext_coord, ext_atype, mapping = extend_coord_with_ghosts(
-                    coord_norm, atype, box_flat, rcut
-                )
-                nlist = build_neighbor_list(
-                    ext_coord,
-                    ext_atype,
-                    nloc,
-                    rcut,
-                    sel,
-                    distinguish_types=False,
-                )
-                ext_coord = ext_coord.reshape(nframes, -1, 3)
-                ext_coord = ext_coord.detach().requires_grad_(True)
-
-                # compiled forward_lower (autograd decomposed, no double backward)
-                result = self.compiled_forward_lower(
-                    ext_coord,
-                    ext_atype,
-                    nlist,
-                    mapping,
-                    fparam,
-                    aparam,
-                )
-
-                # Translate forward_lower keys → forward keys
-                out: dict[str, torch.Tensor] = {}
-                out["atom_energy"] = result["atom_energy"]
-                out["energy"] = result["energy"]
-                if "extended_force" in result:
-                    # extract local atoms only: [nf, nall, 3] → [nf, nloc, 3]
-                    out["force"] = result["extended_force"][:, :nloc, :]
-                if "virial" in result:
-                    out["virial"] = result["virial"]
-                if "extended_virial" in result:
-                    out["extended_virial"] = result["extended_virial"]
-                if "atom_virial" in result:
-                    out["atom_virial"] = result["atom_virial"]
-                if "mask" in result:
-                    out["mask"] = result["mask"]
-                return out
-
-        self.wrapper.model = _CompiledModel(model, compiled_lower)
-        log.info("Model traced with make_fx and compiled with torch.compile.")
+        self.wrapper.model = _CompiledModel(
+            model, compiled_lower, max_nall, compile_opts
+        )
+        log.info(
+            "Model compiled with padded nall=%d (tracing_mode=real, dynamic=False).",
+            max_nall,
+        )
 
     # ------------------------------------------------------------------
     # Data helpers
diff --git a/source/tests/pt_expt/test_training.py b/source/tests/pt_expt/test_training.py
index 8b3198bf96..dd9cdda5b0 100644
--- a/source/tests/pt_expt/test_training.py
+++ b/source/tests/pt_expt/test_training.py
@@ -167,6 +167,74 @@ def test_training_loop_compiled(self) -> None:
         self._run_training(config)
 
 
+class TestCompiledRecompile(unittest.TestCase):
+    """Test that _CompiledModel recompiles when nall exceeds max_nall."""
+
+    @classmethod
+    def setUpClass(cls) -> None:
+        data_dir = os.path.join(EXAMPLE_DIR, "data")
+        if not os.path.isdir(data_dir):
+            raise unittest.SkipTest(f"Example data not found: {data_dir}")
+        cls.data_dir = data_dir
+
+    def test_nall_growth_triggers_recompile(self) -> None:
+        """Shrink max_nall to force a recompile, then verify training works."""
+        from deepmd.pt_expt.train.training import (
+            _CompiledModel,
+        )
+
+        config = _make_config(self.data_dir, numb_steps=5)
+        config["training"]["enable_compile"] = True
+        config = update_deepmd_input(config, warning=False)
+        config = normalize(config)
+
+        tmpdir = tempfile.mkdtemp(prefix="pt_expt_recompile_")
+        try:
+            old_cwd = os.getcwd()
+            os.chdir(tmpdir)
+            try:
+                trainer = get_trainer(config)
+
+                # The wrapper.model should be a _CompiledModel
+                compiled_model = trainer.wrapper.model
+                self.assertIsInstance(compiled_model, _CompiledModel)
+
+                original_max_nall = compiled_model._max_nall
+                self.assertGreater(original_max_nall, 0)
+
+                # Artificially shrink max_nall to 1 so the next batch
+                # will certainly exceed it and trigger recompilation.
+                compiled_model._max_nall = 1
+                old_compiled_lower = compiled_model.compiled_forward_lower
+
+                # Run one training step — should trigger recompile
+                trainer.wrapper.train()
+                trainer.optimizer.zero_grad(set_to_none=True)
+                inp, lab = trainer.get_data(is_train=True)
+                lr = trainer.scheduler.get_last_lr()[0]
+                _, loss, more_loss = trainer.wrapper(**inp, cur_lr=lr, label=lab)
+                loss.backward()
+                trainer.optimizer.step()
+
+                # max_nall should have grown beyond 1
+                new_max_nall = compiled_model._max_nall
+                self.assertGreater(new_max_nall, 1)
+
+                # compiled_forward_lower should be a new object
+                self.assertIsNot(
+                    compiled_model.compiled_forward_lower,
+                    old_compiled_lower,
+                )
+
+                # Loss should be a finite scalar
+                self.assertFalse(torch.isnan(loss))
+                self.assertFalse(torch.isinf(loss))
+            finally:
+                os.chdir(old_cwd)
+        finally:
+            shutil.rmtree(tmpdir, ignore_errors=True)
+
+
 class TestGetData(unittest.TestCase):
     """Test the batch data conversion in Trainer.get_data."""
 

From 4e8003a3e140f5146ecb905ad38c2e379aee2f98 Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Thu, 26 Feb 2026 23:32:47 +0800
Subject: [PATCH 46/63] more robust stat

---
 deepmd/dpmodel/utils/env_mat_stat.py | 7 ++++---
 deepmd/pt_expt/utils/stat.py         | 7 +------
 2 files changed, 5 insertions(+), 9 deletions(-)

diff --git a/deepmd/dpmodel/utils/env_mat_stat.py b/deepmd/dpmodel/utils/env_mat_stat.py
index 37a69ea1b1..7f49a5310e 100644
--- a/deepmd/dpmodel/utils/env_mat_stat.py
+++ b/deepmd/dpmodel/utils/env_mat_stat.py
@@ -134,6 +134,7 @@ def iter(
                 system["box"],
                 system["natoms"],
             )
+            nframes, nloc = atype.shape[:2]
             (
                 extended_coord,
                 extended_atype,
@@ -170,12 +171,12 @@ def iter(
             env_mat = xp.reshape(
                 env_mat,
                 (
-                    coord.shape[0] * coord.shape[1],
+                    nframes * nloc,
                     self.descriptor.get_nsel(),
                     self.last_dim,
                 ),
             )
-            atype = xp.reshape(atype, (coord.shape[0] * coord.shape[1],))
+            atype = xp.reshape(atype, (nframes * nloc,))
             # (1, nloc) eq (ntypes, 1), so broadcast is possible
             # shape: (ntypes, nloc)
             type_idx = xp.equal(
@@ -200,7 +201,7 @@ def iter(
                 # shape: (1, nloc, nnei)
                 exclude_mask = xp.reshape(
                     pair_exclude_mask.build_type_exclude_mask(nlist, extended_atype),
-                    (1, coord.shape[0] * coord.shape[1], -1),
+                    (1, nframes * nloc, -1),
                 )
                 # shape: (ntypes, nloc, nnei)
                 type_idx = xp.logical_and(type_idx[..., None], exclude_mask)
diff --git a/deepmd/pt_expt/utils/stat.py b/deepmd/pt_expt/utils/stat.py
index 50044f8028..045c8f7ce5 100644
--- a/deepmd/pt_expt/utils/stat.py
+++ b/deepmd/pt_expt/utils/stat.py
@@ -66,15 +66,10 @@ def make_stat_input(
         if "type" in merged and "atype" not in merged:
             merged["atype"] = merged.pop("type")
 
-        # Reshape coord from [nf, natoms*3] → [nf, natoms, 3]
-        if "atype" in merged and "coord" in merged:
-            natoms = merged["atype"].shape[-1]
-            merged["coord"] = merged["coord"].reshape(-1, natoms, 3)
-
         # Provide "natoms" from "natoms_vec" (expected by stat system).
         # natoms_vec from get_batch() is 1D [2+ntypes], but
         # compute_output_stats expects 2D [nframes, 2+ntypes].
-        if "natoms_vec" in merged and "natoms" not in merged:
+        if "natoms_vec" in merged:
             nv = merged["natoms_vec"]
             if nv.ndim == 1:
                 nframes = merged["coord"].shape[0]

From 04ed4cba2e476ccd3958877fe5a2732ac6b6aac3 Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Fri, 27 Feb 2026 10:14:21 +0800
Subject: [PATCH 47/63] refactor: unify make_stat_input and validate
 fparam/aparam in stat

  - Move pt_expt's make_stat_input into deepmd/utils/model_stat.py as a
    backend-agnostic function (numpy-based). pt_expt re-exports it.
  - Rename old make_stat_input to collect_batches (used by TF backend).
  - Make EnvMatStatSe robust to coord shape conventions by deriving
    nframes/nloc from atype.shape instead of coord.shape.
  - In _make_wrapped_sampler, fill default fparam for systems with
    find_fparam==0 and set find_fparam to 1.0.
  - In compute_input_stats, validate that find_fparam/find_aparam is
    present and 1.0 when numb_fparam/numb_aparam > 0.
  - Add consistency tests comparing universal and pt make_stat_input
    for normal, mixed-type, fparam/aparam, and spin data.
---
 .../dpmodel/atomic_model/base_atomic_model.py |  21 +-
 deepmd/dpmodel/fitting/general_fitting.py     |  22 ++
 deepmd/pt_expt/utils/stat.py                  |  80 +---
 deepmd/tf/model/model_stat.py                 |   4 +-
 deepmd/utils/model_stat.py                    |  77 +++-
 .../tests/consistent/test_make_stat_input.py  | 370 ++++++++++++++++++
 6 files changed, 483 insertions(+), 91 deletions(-)
 create mode 100644 source/tests/consistent/test_make_stat_input.py

diff --git a/deepmd/dpmodel/atomic_model/base_atomic_model.py b/deepmd/dpmodel/atomic_model/base_atomic_model.py
index ecfd08b61a..99d8a2dc99 100644
--- a/deepmd/dpmodel/atomic_model/base_atomic_model.py
+++ b/deepmd/dpmodel/atomic_model/base_atomic_model.py
@@ -332,19 +332,22 @@ def wrapped_sampler() -> list[dict]:
                 atom_exclude_types = self.atom_excl.get_exclude_types()
                 for sample in sampled:
                     sample["atom_exclude_types"] = list(atom_exclude_types)
-            if (
-                "find_fparam" not in sampled[0]
-                and "fparam" not in sampled[0]
-                and self.has_default_fparam()
-            ):
+            # For systems where fparam is missing (find_fparam == 0),
+            # fill with default fparam if available and mark as found.
+            if self.has_default_fparam():
                 default_fparam = self.get_default_fparam()
                 if default_fparam is not None:
                     default_fparam_np = np.array(default_fparam)
                     for sample in sampled:
-                        nframe = sample["atype"].shape[0]
-                        sample["fparam"] = np.tile(
-                            default_fparam_np.reshape(1, -1), (nframe, 1)
-                        )
+                        if (
+                            "find_fparam" in sample
+                            and float(sample["find_fparam"]) == 0.0
+                        ):
+                            nframe = sample["atype"].shape[0]
+                            sample["fparam"] = np.tile(
+                                default_fparam_np.reshape(1, -1), (nframe, 1)
+                            )
+                            sample["find_fparam"] = np.float32(1.0)
             return sampled
 
         return wrapped_sampler
diff --git a/deepmd/dpmodel/fitting/general_fitting.py b/deepmd/dpmodel/fitting/general_fitting.py
index c7372f05ac..f1ac86dde8 100644
--- a/deepmd/dpmodel/fitting/general_fitting.py
+++ b/deepmd/dpmodel/fitting/general_fitting.py
@@ -266,6 +266,17 @@ def compute_input_stats(
                 )
             else:
                 sampled = merged() if callable(merged) else merged
+                for ii, frame in enumerate(sampled):
+                    if "find_fparam" not in frame:
+                        raise ValueError(
+                            f"numb_fparam > 0 but fparam is not acquired "
+                            f"for system {ii}."
+                        )
+                    if float(frame["find_fparam"]) != 1.0:
+                        raise ValueError(
+                            f"numb_fparam > 0 but no fparam data is provided "
+                            f"for system {ii}."
+                        )
                 cat_data = np.concatenate(
                     [frame["fparam"] for frame in sampled], axis=0
                 )
@@ -313,6 +324,17 @@ def compute_input_stats(
                 )
             else:
                 sampled = merged() if callable(merged) else merged
+                for ii, frame in enumerate(sampled):
+                    if "find_aparam" not in frame:
+                        raise ValueError(
+                            f"numb_aparam > 0 but aparam is not acquired "
+                            f"for system {ii}."
+                        )
+                    if float(frame["find_aparam"]) != 1.0:
+                        raise ValueError(
+                            f"numb_aparam > 0 but no aparam data is provided "
+                            f"for system {ii}."
+                        )
                 sys_sumv = []
                 sys_sumv2 = []
                 sys_sumn = []
diff --git a/deepmd/pt_expt/utils/stat.py b/deepmd/pt_expt/utils/stat.py
index 045c8f7ce5..0a22ba4404 100644
--- a/deepmd/pt_expt/utils/stat.py
+++ b/deepmd/pt_expt/utils/stat.py
@@ -1,80 +1,6 @@
 # SPDX-License-Identifier: LGPL-3.0-or-later
-import logging
-
-import numpy as np
-
-from deepmd.utils.data_system import (
-    DeepmdDataSystem,
+from deepmd.utils.model_stat import (
+    make_stat_input,
 )
-from deepmd.utils.model_stat import make_stat_input as _make_stat_input_raw
-
-log = logging.getLogger(__name__)
-
-
-def make_stat_input(
-    data: DeepmdDataSystem,
-    nbatches: int,
-) -> list[dict[str, np.ndarray]]:
-    """Pack data for statistics using DeepmdDataSystem.
-
-    Collects *nbatches* batches from each system and concatenates them
-    into a single dict per system.  The returned format matches the
-    ``list[dict[str, np.ndarray]]`` expected by
-    ``compute_or_load_stat``.
-
-    Parameters
-    ----------
-    data : DeepmdDataSystem
-        The multi-system data manager.
-    nbatches : int
-        Number of batches to collect per system.
-
-    Returns
-    -------
-    list[dict[str, np.ndarray]]
-        Per-system dicts with concatenated numpy arrays.
-    """
-    # Reuse the shared helper with merge_sys=False so that data is
-    # grouped by system:  all_stat[key][sys_idx] = [batch0, batch1, ...]
-    all_stat = _make_stat_input_raw(data, nbatches, merge_sys=False)
-
-    nsystems = data.get_nsystems()
-    log.info(f"Packing data for statistics from {nsystems} systems")
-
-    # Transpose dict-of-lists-of-lists → list-of-dicts and concatenate
-    # batches within each system.
-    keys = list(all_stat.keys())
-    lst: list[dict[str, np.ndarray]] = []
-    for ii in range(nsystems):
-        merged: dict[str, np.ndarray] = {}
-        for key in keys:
-            vals = all_stat[key][ii]  # list of batch arrays for this system
-            if isinstance(vals[0], np.ndarray):
-                if vals[0].ndim >= 2:
-                    # 2D+ arrays (e.g. coord [nf, natoms*3]) — concat along axis 0
-                    merged[key] = np.concatenate(vals, axis=0)
-                else:
-                    # 1D arrays (e.g. natoms_vec [2+ntypes]) — per-system
-                    # constant, just keep one copy
-                    merged[key] = vals[0]
-            else:
-                # scalar flags like find_*
-                merged[key] = vals[0]
-
-        # DeepmdDataSystem.get_batch() uses "type" but the stat system
-        # (env_mat_stat, compute_output_stats, etc.) expects "atype".
-        if "type" in merged and "atype" not in merged:
-            merged["atype"] = merged.pop("type")
-
-        # Provide "natoms" from "natoms_vec" (expected by stat system).
-        # natoms_vec from get_batch() is 1D [2+ntypes], but
-        # compute_output_stats expects 2D [nframes, 2+ntypes].
-        if "natoms_vec" in merged:
-            nv = merged["natoms_vec"]
-            if nv.ndim == 1:
-                nframes = merged["coord"].shape[0]
-                nv = np.tile(nv, (nframes, 1))
-            merged["natoms"] = nv
 
-        lst.append(merged)
-    return lst
+__all__ = ["make_stat_input"]
diff --git a/deepmd/tf/model/model_stat.py b/deepmd/tf/model/model_stat.py
index 96c8b4a4af..1b0e8ab3a1 100644
--- a/deepmd/tf/model/model_stat.py
+++ b/deepmd/tf/model/model_stat.py
@@ -3,7 +3,9 @@
 
 from deepmd.utils.model_stat import (
     _make_all_stat_ref,
-    make_stat_input,
+)
+from deepmd.utils.model_stat import collect_batches as make_stat_input
+from deepmd.utils.model_stat import (
     merge_sys_stat,
 )
 
diff --git a/deepmd/utils/model_stat.py b/deepmd/utils/model_stat.py
index 8061c7aa9c..539681bdf4 100644
--- a/deepmd/utils/model_stat.py
+++ b/deepmd/utils/model_stat.py
@@ -1,4 +1,5 @@
 # SPDX-License-Identifier: LGPL-3.0-or-later
+import logging
 from collections import (
     defaultdict,
 )
@@ -8,6 +9,8 @@
 
 import numpy as np
 
+log = logging.getLogger(__name__)
+
 
 def _make_all_stat_ref(data: Any, nbatches: int) -> dict[str, list[Any]]:
     all_stat = defaultdict(list)
@@ -21,17 +24,20 @@ def _make_all_stat_ref(data: Any, nbatches: int) -> dict[str, list[Any]]:
     return all_stat
 
 
-def make_stat_input(
+def collect_batches(
     data: Any, nbatches: int, merge_sys: bool = True
 ) -> dict[str, list[Any]]:
-    """Pack data for statistics.
+    """Collect batches from a DeepmdDataSystem into a dict of lists.
+
+    This is a low-level helper used by the TF backend and by
+    :func:`make_stat_input`.
 
     Parameters
     ----------
     data
-        The data
+        The data (must support ``get_nsystems()`` and ``get_batch(sys_idx=)``)
     nbatches : int
-        The number of batches
+        The number of batches per system
     merge_sys : bool (True)
         Merge system data
 
@@ -62,6 +68,69 @@ def make_stat_input(
     return all_stat
 
 
+def make_stat_input(
+    data: Any,
+    nbatches: int,
+) -> list[dict[str, np.ndarray]]:
+    """Pack data for statistics using DeepmdDataSystem.
+
+    Collects *nbatches* batches from each system and concatenates them
+    into a single dict per system.  The returned format
+    (``list[dict[str, np.ndarray]]``) is backend-agnostic and can be
+    consumed by ``compute_or_load_stat`` in dpmodel, pt_expt, and jax.
+
+    Parameters
+    ----------
+    data
+        The multi-system data manager
+        (must support ``get_nsystems()`` and ``get_batch(sys_idx=)``).
+    nbatches : int
+        Number of batches to collect per system.
+
+    Returns
+    -------
+    list[dict[str, np.ndarray]]
+        Per-system dicts with concatenated numpy arrays.
+    """
+    all_stat = collect_batches(data, nbatches, merge_sys=False)
+
+    nsystems = data.get_nsystems()
+    log.info(f"Packing data for statistics from {nsystems} systems")
+
+    keys = list(all_stat.keys())
+    lst: list[dict[str, np.ndarray]] = []
+    for ii in range(nsystems):
+        merged: dict[str, np.ndarray] = {}
+        for key in keys:
+            vals = all_stat[key][ii]  # list of batch arrays for this system
+            if isinstance(vals[0], np.ndarray):
+                if vals[0].ndim >= 2:
+                    merged[key] = np.concatenate(vals, axis=0)
+                else:
+                    # 1D arrays (e.g. natoms_vec) — per-system constant
+                    merged[key] = vals[0]
+            else:
+                # scalar flags like find_*
+                merged[key] = vals[0]
+
+        # DeepmdDataSystem.get_batch() uses "type"; stat consumers expect "atype".
+        if "type" in merged and "atype" not in merged:
+            merged["atype"] = merged.pop("type")
+
+        # Provide "natoms" from "natoms_vec".
+        # natoms_vec from get_batch() is 1D [2+ntypes], but
+        # compute_output_stats expects 2D [nframes, 2+ntypes].
+        if "natoms_vec" in merged:
+            nv = merged["natoms_vec"]
+            if nv.ndim == 1:
+                nframes = merged["coord"].shape[0]
+                nv = np.tile(nv, (nframes, 1))
+            merged["natoms"] = nv
+
+        lst.append(merged)
+    return lst
+
+
 def merge_sys_stat(all_stat: dict[str, list[Any]]) -> dict[str, list[Any]]:
     first_key = next(iter(all_stat.keys()))
     nsys = len(all_stat[first_key])
diff --git a/source/tests/consistent/test_make_stat_input.py b/source/tests/consistent/test_make_stat_input.py
new file mode 100644
index 0000000000..973e209ed9
--- /dev/null
+++ b/source/tests/consistent/test_make_stat_input.py
@@ -0,0 +1,370 @@
+# SPDX-License-Identifier: LGPL-3.0-or-later
+"""Consistency test between universal make_stat_input and pt make_stat_input.
+
+The universal make_stat_input (deepmd.utils.model_stat) uses DeepmdDataSystem
+(numpy-based). The pt make_stat_input (deepmd.pt.utils.stat) uses DpLoaderSet +
+DataLoader (torch-based). This test verifies that both produce equivalent
+per-system stat dicts for the keys consumed by compute_or_load_stat.
+"""
+
+import os
+import unittest
+
+import numpy as np
+
+from deepmd.utils.argcheck import (
+    normalize,
+)
+from deepmd.utils.compat import (
+    update_deepmd_input,
+)
+from deepmd.utils.data import (
+    DataRequirementItem,
+)
+
+from .common import (
+    INSTALLED_PT,
+)
+
+TESTS_DIR = os.path.dirname(os.path.dirname(__file__))
+EXAMPLE_DIR = os.path.join(TESTS_DIR, "..", "..", "examples", "water")
+
+
+def _build_config(
+    systems: list[str],
+    type_map: list[str],
+    *,
+    data_stat_nbatch: int = 2,
+    numb_fparam: int = 0,
+    numb_aparam: int = 0,
+) -> dict:
+    config = {
+        "model": {
+            "type_map": type_map,
+            "descriptor": {
+                "type": "se_e2_a",
+                "sel": [6, 12],
+                "rcut_smth": 0.50,
+                "rcut": 3.00,
+                "neuron": [8, 16],
+                "resnet_dt": False,
+                "axis_neuron": 4,
+                "type_one_side": True,
+                "seed": 1,
+            },
+            "fitting_net": {
+                "neuron": [16, 16],
+                "resnet_dt": True,
+                "seed": 1,
+            },
+            "data_stat_nbatch": data_stat_nbatch,
+        },
+        "learning_rate": {
+            "type": "exp",
+            "decay_steps": 500,
+            "start_lr": 0.001,
+            "stop_lr": 3.51e-8,
+        },
+        "loss": {
+            "type": "ener",
+            "start_pref_e": 0.02,
+            "limit_pref_e": 1,
+            "start_pref_f": 1000,
+            "limit_pref_f": 1,
+            "start_pref_v": 0,
+            "limit_pref_v": 0,
+        },
+        "training": {
+            "training_data": {"systems": systems, "batch_size": 1},
+            "validation_data": {
+                "systems": systems[:1],
+                "batch_size": 1,
+                "numb_btch": 1,
+            },
+            "numb_steps": 1,
+            "seed": 10,
+            "disp_file": "lcurve.out",
+            "disp_freq": 99999,
+            "save_freq": 99999,
+        },
+    }
+    if numb_fparam > 0:
+        config["model"]["fitting_net"]["numb_fparam"] = numb_fparam
+    if numb_aparam > 0:
+        config["model"]["fitting_net"]["numb_aparam"] = numb_aparam
+    config = update_deepmd_input(config, warning=False)
+    config = normalize(config)
+    return config
+
+
+def _get_universal_stat(config: dict, data_requirement: list[DataRequirementItem]):
+    """Get stat using the universal make_stat_input (DeepmdDataSystem)."""
+    from deepmd.utils.data_system import (
+        DeepmdDataSystem,
+    )
+    from deepmd.utils.model_stat import (
+        make_stat_input,
+    )
+
+    model_params = config["model"]
+    training_params = config["training"]
+    systems = training_params["training_data"]["systems"]
+    nbatch = model_params.get("data_stat_nbatch", 10)
+
+    data = DeepmdDataSystem(
+        systems=systems,
+        batch_size=training_params["training_data"]["batch_size"],
+        test_size=1,
+        rcut=model_params["descriptor"]["rcut"],
+        type_map=model_params["type_map"],
+    )
+    for item in data_requirement:
+        data.add(
+            item.key,
+            item.ndof,
+            atomic=item.atomic,
+            must=item.must,
+            high_prec=item.high_prec,
+            type_sel=item.type_sel,
+            repeat=item.repeat,
+            default=item.default,
+            dtype=item.dtype,
+            output_natoms_for_type_sel=item.output_natoms_for_type_sel,
+        )
+
+    return make_stat_input(data, nbatch)
+
+
+def _get_pt_stat(config: dict, data_requirement: list[DataRequirementItem]):
+    """Get stat using the pt make_stat_input (DpLoaderSet + DataLoader)."""
+    from deepmd.pt.utils.dataloader import (
+        DpLoaderSet,
+    )
+    from deepmd.pt.utils.stat import (
+        make_stat_input,
+    )
+
+    model_params = config["model"]
+    training_params = config["training"]
+    systems = training_params["training_data"]["systems"]
+    nbatch = model_params.get("data_stat_nbatch", 10)
+
+    loader = DpLoaderSet(
+        systems,
+        training_params["training_data"]["batch_size"],
+        model_params["type_map"],
+        seed=10,
+    )
+    for item in data_requirement:
+        loader.add_data_requirement([item])
+
+    return make_stat_input(loader.systems, loader.dataloaders, nbatch)
+
+
+def _to_numpy(val):
+    """Convert torch.Tensor or np.ndarray to numpy."""
+    import torch
+
+    if isinstance(val, torch.Tensor):
+        return val.detach().cpu().numpy()
+    return val
+
+
+def _compare_stat(
+    test_case: unittest.TestCase,
+    universal_stat: list[dict],
+    pt_stat: list[dict],
+    check_keys: list[str],
+) -> None:
+    """Compare universal and pt stat outputs for the given keys.
+
+    Verifies structural equivalence: same number of systems, same key
+    presence, matching find_* flags, consistent nframes, and consistent
+    per-frame sizes.
+    """
+    test_case.assertEqual(len(universal_stat), len(pt_stat))
+    for sys_idx in range(len(universal_stat)):
+        for key in check_keys:
+            in_uni = key in universal_stat[sys_idx]
+            in_pt = key in pt_stat[sys_idx]
+            # pt pops fparam/find_fparam when find_fparam==0 but
+            # universal keeps them. Skip when find_* is 0.
+            if in_uni and not in_pt:
+                find_key = f"find_{key}" if not key.startswith("find_") else key
+                find_val = universal_stat[sys_idx].get(find_key, None)
+                if find_val is not None and float(find_val) == 0.0:
+                    continue
+            test_case.assertEqual(
+                in_uni, in_pt, f"system {sys_idx}: key '{key}' presence mismatch"
+            )
+            if not in_uni:
+                continue
+
+            v_uni = _to_numpy(universal_stat[sys_idx][key])
+            v_pt = _to_numpy(pt_stat[sys_idx][key])
+
+            if key.startswith("find_"):
+                test_case.assertEqual(
+                    float(np.ravel(v_uni)[0]),
+                    float(np.ravel(v_pt)[0]),
+                    f"system {sys_idx}, key '{key}': find flag mismatch",
+                )
+                continue
+
+            v_uni = np.asarray(v_uni, dtype=np.float64)
+            v_pt = np.asarray(v_pt, dtype=np.float64)
+
+            nf_uni = v_uni.shape[0] if v_uni.ndim >= 2 else 1
+            nf_pt = v_pt.shape[0] if v_pt.ndim >= 2 else 1
+            test_case.assertEqual(
+                nf_uni,
+                nf_pt,
+                f"system {sys_idx}, key '{key}': nframes mismatch",
+            )
+            # coord shape differs: universal [nf, natoms*3], pt [nf, natoms, 3].
+            # Compare per-frame size.
+            test_case.assertEqual(
+                v_uni.size // max(nf_uni, 1),
+                v_pt.size // max(nf_pt, 1),
+                f"system {sys_idx}, key '{key}': per-frame size mismatch "
+                f"(uni shape {v_uni.shape}, pt shape {v_pt.shape})",
+            )
+
+
+# --- Standard data requirements for energy model ---
+_ENER_DATA_REQ = [
+    DataRequirementItem("energy", 1, atomic=False, must=False, high_prec=True),
+    DataRequirementItem("force", 3, atomic=True, must=False, high_prec=False),
+]
+
+_COMMON_CHECK_KEYS = [
+    "atype",
+    "box",
+    "coord",
+    "energy",
+    "natoms",
+    "find_energy",
+    "find_force",
+]
+
+
+@unittest.skipUnless(INSTALLED_PT, "PyTorch backend not installed")
+class TestMakeStatInputNormal(unittest.TestCase):
+    """Test with normal (non-mixed-type) water data, multiple systems."""
+
+    def test_consistency(self) -> None:
+        data_dir = os.path.join(EXAMPLE_DIR, "data")
+        if not os.path.isdir(data_dir):
+            self.skipTest(f"Example data not found: {data_dir}")
+
+        systems = [
+            os.path.join(data_dir, "data_0"),
+            os.path.join(data_dir, "data_1"),
+        ]
+        config = _build_config(systems, ["O", "H"])
+
+        universal_stat = _get_universal_stat(config, _ENER_DATA_REQ)
+        pt_stat = _get_pt_stat(config, _ENER_DATA_REQ)
+
+        self.assertEqual(len(universal_stat), 2)
+        _compare_stat(self, universal_stat, pt_stat, _COMMON_CHECK_KEYS)
+
+
+@unittest.skipUnless(INSTALLED_PT, "PyTorch backend not installed")
+class TestMakeStatInputMixedType(unittest.TestCase):
+    """Test with mixed-type data."""
+
+    def test_consistency(self) -> None:
+        data_dir = os.path.join(TESTS_DIR, "tf", "finetune", "data_mixed_type")
+        if not os.path.isdir(data_dir):
+            self.skipTest(f"Mixed-type data not found: {data_dir}")
+
+        config = _build_config([data_dir], ["O", "H"])
+
+        universal_stat = _get_universal_stat(config, _ENER_DATA_REQ)
+        pt_stat = _get_pt_stat(config, _ENER_DATA_REQ)
+
+        _compare_stat(
+            self,
+            universal_stat,
+            pt_stat,
+            [*_COMMON_CHECK_KEYS, "real_natoms_vec"],
+        )
+
+        # For mixed-type data, real_natoms_vec is the per-frame version.
+        # Verify it is present in the universal output.
+        for sys_idx in range(len(universal_stat)):
+            self.assertIn(
+                "real_natoms_vec",
+                universal_stat[sys_idx],
+                f"system {sys_idx}: real_natoms_vec should be present "
+                f"for mixed-type data",
+            )
+
+
+@unittest.skipUnless(INSTALLED_PT, "PyTorch backend not installed")
+class TestMakeStatInputFparamAparam(unittest.TestCase):
+    """Test with data containing fparam and aparam, multiple systems."""
+
+    def test_consistency(self) -> None:
+        data_dir = os.path.join(TESTS_DIR, "pt", "model", "water", "data")
+        if not os.path.isdir(data_dir):
+            self.skipTest(f"Water fparam data not found: {data_dir}")
+
+        # data_0 has fparam/aparam, data_1 does not — tests find_fparam=0 case
+        systems = [
+            os.path.join(data_dir, "data_0"),
+            os.path.join(data_dir, "data_1"),
+        ]
+        config = _build_config(systems, ["O", "H"], numb_fparam=2, numb_aparam=1)
+
+        data_requirement = [
+            *_ENER_DATA_REQ,
+            DataRequirementItem("fparam", 2, atomic=False, must=False, high_prec=False),
+            DataRequirementItem("aparam", 1, atomic=True, must=False, high_prec=False),
+        ]
+        universal_stat = _get_universal_stat(config, data_requirement)
+        pt_stat = _get_pt_stat(config, data_requirement)
+
+        self.assertEqual(len(universal_stat), 2)
+        _compare_stat(
+            self,
+            universal_stat,
+            pt_stat,
+            [*_COMMON_CHECK_KEYS, "fparam", "aparam", "find_fparam", "find_aparam"],
+        )
+
+
+@unittest.skipUnless(INSTALLED_PT, "PyTorch backend not installed")
+class TestMakeStatInputSpin(unittest.TestCase):
+    """Test with data containing spin, multiple systems."""
+
+    def test_consistency(self) -> None:
+        data_dir = os.path.join(TESTS_DIR, "pt", "NiO", "data")
+        if not os.path.isdir(data_dir):
+            self.skipTest(f"NiO spin data not found: {data_dir}")
+
+        systems = [
+            os.path.join(data_dir, "data_0"),
+            os.path.join(data_dir, "data_0"),
+        ]
+        config = _build_config(systems, ["Ni", "O"])
+
+        data_requirement = [
+            *_ENER_DATA_REQ,
+            DataRequirementItem("spin", 3, atomic=True, must=True, high_prec=False),
+        ]
+        universal_stat = _get_universal_stat(config, data_requirement)
+        pt_stat = _get_pt_stat(config, data_requirement)
+
+        self.assertEqual(len(universal_stat), 2)
+        _compare_stat(
+            self,
+            universal_stat,
+            pt_stat,
+            [*_COMMON_CHECK_KEYS, "spin", "find_spin"],
+        )
+
+
+if __name__ == "__main__":
+    unittest.main()

From b9cb3583053887007b259a8d73abcfdb37b569d9 Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Fri, 27 Feb 2026 10:20:33 +0800
Subject: [PATCH 48/63] fix bug

---
 deepmd/pt_expt/train/training.py | 13 +++++++++++--
 1 file changed, 11 insertions(+), 2 deletions(-)

diff --git a/deepmd/pt_expt/train/training.py b/deepmd/pt_expt/train/training.py
index 4c3e902917..ce2a1039c0 100644
--- a/deepmd/pt_expt/train/training.py
+++ b/deepmd/pt_expt/train/training.py
@@ -715,6 +715,16 @@ def save_checkpoint(self, step: int) -> None:
     # Training loop
     # ------------------------------------------------------------------
 
+    @torch.compiler.disable
+    def _optimizer_step(self) -> None:
+        """Run optimizer and scheduler step outside torch._dynamo.
+
+        Dynamo intercepts tensor creation inside Adam._init_group,
+        which can trigger CUDA init on CPU-only builds.
+        """
+        self.optimizer.step()
+        self.scheduler.step()
+
     def run(self) -> None:
         fout = open(
             self.disp_file,
@@ -747,8 +757,7 @@ def run(self) -> None:
                     self.wrapper.parameters(), self.gradient_max_norm
                 )
 
-            self.optimizer.step()
-            self.scheduler.step()
+            self._optimizer_step()
 
             if self.timing_in_training:
                 t_end = time.time()

From 35e4edfe25634a91bef2e7c472c753a947a3ee2d Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Fri, 27 Feb 2026 10:36:27 +0800
Subject: [PATCH 49/63] fix

---
 source/tests/pt_expt/test_training.py | 15 ++++++---------
 1 file changed, 6 insertions(+), 9 deletions(-)

diff --git a/source/tests/pt_expt/test_training.py b/source/tests/pt_expt/test_training.py
index dd9cdda5b0..13f700b339 100644
--- a/source/tests/pt_expt/test_training.py
+++ b/source/tests/pt_expt/test_training.py
@@ -15,21 +15,18 @@
 
 import torch
 
-from deepmd.utils.argcheck import (
-    normalize,
-)
-from deepmd.utils.compat import (
-    update_deepmd_input,
-)
-
-torch = torch  # ensure torch is imported before pt_expt
-
 from deepmd.pt_expt.entrypoints.main import (
     get_trainer,
 )
 from deepmd.pt_expt.model import (
     get_model,
 )
+from deepmd.utils.argcheck import (
+    normalize,
+)
+from deepmd.utils.compat import (
+    update_deepmd_input,
+)
 
 EXAMPLE_DIR = os.path.join(
     os.path.dirname(__file__),

From b42e08d894b5a76609118db6bc8ea2f861ff407a Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Fri, 27 Feb 2026 11:53:42 +0800
Subject: [PATCH 50/63] changed find_ to int. refactorizing get_data

---
 .../dpmodel/atomic_model/base_atomic_model.py |  7 +-
 deepmd/dpmodel/fitting/general_fitting.py     |  4 +-
 deepmd/dpmodel/utils/batch.py                 | 86 +++++++++++++++++++
 deepmd/dpmodel/utils/stat.py                  |  6 +-
 deepmd/pt_expt/train/training.py              | 68 +++++----------
 deepmd/utils/model_stat.py                    | 20 ++---
 .../tests/consistent/test_make_stat_input.py  |  7 +-
 7 files changed, 124 insertions(+), 74 deletions(-)
 create mode 100644 deepmd/dpmodel/utils/batch.py

diff --git a/deepmd/dpmodel/atomic_model/base_atomic_model.py b/deepmd/dpmodel/atomic_model/base_atomic_model.py
index 99d8a2dc99..1058dff570 100644
--- a/deepmd/dpmodel/atomic_model/base_atomic_model.py
+++ b/deepmd/dpmodel/atomic_model/base_atomic_model.py
@@ -339,15 +339,12 @@ def wrapped_sampler() -> list[dict]:
                 if default_fparam is not None:
                     default_fparam_np = np.array(default_fparam)
                     for sample in sampled:
-                        if (
-                            "find_fparam" in sample
-                            and float(sample["find_fparam"]) == 0.0
-                        ):
+                        if "find_fparam" in sample and not sample["find_fparam"]:
                             nframe = sample["atype"].shape[0]
                             sample["fparam"] = np.tile(
                                 default_fparam_np.reshape(1, -1), (nframe, 1)
                             )
-                            sample["find_fparam"] = np.float32(1.0)
+                            sample["find_fparam"] = np.bool_(True)
             return sampled
 
         return wrapped_sampler
diff --git a/deepmd/dpmodel/fitting/general_fitting.py b/deepmd/dpmodel/fitting/general_fitting.py
index f1ac86dde8..180e5458fb 100644
--- a/deepmd/dpmodel/fitting/general_fitting.py
+++ b/deepmd/dpmodel/fitting/general_fitting.py
@@ -272,7 +272,7 @@ def compute_input_stats(
                             f"numb_fparam > 0 but fparam is not acquired "
                             f"for system {ii}."
                         )
-                    if float(frame["find_fparam"]) != 1.0:
+                    if not frame["find_fparam"]:
                         raise ValueError(
                             f"numb_fparam > 0 but no fparam data is provided "
                             f"for system {ii}."
@@ -330,7 +330,7 @@ def compute_input_stats(
                             f"numb_aparam > 0 but aparam is not acquired "
                             f"for system {ii}."
                         )
-                    if float(frame["find_aparam"]) != 1.0:
+                    if not frame["find_aparam"]:
                         raise ValueError(
                             f"numb_aparam > 0 but no aparam data is provided "
                             f"for system {ii}."
diff --git a/deepmd/dpmodel/utils/batch.py b/deepmd/dpmodel/utils/batch.py
new file mode 100644
index 0000000000..204ae9771f
--- /dev/null
+++ b/deepmd/dpmodel/utils/batch.py
@@ -0,0 +1,86 @@
+# SPDX-License-Identifier: LGPL-3.0-or-later
+"""Normalize raw batches from DeepmdDataSystem into canonical format."""
+
+from typing import (
+    Any,
+)
+
+import numpy as np
+
+# Keys that are metadata / not needed by models or loss functions.
+_DROP_KEYS = {"default_mesh", "sid", "fid"}
+
+# Keys that belong to model input (everything else is label).
+_INPUT_KEYS = {"coord", "atype", "spin", "box", "fparam", "aparam"}
+
+
+def normalize_batch(batch: dict[str, Any]) -> dict[str, Any]:
+    """Normalize a raw batch from :class:`DeepmdDataSystem` to canonical format.
+
+    The following conversions are applied:
+
+    * ``"type"`` is renamed to ``"atype"`` (int64).
+    * ``"natoms_vec"`` (1-D) is tiled to 2-D ``[nframes, 2+ntypes]``
+      and stored as ``"natoms"``.
+    * ``find_*`` flags are converted to ``np.bool_``.
+    * Metadata keys (``default_mesh``, ``sid``, ``fid``) are dropped.
+
+    Parameters
+    ----------
+    batch : dict[str, Any]
+        Raw batch dict returned by ``DeepmdDataSystem.get_batch()``.
+
+    Returns
+    -------
+    dict[str, Any]
+        Normalized batch dict (new dict; the input is not mutated).
+    """
+    out: dict[str, Any] = {}
+
+    for key, val in batch.items():
+        if key in _DROP_KEYS:
+            continue
+
+        if key == "type":
+            out["atype"] = val.astype(np.int64)
+        elif key.startswith("find_"):
+            out[key] = np.bool_(float(val) > 0.5)
+        elif key == "natoms_vec":
+            nv = val
+            if nv.ndim == 1 and "coord" in batch:
+                nframes = batch["coord"].shape[0]
+                nv = np.tile(nv, (nframes, 1))
+            out["natoms"] = nv
+        else:
+            out[key] = val
+
+    return out
+
+
+def split_batch(
+    batch: dict[str, Any],
+) -> tuple[dict[str, Any], dict[str, Any]]:
+    """Split a normalized batch into input and label dicts.
+
+    Parameters
+    ----------
+    batch : dict[str, Any]
+        Normalized batch (output of :func:`normalize_batch`).
+
+    Returns
+    -------
+    input_dict : dict[str, Any]
+        Model inputs (coord, atype, box, fparam, aparam, spin).
+    label_dict : dict[str, Any]
+        Labels and find flags (energy, force, virial, find_*, natoms, …).
+    """
+    input_dict: dict[str, Any] = {}
+    label_dict: dict[str, Any] = {}
+
+    for key, val in batch.items():
+        if key in _INPUT_KEYS:
+            input_dict[key] = val
+        else:
+            label_dict[key] = val
+
+    return input_dict, label_dict
diff --git a/deepmd/dpmodel/utils/stat.py b/deepmd/dpmodel/utils/stat.py
index 34c500d7c8..8cb379380a 100644
--- a/deepmd/dpmodel/utils/stat.py
+++ b/deepmd/dpmodel/utils/stat.py
@@ -244,11 +244,9 @@ def compute_output_stats(
 
         for kk in keys:
             for idx, system in enumerate(sampled):
-                if (("find_atom_" + kk) in system) and (
-                    system["find_atom_" + kk] > 0.0
-                ):
+                if (("find_atom_" + kk) in system) and system["find_atom_" + kk]:
                     atomic_sampled_idx[kk].append(idx)
-                if (("find_" + kk) in system) and (system["find_" + kk] > 0.0):
+                if (("find_" + kk) in system) and system["find_" + kk]:
                     global_sampled_idx[kk].append(idx)
 
         # use index to gather model predictions for the corresponding systems.
diff --git a/deepmd/pt_expt/train/training.py b/deepmd/pt_expt/train/training.py
index ce2a1039c0..1856e5eb29 100644
--- a/deepmd/pt_expt/train/training.py
+++ b/deepmd/pt_expt/train/training.py
@@ -22,6 +22,10 @@
 import numpy as np
 import torch
 
+from deepmd.dpmodel.utils.batch import (
+    normalize_batch,
+    split_batch,
+)
 from deepmd.dpmodel.utils.learning_rate import (
     LearningRateExp,
 )
@@ -639,56 +643,30 @@ def get_data(
         if data_sys is None:
             return {}, {}
 
-        batch = data_sys.get_batch()  # numpy dict
-
-        input_keys = {"coord", "box", "fparam", "aparam"}
-        input_dict: dict[str, Any] = {}
-        label_dict: dict[str, Any] = {}
-
-        natoms = batch["type"].shape[-1]
+        batch = normalize_batch(data_sys.get_batch())
+        input_dict, label_dict = split_batch(batch)
 
-        for key, val in batch.items():
-            if key == "type":
-                # rename to atype; convert to int64 tensor
-                input_dict["atype"] = torch.from_numpy(val.astype(np.int64)).to(DEVICE)
-            elif key == "coord":
-                # reshape from [nf, natoms*3] → [nf, natoms, 3]
-                t = torch.from_numpy(val.copy()).to(
+        # Convert numpy arrays to torch tensors.
+        for key, val in input_dict.items():
+            if val is None or not isinstance(val, np.ndarray):
+                continue
+            if np.issubdtype(val.dtype, np.integer):
+                input_dict[key] = torch.from_numpy(val).to(DEVICE)
+            else:
+                input_dict[key] = torch.from_numpy(val).to(
                     dtype=GLOBAL_PT_FLOAT_PRECISION, device=DEVICE
                 )
-                # requires_grad needed for force computation via autograd
-                input_dict["coord"] = t.reshape(-1, natoms, 3).requires_grad_(True)
-            elif key == "box":
-                if val is not None:
-                    t = torch.from_numpy(val).to(
-                        dtype=GLOBAL_PT_FLOAT_PRECISION, device=DEVICE
-                    )
-                    input_dict["box"] = t.reshape(-1, 3, 3)
-                else:
-                    input_dict["box"] = None
-            elif key in input_keys:
-                if val is not None and isinstance(val, np.ndarray):
-                    input_dict[key] = torch.from_numpy(val).to(
-                        dtype=GLOBAL_PT_FLOAT_PRECISION, device=DEVICE
-                    )
-            elif key in ("natoms_vec", "default_mesh", "sid", "fid"):
-                continue
-            elif "find_" in key:
-                # find_energy, find_force, … — keep as float scalar
-                label_dict[key] = float(val) if not isinstance(val, float) else val
-            elif key == "force":
-                # [nf, natoms*3] → [nf, natoms, 3]
-                t = torch.from_numpy(val).to(
+        # requires_grad on coord for force computation via autograd
+        if "coord" in input_dict and input_dict["coord"] is not None:
+            input_dict["coord"] = input_dict["coord"].requires_grad_(True)
+
+        for key, val in label_dict.items():
+            if key.startswith("find_"):
+                label_dict[key] = float(val)
+            elif isinstance(val, np.ndarray):
+                label_dict[key] = torch.from_numpy(val).to(
                     dtype=GLOBAL_PT_FLOAT_PRECISION, device=DEVICE
                 )
-                label_dict["force"] = t.reshape(-1, natoms, 3)
-            else:
-                if isinstance(val, np.ndarray):
-                    label_dict[key] = torch.from_numpy(val).to(
-                        dtype=GLOBAL_PT_FLOAT_PRECISION, device=DEVICE
-                    )
-                else:
-                    label_dict[key] = val
 
         return input_dict, label_dict
 
diff --git a/deepmd/utils/model_stat.py b/deepmd/utils/model_stat.py
index 539681bdf4..33ebbcae57 100644
--- a/deepmd/utils/model_stat.py
+++ b/deepmd/utils/model_stat.py
@@ -9,6 +9,10 @@
 
 import numpy as np
 
+from deepmd.dpmodel.utils.batch import (
+    normalize_batch,
+)
+
 log = logging.getLogger(__name__)
 
 
@@ -113,21 +117,7 @@ def make_stat_input(
                 # scalar flags like find_*
                 merged[key] = vals[0]
 
-        # DeepmdDataSystem.get_batch() uses "type"; stat consumers expect "atype".
-        if "type" in merged and "atype" not in merged:
-            merged["atype"] = merged.pop("type")
-
-        # Provide "natoms" from "natoms_vec".
-        # natoms_vec from get_batch() is 1D [2+ntypes], but
-        # compute_output_stats expects 2D [nframes, 2+ntypes].
-        if "natoms_vec" in merged:
-            nv = merged["natoms_vec"]
-            if nv.ndim == 1:
-                nframes = merged["coord"].shape[0]
-                nv = np.tile(nv, (nframes, 1))
-            merged["natoms"] = nv
-
-        lst.append(merged)
+        lst.append(normalize_batch(merged))
     return lst
 
 
diff --git a/source/tests/consistent/test_make_stat_input.py b/source/tests/consistent/test_make_stat_input.py
index 973e209ed9..5a927f5541 100644
--- a/source/tests/consistent/test_make_stat_input.py
+++ b/source/tests/consistent/test_make_stat_input.py
@@ -192,7 +192,7 @@ def _compare_stat(
             if in_uni and not in_pt:
                 find_key = f"find_{key}" if not key.startswith("find_") else key
                 find_val = universal_stat[sys_idx].get(find_key, None)
-                if find_val is not None and float(find_val) == 0.0:
+                if find_val is not None and not find_val:
                     continue
             test_case.assertEqual(
                 in_uni, in_pt, f"system {sys_idx}: key '{key}' presence mismatch"
@@ -204,9 +204,10 @@ def _compare_stat(
             v_pt = _to_numpy(pt_stat[sys_idx][key])
 
             if key.startswith("find_"):
+                # universal returns bool, pt returns float32
                 test_case.assertEqual(
-                    float(np.ravel(v_uni)[0]),
-                    float(np.ravel(v_pt)[0]),
+                    bool(v_uni),
+                    bool(float(np.ravel(v_pt)[0]) > 0.5),
                     f"system {sys_idx}, key '{key}': find flag mismatch",
                 )
                 continue

From 3e8ba6ec47cf2f47ab972ec864e23b01d97e176f Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Fri, 27 Feb 2026 18:08:48 +0800
Subject: [PATCH 51/63] port dpmodel loss to pt_expt and use user-facing model
 output keys

  Replace pt backend loss (deepmd.pt.loss) in pt_expt training with a
  @torch_module wrapper around the dpmodel EnergyLoss. This follows
  the same wrapping pattern used for descriptors and fittings.

  - Update dpmodel/loss/ener.py to read user-facing model output keys
  (energy, force, virial, atom_energy) instead of internal keys
  (energy_redu, energy_derv_r, energy_derv_c_redu, energy).
  - Fix dpmodel/loss/loss.py display_if_exist to pass device= to
  xp.asarray, inferred from the existing loss tensor.
  - Create pt_expt/loss/ener.py with @torch_module wrapper.
  - Update pt_expt/train/wrapper.py to call model first, then pass
  model predictions to the dpmodel loss interface.
  - Simplify pt_expt/train/training.py: use deepmd.pt_expt.loss,
  unify numpy-to-torch conversion for input and label dicts.
  - Add find_fparam/find_aparam flags to fitting stat test data.
  - Add pt_expt loss unit tests (consistency + dpmodel cross-check).
  - Add conftest fixture to clear leaked DeviceContext from make_fx
  (works around PyTorch bug in Adam._init_group where
  torch.tensor(0.0) omits device= on the default path).
---
 deepmd/dpmodel/loss/ener.py                   |   8 +-
 deepmd/dpmodel/loss/loss.py                   |   5 +-
 deepmd/pt_expt/loss/__init__.py               |   8 +
 deepmd/pt_expt/loss/ener.py                   |  10 ++
 deepmd/pt_expt/train/training.py              |  52 +++----
 deepmd/pt_expt/train/wrapper.py               |  12 +-
 source/tests/consistent/loss/test_ener.py     |   8 +-
 source/tests/pt_expt/conftest.py              |  50 +++++-
 .../pt_expt/fitting/test_fitting_stat.py      |   2 +
 source/tests/pt_expt/loss/__init__.py         |   1 +
 source/tests/pt_expt/loss/test_ener.py        | 144 ++++++++++++++++++
 source/tests/pt_expt/test_training.py         |  15 +-
 12 files changed, 261 insertions(+), 54 deletions(-)
 create mode 100644 deepmd/pt_expt/loss/__init__.py
 create mode 100644 deepmd/pt_expt/loss/ener.py
 create mode 100644 source/tests/pt_expt/loss/__init__.py
 create mode 100644 source/tests/pt_expt/loss/test_ener.py

diff --git a/deepmd/dpmodel/loss/ener.py b/deepmd/dpmodel/loss/ener.py
index 3bf9695852..e512072509 100644
--- a/deepmd/dpmodel/loss/ener.py
+++ b/deepmd/dpmodel/loss/ener.py
@@ -95,10 +95,10 @@ def call(
         label_dict: dict[str, Array],
     ) -> dict[str, Array]:
         """Calculate loss from model results and labeled results."""
-        energy = model_dict["energy_redu"]
-        force = model_dict["energy_derv_r"]
-        virial = model_dict["energy_derv_c_redu"]
-        atom_ener = model_dict["energy"]
+        energy = model_dict["energy"]
+        force = model_dict["force"]
+        virial = model_dict["virial"]
+        atom_ener = model_dict["atom_energy"]
         energy_hat = label_dict["energy"]
         force_hat = label_dict["force"]
         virial_hat = label_dict["virial"]
diff --git a/deepmd/dpmodel/loss/loss.py b/deepmd/dpmodel/loss/loss.py
index 6dc468582a..4b9831c344 100644
--- a/deepmd/dpmodel/loss/loss.py
+++ b/deepmd/dpmodel/loss/loss.py
@@ -53,8 +53,11 @@ def display_if_exist(loss: Array, find_property: float) -> Array:
             the loss scalar or NaN
         """
         xp = array_api_compat.array_namespace(loss)
+        dev = array_api_compat.device(loss)
         return xp.where(
-            xp.asarray(find_property, dtype=xp.bool), loss, xp.asarray(xp.nan)
+            xp.asarray(find_property, dtype=xp.bool, device=dev),
+            loss,
+            xp.asarray(xp.nan, device=dev),
         )
 
     @classmethod
diff --git a/deepmd/pt_expt/loss/__init__.py b/deepmd/pt_expt/loss/__init__.py
new file mode 100644
index 0000000000..19f76a0cba
--- /dev/null
+++ b/deepmd/pt_expt/loss/__init__.py
@@ -0,0 +1,8 @@
+# SPDX-License-Identifier: LGPL-3.0-or-later
+from deepmd.pt_expt.loss.ener import (
+    EnergyLoss,
+)
+
+__all__ = [
+    "EnergyLoss",
+]
diff --git a/deepmd/pt_expt/loss/ener.py b/deepmd/pt_expt/loss/ener.py
new file mode 100644
index 0000000000..e5bd220bd0
--- /dev/null
+++ b/deepmd/pt_expt/loss/ener.py
@@ -0,0 +1,10 @@
+# SPDX-License-Identifier: LGPL-3.0-or-later
+from deepmd.dpmodel.loss.ener import EnergyLoss as EnergyLossDP
+from deepmd.pt_expt.common import (
+    torch_module,
+)
+
+
+@torch_module
+class EnergyLoss(EnergyLossDP):
+    pass
diff --git a/deepmd/pt_expt/train/training.py b/deepmd/pt_expt/train/training.py
index 1856e5eb29..50354af79f 100644
--- a/deepmd/pt_expt/train/training.py
+++ b/deepmd/pt_expt/train/training.py
@@ -32,10 +32,8 @@
 from deepmd.loggers.training import (
     format_training_message_per_task,
 )
-from deepmd.pt.loss import (
-    EnergyHessianStdLoss,
-    EnergyStdLoss,
-    TaskLoss,
+from deepmd.pt_expt.loss import (
+    EnergyLoss,
 )
 from deepmd.pt_expt.model import (
     get_model,
@@ -73,17 +71,13 @@ def get_loss(
     start_lr: float,
     _ntypes: int,
     _model: Any,
-) -> TaskLoss:
+) -> EnergyLoss:
     loss_type = loss_params.get("type", "ener")
-    if loss_type == "ener" and loss_params.get("start_pref_h", 0.0) > 0.0:
+    if loss_type == "ener":
         loss_params["starter_learning_rate"] = start_lr
-        return EnergyHessianStdLoss(**loss_params)
-    elif loss_type == "ener":
-        loss_params["starter_learning_rate"] = start_lr
-        return EnergyStdLoss(**loss_params)
+        return EnergyLoss(**loss_params)
     else:
-        loss_params["starter_learning_rate"] = start_lr
-        return TaskLoss.get_class_by_type(loss_type).get_loss(loss_params)
+        raise ValueError(f"Unsupported loss type for pt_expt: {loss_type}")
 
 
 def get_additional_data_requirement(_model: Any) -> list[DataRequirementItem]:
@@ -646,28 +640,26 @@ def get_data(
         batch = normalize_batch(data_sys.get_batch())
         input_dict, label_dict = split_batch(batch)
 
-        # Convert numpy arrays to torch tensors.
-        for key, val in input_dict.items():
-            if val is None or not isinstance(val, np.ndarray):
-                continue
-            if np.issubdtype(val.dtype, np.integer):
-                input_dict[key] = torch.from_numpy(val).to(DEVICE)
-            else:
-                input_dict[key] = torch.from_numpy(val).to(
-                    dtype=GLOBAL_PT_FLOAT_PRECISION, device=DEVICE
-                )
+        # Convert numpy values to torch tensors.
+        for dd in (input_dict, label_dict):
+            for key, val in dd.items():
+                if val is None:
+                    continue
+                if isinstance(val, np.ndarray):
+                    if np.issubdtype(val.dtype, np.integer):
+                        dd[key] = torch.from_numpy(val).to(DEVICE)
+                    else:
+                        dd[key] = torch.from_numpy(val).to(
+                            dtype=GLOBAL_PT_FLOAT_PRECISION, device=DEVICE
+                        )
+                elif isinstance(val, (float, np.bool_)):
+                    dd[key] = torch.tensor(
+                        float(val), dtype=GLOBAL_PT_FLOAT_PRECISION, device=DEVICE
+                    )
         # requires_grad on coord for force computation via autograd
         if "coord" in input_dict and input_dict["coord"] is not None:
             input_dict["coord"] = input_dict["coord"].requires_grad_(True)
 
-        for key, val in label_dict.items():
-            if key.startswith("find_"):
-                label_dict[key] = float(val)
-            elif isinstance(val, np.ndarray):
-                label_dict[key] = torch.from_numpy(val).to(
-                    dtype=GLOBAL_PT_FLOAT_PRECISION, device=DEVICE
-                )
-
         return input_dict, label_dict
 
     # ------------------------------------------------------------------
diff --git a/deepmd/pt_expt/train/wrapper.py b/deepmd/pt_expt/train/wrapper.py
index d646cb79ab..281168cdba 100644
--- a/deepmd/pt_expt/train/wrapper.py
+++ b/deepmd/pt_expt/train/wrapper.py
@@ -60,17 +60,17 @@ def forward(
             "aparam": aparam,
         }
 
+        model_pred = self.model(**input_dict)
+
         if self.inference_only or label is None:
-            model_pred = self.model(**input_dict)
             return model_pred, None, None
         else:
             natoms = atype.shape[-1]
-            model_pred, loss, more_loss = self.loss(
-                input_dict,
-                self.model,
+            loss, more_loss = self.loss(
+                cur_lr,
+                natoms,
+                model_pred,
                 label,
-                natoms=natoms,
-                learning_rate=cur_lr,
             )
             return model_pred, loss, more_loss
 
diff --git a/source/tests/consistent/loss/test_ener.py b/source/tests/consistent/loss/test_ener.py
index 36a8fba44a..b23ab1c01c 100644
--- a/source/tests/consistent/loss/test_ener.py
+++ b/source/tests/consistent/loss/test_ener.py
@@ -111,10 +111,10 @@ def setUp(self) -> None:
             ),
         }
         self.predict_dpmodel_style = {
-            "energy_derv_c_redu": self.predict["virial"],
-            "energy_derv_r": self.predict["force"],
-            "energy_redu": self.predict["energy"],
-            "energy": self.predict["atom_ener"],
+            "energy": self.predict["energy"],
+            "force": self.predict["force"],
+            "virial": self.predict["virial"],
+            "atom_energy": self.predict["atom_ener"],
         }
         self.label = {
             "energy": rng.random((self.nframes,)),
diff --git a/source/tests/pt_expt/conftest.py b/source/tests/pt_expt/conftest.py
index ec025c2202..15791050d6 100644
--- a/source/tests/pt_expt/conftest.py
+++ b/source/tests/pt_expt/conftest.py
@@ -1,4 +1,52 @@
 # SPDX-License-Identifier: LGPL-3.0-or-later
+"""Conftest for pt_expt tests.
+
+Clears any leaked ``torch.utils._device.DeviceContext`` modes that may
+have been left on the torch function mode stack by ``make_fx`` or other
+tracing utilities during test collection.  A stale ``DeviceContext``
+silently reroutes ``torch.tensor(...)`` calls (without an explicit
+``device=``) to a fake CUDA device, causing spurious "no NVIDIA driver"
+errors on CPU-only machines.
+
+The leak is triggered when pytest collects descriptor test modules that
+import ``make_fx``.  A ``DeviceContext(cuda:127)`` ends up on the
+``torch.overrides`` function mode stack and is never popped.
+
+Our own code (``display_if_exist`` in ``deepmd/dpmodel/loss/loss.py``)
+is already fixed to pass ``device=`` explicitly.  However, PyTorch's
+``Adam._init_group`` (``torch/optim/adam.py``) contains::
+
+    torch.tensor(0.0, dtype=_get_scalar_dtype())  # no device=
+
+on the ``capturable=False, fused=False`` path (the default).  This is
+a PyTorch bug — the ``capturable=True`` branch correctly uses
+``device=p.device`` but the default branch omits it.  We cannot fix
+PyTorch internals, so this fixture works around the issue by popping
+leaked ``DeviceContext`` modes before each test.
+"""
+
 import pytest
+import torch.utils._device as _device
+from torch.overrides import (
+    _get_current_function_mode_stack,
+)
+
 
-pytest.importorskip("torch")
+@pytest.fixture(autouse=True)
+def _clear_leaked_device_context():
+    """Pop any stale ``DeviceContext`` before each test, restore after."""
+    popped = []
+    while True:
+        modes = _get_current_function_mode_stack()
+        if not modes:
+            break
+        top = modes[-1]
+        if isinstance(top, _device.DeviceContext):
+            top.__exit__(None, None, None)
+            popped.append(top)
+        else:
+            break
+    yield
+    # Restore in reverse order so the stack is back to its original state.
+    for ctx in reversed(popped):
+        ctx.__enter__()
diff --git a/source/tests/pt_expt/fitting/test_fitting_stat.py b/source/tests/pt_expt/fitting/test_fitting_stat.py
index b473c9309c..dcb99dd324 100644
--- a/source/tests/pt_expt/fitting/test_fitting_stat.py
+++ b/source/tests/pt_expt/fitting/test_fitting_stat.py
@@ -40,6 +40,8 @@ def _make_fake_data_pt(sys_natoms, sys_nframes, avgs, stds):
         # dpmodel's compute_input_stats expects numpy arrays
         sys_dict["fparam"] = tmp_data_f
         sys_dict["aparam"] = tmp_data_a
+        sys_dict["find_fparam"] = True
+        sys_dict["find_aparam"] = True
         merged_output_stat.append(sys_dict)
     return merged_output_stat
 
diff --git a/source/tests/pt_expt/loss/__init__.py b/source/tests/pt_expt/loss/__init__.py
new file mode 100644
index 0000000000..6ceb116d85
--- /dev/null
+++ b/source/tests/pt_expt/loss/__init__.py
@@ -0,0 +1 @@
+# SPDX-License-Identifier: LGPL-3.0-or-later
diff --git a/source/tests/pt_expt/loss/test_ener.py b/source/tests/pt_expt/loss/test_ener.py
new file mode 100644
index 0000000000..37d7d4c703
--- /dev/null
+++ b/source/tests/pt_expt/loss/test_ener.py
@@ -0,0 +1,144 @@
+# SPDX-License-Identifier: LGPL-3.0-or-later
+"""Unit tests for the pt_expt EnergyLoss wrapper.
+
+Three test types:
+- test_consistency — construct -> forward -> serialize/deserialize -> forward -> compare;
+  also compare with dpmodel
+- test_consistency_with_find_flags — same but with find_* flags as torch tensors
+  (mimicking real training where get_data converts them)
+"""
+
+import numpy as np
+import pytest
+import torch
+
+from deepmd.dpmodel.loss.ener import EnergyLoss as EnergyLossDP
+from deepmd.pt_expt.loss.ener import (
+    EnergyLoss,
+)
+from deepmd.pt_expt.utils import (
+    env,
+)
+from deepmd.pt_expt.utils.env import (
+    PRECISION_DICT,
+)
+
+from ...pt.model.test_mlp import (
+    get_tols,
+)
+from ...seed import (
+    GLOBAL_SEED,
+)
+
+
+def _make_data(
+    rng: np.random.Generator,
+    nframes: int,
+    natoms: int,
+    dtype: torch.dtype,
+    device: torch.device,
+) -> tuple[dict[str, torch.Tensor], dict[str, torch.Tensor]]:
+    """Build model prediction and label dicts as torch tensors."""
+    model_pred = {
+        "energy": torch.tensor(rng.random((nframes,)), dtype=dtype, device=device),
+        "force": torch.tensor(
+            rng.random((nframes, natoms, 3)), dtype=dtype, device=device
+        ),
+        "virial": torch.tensor(rng.random((nframes, 9)), dtype=dtype, device=device),
+        "atom_energy": torch.tensor(
+            rng.random((nframes, natoms)), dtype=dtype, device=device
+        ),
+    }
+    label = {
+        "energy": torch.tensor(rng.random((nframes,)), dtype=dtype, device=device),
+        "force": torch.tensor(
+            rng.random((nframes, natoms, 3)), dtype=dtype, device=device
+        ),
+        "virial": torch.tensor(rng.random((nframes, 9)), dtype=dtype, device=device),
+        "atom_ener": torch.tensor(
+            rng.random((nframes, natoms)), dtype=dtype, device=device
+        ),
+        "atom_pref": torch.ones((nframes, natoms, 3), dtype=dtype, device=device),
+        "find_energy": torch.tensor(1.0, dtype=dtype, device=device),
+        "find_force": torch.tensor(1.0, dtype=dtype, device=device),
+        "find_virial": torch.tensor(1.0, dtype=dtype, device=device),
+        "find_atom_ener": torch.tensor(1.0, dtype=dtype, device=device),
+        "find_atom_pref": torch.tensor(1.0, dtype=dtype, device=device),
+    }
+    return model_pred, label
+
+
+class TestEnergyLoss:
+    def setup_method(self) -> None:
+        self.device = env.DEVICE
+
+    @pytest.mark.parametrize("prec", ["float64", "float32"])  # precision
+    @pytest.mark.parametrize("use_huber", [False, True])  # huber loss
+    def test_consistency(self, prec, use_huber) -> None:
+        """Construct -> forward -> serialize/deserialize -> forward -> compare.
+
+        Also compare with dpmodel.
+        """
+        rng = np.random.default_rng(GLOBAL_SEED)
+        nframes, natoms = 2, 6
+        dtype = PRECISION_DICT[prec]
+        rtol, atol = get_tols(prec)
+        learning_rate = 1e-3
+
+        loss0 = EnergyLoss(
+            starter_learning_rate=1e-3,
+            start_pref_e=0.02,
+            limit_pref_e=1.0,
+            start_pref_f=1000.0,
+            limit_pref_f=1.0,
+            start_pref_v=1.0,
+            limit_pref_v=1.0,
+            start_pref_ae=1.0,
+            limit_pref_ae=1.0,
+            start_pref_pf=0.0 if use_huber else 1.0,
+            limit_pref_pf=0.0 if use_huber else 1.0,
+            use_huber=use_huber,
+        ).to(self.device)
+
+        model_pred, label = _make_data(rng, nframes, natoms, dtype, self.device)
+
+        # Forward
+        l0, more0 = loss0(learning_rate, natoms, model_pred, label)
+        assert l0.shape == ()
+        assert "rmse" in more0
+
+        # Serialize / deserialize round-trip
+        loss1 = EnergyLoss.deserialize(loss0.serialize())
+        l1, more1 = loss1(learning_rate, natoms, model_pred, label)
+
+        np.testing.assert_allclose(
+            l0.detach().cpu().numpy(),
+            l1.detach().cpu().numpy(),
+            rtol=rtol,
+            atol=atol,
+        )
+        for key in more0:
+            np.testing.assert_allclose(
+                more0[key].detach().cpu().numpy(),
+                more1[key].detach().cpu().numpy(),
+                rtol=rtol,
+                atol=atol,
+                err_msg=f"key={key}",
+            )
+
+        # Compare with dpmodel (numpy)
+        dp_loss = EnergyLossDP.deserialize(loss0.serialize())
+        model_pred_np = {k: v.detach().cpu().numpy() for k, v in model_pred.items()}
+        label_np = {
+            k: v.detach().cpu().numpy() if isinstance(v, torch.Tensor) else v
+            for k, v in label.items()
+        }
+        l_dp, more_dp = dp_loss(learning_rate, natoms, model_pred_np, label_np)
+
+        np.testing.assert_allclose(
+            l0.detach().cpu().numpy(),
+            np.array(l_dp),
+            rtol=rtol,
+            atol=atol,
+            err_msg="pt_expt vs dpmodel",
+        )
diff --git a/source/tests/pt_expt/test_training.py b/source/tests/pt_expt/test_training.py
index 13f700b339..1943f67915 100644
--- a/source/tests/pt_expt/test_training.py
+++ b/source/tests/pt_expt/test_training.py
@@ -256,17 +256,16 @@ def test_batch_shapes(self) -> None:
                 trainer = get_trainer(config)
                 input_dict, label_dict = trainer.get_data(is_train=True)
 
-                # coord should be [nf, natoms, 3]
-                self.assertEqual(len(input_dict["coord"].shape), 3)
-                self.assertEqual(input_dict["coord"].shape[-1], 3)
+                # coord should be a tensor with requires_grad
+                self.assertIsInstance(input_dict["coord"], torch.Tensor)
+                self.assertTrue(input_dict["coord"].requires_grad)
 
-                # atype should be [nf, natoms]
-                self.assertEqual(len(input_dict["atype"].shape), 2)
+                # atype should be an integer tensor
+                self.assertIsInstance(input_dict["atype"], torch.Tensor)
 
-                # force label should be [nf, natoms, 3]
+                # force label should be a tensor
                 if "force" in label_dict:
-                    self.assertEqual(len(label_dict["force"].shape), 3)
-                    self.assertEqual(label_dict["force"].shape[-1], 3)
+                    self.assertIsInstance(label_dict["force"], torch.Tensor)
 
                 # energy label should exist
                 self.assertIn("energy", label_dict)

From 18b39e32a76de755729489630852bbad747a322f Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Fri, 27 Feb 2026 22:05:28 +0800
Subject: [PATCH 52/63] use full like

---
 deepmd/dpmodel/utils/env_mat.py | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/deepmd/dpmodel/utils/env_mat.py b/deepmd/dpmodel/utils/env_mat.py
index b979d6a507..e9407a435b 100644
--- a/deepmd/dpmodel/utils/env_mat.py
+++ b/deepmd/dpmodel/utils/env_mat.py
@@ -28,8 +28,8 @@ def compute_smooth_weight(
     xp = array_api_compat.array_namespace(distance)
     # Use where instead of clip so that make_fx tracing does not
     # decompose it into boolean-indexed ops with data-dependent sizes.
-    distance = xp.where(distance < rmin, rmin * xp.ones_like(distance), distance)
-    distance = xp.where(distance > rmax, rmax * xp.ones_like(distance), distance)
+    distance = xp.where(distance < rmin, xp.full_like(distance, rmin), distance)
+    distance = xp.where(distance > rmax, xp.full_like(distance, rmax), distance)
     uu = (distance - rmin) / (rmax - rmin)
     uu2 = uu * uu
     vv = uu2 * uu * (-6.0 * uu2 + 15.0 * uu - 10.0) + 1.0
@@ -46,7 +46,7 @@ def compute_exp_sw(
         raise ValueError("rmin should be less than rmax.")
     xp = array_api_compat.array_namespace(distance)
     distance = xp.where(distance < 0.0, xp.zeros_like(distance), distance)
-    distance = xp.where(distance > rmax, rmax * xp.ones_like(distance), distance)
+    distance = xp.where(distance > rmax, xp.full_like(distance, rmax), distance)
     C = 20
     a = C / rmin
     b = rmin

From f4675d12cac56e1e1a1ac12bfd16158138c7901a Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Fri, 27 Feb 2026 22:11:04 +0800
Subject: [PATCH 53/63] fix bugs in ut

---
 source/tests/consistent/fitting/test_ener.py | 12 ++++++++++++
 1 file changed, 12 insertions(+)

diff --git a/source/tests/consistent/fitting/test_ener.py b/source/tests/consistent/fitting/test_ener.py
index 185a3d5801..ba0f68c163 100644
--- a/source/tests/consistent/fitting/test_ener.py
+++ b/source/tests/consistent/fitting/test_ener.py
@@ -523,6 +523,8 @@ def setUp(self) -> None:
                 "aparam": rng.normal(size=(2, 6, numb_aparam)).astype(
                     GLOBAL_NP_FLOAT_PRECISION
                 ),
+                "find_fparam": True,
+                "find_aparam": True,
             },
             {
                 "fparam": rng.normal(size=(3, numb_fparam)).astype(
@@ -531,6 +533,8 @@ def setUp(self) -> None:
                 "aparam": rng.normal(size=(3, 6, numb_aparam)).astype(
                     GLOBAL_NP_FLOAT_PRECISION
                 ),
+                "find_fparam": True,
+                "find_aparam": True,
             },
         ]
 
@@ -583,6 +587,8 @@ def eval_pt(self, pt_obj: Any) -> Any:
             {
                 "fparam": torch.from_numpy(d["fparam"]).to(PT_DEVICE),
                 "aparam": torch.from_numpy(d["aparam"]).to(PT_DEVICE),
+                "find_fparam": d["find_fparam"],
+                "find_aparam": d["find_aparam"],
             }
             for d in self.stat_data
         ]
@@ -669,6 +675,8 @@ def eval_jax(self, jax_obj: Any) -> Any:
             {
                 "fparam": jnp.asarray(d["fparam"]),
                 "aparam": jnp.asarray(d["aparam"]),
+                "find_fparam": d["find_fparam"],
+                "find_aparam": d["find_aparam"],
             }
             for d in self.stat_data
         ]
@@ -696,6 +704,8 @@ def eval_array_api_strict(self, array_api_strict_obj: Any) -> Any:
             {
                 "fparam": array_api_strict.asarray(d["fparam"]),
                 "aparam": array_api_strict.asarray(d["aparam"]),
+                "find_fparam": d["find_fparam"],
+                "find_aparam": d["find_aparam"],
             }
             for d in self.stat_data
         ]
@@ -727,6 +737,8 @@ def eval_pd(self, pd_obj: Any) -> Any:
             {
                 "fparam": paddle.to_tensor(d["fparam"]).to(PD_DEVICE),
                 "aparam": paddle.to_tensor(d["aparam"]).to(PD_DEVICE),
+                "find_fparam": d["find_fparam"],
+                "find_aparam": d["find_aparam"],
             }
             for d in self.stat_data
         ]

From 4eb92d38b8723cf01e64b9bef70735c10bc5eae7 Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Fri, 27 Feb 2026 22:57:25 +0800
Subject: [PATCH 54/63] fix: compiled training force loss not decreasing

  Three bugs prevented force loss from decreasing when enable_compile=True:

  1. make_fx traced with model.eval(), capturing create_graph=False in the
     decomposed autograd.grad ops. Force tensors were detached from model
     parameters, so force loss backprop could not reach the weights.
     Fix: trace in model.train() mode.

  2. _CompiledModel.forward() used extended_force[:, :nloc, :] instead of
     scatter-summing ghost atom contributions via mapping. This produced
     wrong force values for periodic systems.
     Fix: use scatter_add_ with mapping, matching communicate_extended_output.

  3. torch.compile inductor backend silently drops second-order gradients
     through make_fx-decomposed autograd.grad ops (verified: 0/32 params
     receive grad with inductor vs 24/32 with aot_eager).
     Fix: default to aot_eager backend.
---
 deepmd/pt_expt/train/training.py      | 37 ++++++++--
 source/tests/pt_expt/test_training.py | 99 +++++++++++++++++++++++++++
 2 files changed, 131 insertions(+), 5 deletions(-)

diff --git a/deepmd/pt_expt/train/training.py b/deepmd/pt_expt/train/training.py
index 50354af79f..5b80556197 100644
--- a/deepmd/pt_expt/train/training.py
+++ b/deepmd/pt_expt/train/training.py
@@ -137,7 +137,12 @@ def _trace_and_compile(
     )
 
     was_training = model.training
-    model.eval()
+    # Trace in train mode so that create_graph=True is captured inside
+    # task_deriv_one.  Without this, the autograd.grad that computes
+    # forces is traced with create_graph=False (eval mode), producing
+    # force tensors that are detached from model parameters — force loss
+    # backprop cannot reach the weights and force RMSE never decreases.
+    model.train()
 
     def fn(
         extended_coord: torch.Tensor,
@@ -162,9 +167,15 @@ def fn(
     # change at runtime, the caller catches the error and retraces.
     traced_lower = make_fx(fn)(ext_coord, ext_atype, nlist, mapping, fparam, aparam)
 
-    if was_training:
-        model.train()
+    if not was_training:
+        model.eval()
 
+    # The inductor backend does not propagate gradients through the
+    # make_fx-decomposed autograd.grad ops (second-order gradients for
+    # force training).  Use "aot_eager" which correctly preserves the
+    # gradient chain while still benefiting from make_fx decomposition.
+    if "backend" not in compile_opts:
+        compile_opts["backend"] = "aot_eager"
     compiled_lower = torch.compile(traced_lower, dynamic=False, **compile_opts)
     return compiled_lower
 
@@ -299,12 +310,28 @@ def forward(
             ext_coord, ext_atype, nlist, mapping, fparam, aparam
         )
 
-        # Translate forward_lower keys -> forward keys
+        # Translate forward_lower keys -> forward keys.
+        # ``extended_force`` lives on all extended atoms (nf, nall, 3).
+        # Ghost-atom forces must be scatter-summed back to local atoms
+        # via ``mapping`` — the same operation ``communicate_extended_output``
+        # performs in the uncompiled path.
         out: dict[str, torch.Tensor] = {}
         out["atom_energy"] = result["atom_energy"]
         out["energy"] = result["energy"]
         if "extended_force" in result:
-            out["force"] = result["extended_force"][:, :nloc, :]
+            ext_force = result["extended_force"]  # (nf, nall_padded, 3)
+            # mapping may be padded; only use actual_nall entries
+            map_actual = mapping[:, :actual_nall]  # (nf, actual_nall)
+            ext_force_actual = ext_force[:, :actual_nall, :]  # (nf, actual_nall, 3)
+            # scatter-sum extended forces onto local atoms
+            idx = map_actual.unsqueeze(-1).expand_as(
+                ext_force_actual
+            )  # (nf, actual_nall, 3)
+            force = torch.zeros(
+                nframes, nloc, 3, dtype=ext_force.dtype, device=ext_force.device
+            )
+            force.scatter_add_(1, idx, ext_force_actual)
+            out["force"] = force
         if "virial" in result:
             out["virial"] = result["virial"]
         if "extended_virial" in result:
diff --git a/source/tests/pt_expt/test_training.py b/source/tests/pt_expt/test_training.py
index 1943f67915..4db9c09af1 100644
--- a/source/tests/pt_expt/test_training.py
+++ b/source/tests/pt_expt/test_training.py
@@ -232,6 +232,105 @@ def test_nall_growth_triggers_recompile(self) -> None:
             shutil.rmtree(tmpdir, ignore_errors=True)
 
 
+class TestCompiledConsistency(unittest.TestCase):
+    """Verify compiled model produces the same energy/force/virial as uncompiled."""
+
+    @classmethod
+    def setUpClass(cls) -> None:
+        data_dir = os.path.join(EXAMPLE_DIR, "data")
+        if not os.path.isdir(data_dir):
+            raise unittest.SkipTest(f"Example data not found: {data_dir}")
+        cls.data_dir = data_dir
+
+    def test_compiled_matches_uncompiled(self) -> None:
+        """Energy, force, virial from compiled model must match uncompiled."""
+        from deepmd.pt_expt.train.training import (
+            _CompiledModel,
+        )
+
+        config = _make_config(self.data_dir, numb_steps=1)
+        # enable virial in loss so the model returns it
+        config["loss"]["start_pref_v"] = 1.0
+        config["loss"]["limit_pref_v"] = 1.0
+        config = update_deepmd_input(config, warning=False)
+        config = normalize(config)
+
+        tmpdir = tempfile.mkdtemp(prefix="pt_expt_consistency_")
+        try:
+            old_cwd = os.getcwd()
+            os.chdir(tmpdir)
+            try:
+                trainer = get_trainer(config)
+                # Uncompiled model reference
+                uncompiled_model = trainer.model
+                uncompiled_model.eval()
+
+                # Build compiled model from the same weights
+                config_compiled = _make_config(self.data_dir, numb_steps=1)
+                config_compiled["loss"]["start_pref_v"] = 1.0
+                config_compiled["loss"]["limit_pref_v"] = 1.0
+                config_compiled["training"]["enable_compile"] = True
+                config_compiled = update_deepmd_input(config_compiled, warning=False)
+                config_compiled = normalize(config_compiled)
+                trainer_compiled = get_trainer(config_compiled)
+                compiled_model = trainer_compiled.wrapper.model
+                self.assertIsInstance(compiled_model, _CompiledModel)
+
+                # Copy uncompiled weights to compiled model so they match
+                compiled_model.original_model.load_state_dict(
+                    uncompiled_model.state_dict()
+                )
+                compiled_model.eval()
+
+                # Get a batch and run both models
+                input_dict, _ = trainer.get_data(is_train=True)
+                coord = input_dict["coord"].detach()
+                atype = input_dict["atype"].detach()
+                box = input_dict.get("box")
+                if box is not None:
+                    box = box.detach()
+
+                # Force is computed via autograd.grad inside the model, so
+                # we cannot use torch.no_grad() here.
+                coord_uc = coord.clone().requires_grad_(True)
+                pred_uc = uncompiled_model(coord_uc, atype, box)
+
+                pred_c = compiled_model(coord.clone(), atype, box)
+
+                # Energy
+                torch.testing.assert_close(
+                    pred_c["energy"],
+                    pred_uc["energy"],
+                    atol=1e-10,
+                    rtol=1e-10,
+                    msg="energy mismatch between compiled and uncompiled",
+                )
+                # Force
+                self.assertIn("force", pred_c, "compiled model missing 'force'")
+                self.assertIn("force", pred_uc, "uncompiled model missing 'force'")
+                torch.testing.assert_close(
+                    pred_c["force"],
+                    pred_uc["force"],
+                    atol=1e-10,
+                    rtol=1e-10,
+                    msg="force mismatch between compiled and uncompiled",
+                )
+                # Virial
+                if "virial" in pred_uc:
+                    self.assertIn("virial", pred_c, "compiled model missing 'virial'")
+                    torch.testing.assert_close(
+                        pred_c["virial"],
+                        pred_uc["virial"],
+                        atol=1e-10,
+                        rtol=1e-10,
+                        msg="virial mismatch between compiled and uncompiled",
+                    )
+            finally:
+                os.chdir(old_cwd)
+        finally:
+            shutil.rmtree(tmpdir, ignore_errors=True)
+
+
 class TestGetData(unittest.TestCase):
     """Test the batch data conversion in Trainer.get_data."""
 

From fc980d5b1dec12cf6dec8e06da7ad78d755c7137 Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Fri, 27 Feb 2026 23:22:21 +0800
Subject: [PATCH 55/63] fix the rmse_v inconsistency but in the dp backend.
 improve the consistency ut for checking all loss terms.

---
 deepmd/dpmodel/loss/ener.py               |  2 +-
 source/tests/consistent/common.py         | 73 ++++++++++++++---------
 source/tests/consistent/loss/test_ener.py | 13 +++-
 3 files changed, 57 insertions(+), 31 deletions(-)

diff --git a/deepmd/dpmodel/loss/ener.py b/deepmd/dpmodel/loss/ener.py
index e512072509..9ab141bdc2 100644
--- a/deepmd/dpmodel/loss/ener.py
+++ b/deepmd/dpmodel/loss/ener.py
@@ -212,7 +212,7 @@ def call(
                 )
                 loss += pref_v * l_huber_loss
             more_loss["rmse_v"] = self.display_if_exist(
-                xp.sqrt(l2_virial_loss), find_virial
+                xp.sqrt(l2_virial_loss) * atom_norm, find_virial
             )
         if self.has_ae:
             atom_ener_reshape = xp.reshape(atom_ener, (-1,))
diff --git a/source/tests/consistent/common.py b/source/tests/consistent/common.py
index 76b7e9cb53..1d08fe67c9 100644
--- a/source/tests/consistent/common.py
+++ b/source/tests/consistent/common.py
@@ -238,7 +238,9 @@ class RefBackend(Enum):
         ARRAY_API_STRICT = 7
 
     @abstractmethod
-    def extract_ret(self, ret: Any, backend: RefBackend) -> tuple[np.ndarray, ...]:
+    def extract_ret(
+        self, ret: Any, backend: RefBackend
+    ) -> tuple[np.ndarray, ...] | dict[str, np.ndarray]:
         """Extract the return value when comparing with other backends.
 
         Parameters
@@ -250,10 +252,43 @@ def extract_ret(self, ret: Any, backend: RefBackend) -> tuple[np.ndarray, ...]:
 
         Returns
         -------
-        tuple[np.ndarray, ...]
-            The extracted return value
+        tuple[np.ndarray, ...] | dict[str, np.ndarray]
+            The extracted return value. If a dict is returned, keys are used
+            in error messages to identify which value mismatches.
         """
 
+    def _compare_ret(self, ret1, ret2) -> None:
+        """Compare two extracted return values (tuple or dict).
+
+        For dicts, keys must match exactly unless one dict contains only
+        ``"loss"`` (e.g. TF backend), in which case only ``"loss"`` is compared.
+        """
+        if isinstance(ret1, dict) and isinstance(ret2, dict):
+            keys1, keys2 = sorted(ret1.keys()), sorted(ret2.keys())
+            if keys1 == ["loss"] or keys2 == ["loss"]:
+                compare_keys = ["loss"]
+            else:
+                self.assertEqual(
+                    keys1,
+                    keys2,
+                    f"Keys mismatch: {keys1} vs {keys2}",
+                )
+                compare_keys = keys1
+            for key in compare_keys:
+                rr1, rr2 = ret1[key], ret2[key]
+                if rr1 is SKIP_FLAG or rr2 is SKIP_FLAG:
+                    continue
+                np.testing.assert_allclose(
+                    rr1, rr2, rtol=self.rtol, atol=self.atol, err_msg=f"key: {key}"
+                )
+                assert rr1.dtype == rr2.dtype, f"key {key}: {rr1.dtype} != {rr2.dtype}"
+        else:
+            for rr1, rr2 in zip(ret1, ret2, strict=True):
+                if rr1 is SKIP_FLAG or rr2 is SKIP_FLAG:
+                    continue
+                np.testing.assert_allclose(rr1, rr2, rtol=self.rtol, atol=self.atol)
+                assert rr1.dtype == rr2.dtype, f"{rr1.dtype} != {rr2.dtype}"
+
     def build_eval_tf(
         self, sess: "tf.Session", obj: Any, suffix: str
     ) -> list[np.ndarray]:
@@ -388,11 +423,7 @@ def test_tf_consistent_with_ref(self) -> None:
         data2.pop("@version")
 
         np.testing.assert_equal(data1, data2)
-        for rr1, rr2 in zip(ret1, ret2, strict=True):
-            np.testing.assert_allclose(
-                rr1.ravel(), rr2.ravel(), rtol=self.rtol, atol=self.atol
-            )
-            assert rr1.dtype == rr2.dtype, f"{rr1.dtype} != {rr2.dtype}"
+        self._compare_ret(ret1, ret2)
 
     def test_tf_self_consistent(self) -> None:
         """Test whether TF is self consistent."""
@@ -424,11 +455,7 @@ def test_dp_consistent_with_ref(self) -> None:
         ret2 = self.extract_ret(ret2, self.RefBackend.DP)
         data2 = dp_obj.serialize()
         np.testing.assert_equal(data1, data2)
-        for rr1, rr2 in zip(ret1, ret2, strict=True):
-            if rr1 is SKIP_FLAG or rr2 is SKIP_FLAG:
-                continue
-            np.testing.assert_allclose(rr1, rr2, rtol=self.rtol, atol=self.atol)
-            assert rr1.dtype == rr2.dtype, f"{rr1.dtype} != {rr2.dtype}"
+        self._compare_ret(ret1, ret2)
 
     @unittest.skipIf(TEST_DEVICE != "cpu" and CI, "Only test on CPU.")
     def test_dp_self_consistent(self) -> None:
@@ -469,9 +496,7 @@ def test_pt_consistent_with_ref(self) -> None:
         data1.pop("@variables", None)
         data2.pop("@variables", None)
         np.testing.assert_equal(data1, data2)
-        for rr1, rr2 in zip(ret1, ret2, strict=True):
-            np.testing.assert_allclose(rr1, rr2, rtol=self.rtol, atol=self.atol)
-            assert rr1.dtype == rr2.dtype, f"{rr1.dtype} != {rr2.dtype}"
+        self._compare_ret(ret1, ret2)
 
     def test_pt_self_consistent(self) -> None:
         """Test whether PT is self consistent."""
@@ -510,9 +535,7 @@ def test_pt_expt_consistent_with_ref(self) -> None:
         data1.pop("@variables", None)
         data2.pop("@variables", None)
         np.testing.assert_equal(data1, data2)
-        for rr1, rr2 in zip(ret1, ret2, strict=True):
-            np.testing.assert_allclose(rr1, rr2, rtol=self.rtol, atol=self.atol)
-            assert rr1.dtype == rr2.dtype, f"{rr1.dtype} != {rr2.dtype}"
+        self._compare_ret(ret1, ret2)
 
     def test_pt_expt_self_consistent(self) -> None:
         """Test whether PT exportable is self consistent."""
@@ -547,9 +570,7 @@ def test_jax_consistent_with_ref(self) -> None:
         data1.pop("@variables", None)
         data2.pop("@variables", None)
         np.testing.assert_equal(data1, data2)
-        for rr1, rr2 in zip(ret1, ret2, strict=True):
-            np.testing.assert_allclose(rr1, rr2, rtol=self.rtol, atol=self.atol)
-            assert rr1.dtype == rr2.dtype, f"{rr1.dtype} != {rr2.dtype}"
+        self._compare_ret(ret1, ret2)
 
     def test_jax_self_consistent(self) -> None:
         """Test whether JAX is self consistent."""
@@ -589,9 +610,7 @@ def test_pd_consistent_with_ref(self):
         data1.pop("@variables", None)
         data2.pop("@variables", None)
         np.testing.assert_equal(data1, data2)
-        for rr1, rr2 in zip(ret1, ret2, strict=True):
-            np.testing.assert_allclose(rr1, rr2, rtol=self.rtol, atol=self.atol)
-            assert rr1.dtype == rr2.dtype, f"{rr1.dtype} != {rr2.dtype}"
+        self._compare_ret(ret1, ret2)
 
     def test_pd_self_consistent(self):
         """Test whether PD is self consistent."""
@@ -624,9 +643,7 @@ def test_array_api_strict_consistent_with_ref(self) -> None:
         ret2 = self.extract_ret(ret2, self.RefBackend.ARRAY_API_STRICT)
         data2 = array_api_strict_obj.serialize()
         np.testing.assert_equal(data1, data2)
-        for rr1, rr2 in zip(ret1, ret2, strict=True):
-            np.testing.assert_allclose(rr1, rr2, rtol=self.rtol, atol=self.atol)
-            assert rr1.dtype == rr2.dtype, f"{rr1.dtype} != {rr2.dtype}"
+        self._compare_ret(ret1, ret2)
 
     @unittest.skipIf(TEST_DEVICE != "cpu" and CI, "Only test on CPU.")
     def test_array_api_strict_self_consistent(self) -> None:
diff --git a/source/tests/consistent/loss/test_ener.py b/source/tests/consistent/loss/test_ener.py
index b23ab1c01c..1cc662fc5b 100644
--- a/source/tests/consistent/loss/test_ener.py
+++ b/source/tests/consistent/loss/test_ener.py
@@ -251,8 +251,17 @@ def eval_pd(self, pd_obj: Any) -> Any:
         more_loss = {kk: to_numpy_array(vv) for kk, vv in more_loss.items()}
         return loss, more_loss
 
-    def extract_ret(self, ret: Any, backend) -> tuple[np.ndarray, ...]:
-        return (ret[0],)
+    def extract_ret(self, ret: Any, backend) -> dict[str, np.ndarray]:
+        loss = ret[0]
+        result = {"loss": np.atleast_1d(np.asarray(loss, dtype=np.float64))}
+        if len(ret) > 1:
+            more_loss = ret[1]
+            for k in sorted(more_loss):
+                if k.startswith("rmse_"):
+                    result[k] = np.atleast_1d(
+                        np.asarray(more_loss[k], dtype=np.float64)
+                    )
+        return result
 
     @property
     def rtol(self) -> float:

From 3656a6995c477d770808a6d7f90658209ace6a68 Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Sat, 28 Feb 2026 00:17:19 +0800
Subject: [PATCH 56/63] fix tests

---
 source/tests/consistent/model/test_dipole.py | 14 +++++++++++++-
 source/tests/consistent/model/test_ener.py   | 14 +++++++++++++-
 source/tests/consistent/model/test_polar.py  | 14 +++++++++++++-
 3 files changed, 39 insertions(+), 3 deletions(-)

diff --git a/source/tests/consistent/model/test_dipole.py b/source/tests/consistent/model/test_dipole.py
index 76251af6d2..7ea45496bc 100644
--- a/source/tests/consistent/model/test_dipole.py
+++ b/source/tests/consistent/model/test_dipole.py
@@ -1346,6 +1346,7 @@ def setUp(self) -> None:
             "dipole": dipole_stat,
             "find_dipole": np.float32(1.0),
             "aparam": aparam_stat,
+            "find_aparam": np.float32(1.0),
         }
         # pt sample (torch tensors)
         pt_sample = {
@@ -1357,6 +1358,7 @@ def setUp(self) -> None:
             "dipole": numpy_to_torch(dipole_stat),
             "find_dipole": np.float32(1.0),
             "aparam": numpy_to_torch(aparam_stat),
+            "find_aparam": np.float32(1.0),
         }
 
         if self.fparam_in_data:
@@ -1365,9 +1367,19 @@ def setUp(self) -> None:
             )
             np_sample["fparam"] = fparam_stat
             pt_sample["fparam"] = numpy_to_torch(fparam_stat)
+            np_sample["find_fparam"] = np.float32(1.0)
+            pt_sample["find_fparam"] = np.float32(1.0)
             self.expected_fparam_avg = np.mean(fparam_stat, axis=0)
         else:
-            # No fparam → _make_wrapped_sampler injects default_fparam
+            # No fparam in data.  dpmodel keeps zero-padded fparam with
+            # find_fparam=0; _make_wrapped_sampler injects default_fparam.
+            np_sample["fparam"] = np.zeros(
+                (nframes, 2), dtype=GLOBAL_NP_FLOAT_PRECISION
+            )
+            np_sample["find_fparam"] = np.float32(0.0)
+            # pt pipeline pops fparam/find_fparam (stat.py), then
+            # wrapped_sampler injects default_fparam when keys are absent.
+            # pt_sample has no fparam/find_fparam keys.
             self.expected_fparam_avg = np.array([0.5, -0.3])
 
         self.np_sampled = [np_sample]
diff --git a/source/tests/consistent/model/test_ener.py b/source/tests/consistent/model/test_ener.py
index f47365e2cf..1229b2763d 100644
--- a/source/tests/consistent/model/test_ener.py
+++ b/source/tests/consistent/model/test_ener.py
@@ -1636,6 +1636,7 @@ def setUp(self) -> None:
             "energy": energy_stat,
             "find_energy": np.float32(1.0),
             "aparam": aparam_stat,
+            "find_aparam": np.float32(1.0),
         }
         # pt sample (torch tensors)
         pt_sample = {
@@ -1647,6 +1648,7 @@ def setUp(self) -> None:
             "energy": numpy_to_torch(energy_stat),
             "find_energy": np.float32(1.0),
             "aparam": numpy_to_torch(aparam_stat),
+            "find_aparam": np.float32(1.0),
         }
 
         if self.fparam_in_data:
@@ -1655,9 +1657,19 @@ def setUp(self) -> None:
             )
             np_sample["fparam"] = fparam_stat
             pt_sample["fparam"] = numpy_to_torch(fparam_stat)
+            np_sample["find_fparam"] = np.float32(1.0)
+            pt_sample["find_fparam"] = np.float32(1.0)
             self.expected_fparam_avg = np.mean(fparam_stat, axis=0)
         else:
-            # No fparam → _make_wrapped_sampler injects default_fparam
+            # No fparam in data.  dpmodel keeps zero-padded fparam with
+            # find_fparam=0; _make_wrapped_sampler injects default_fparam.
+            np_sample["fparam"] = np.zeros(
+                (nframes, 2), dtype=GLOBAL_NP_FLOAT_PRECISION
+            )
+            np_sample["find_fparam"] = np.float32(0.0)
+            # pt pipeline pops fparam/find_fparam (stat.py), then
+            # wrapped_sampler injects default_fparam when keys are absent.
+            # pt_sample has no fparam/find_fparam keys.
             self.expected_fparam_avg = np.array([0.5, -0.3])
 
         self.np_sampled = [np_sample]
diff --git a/source/tests/consistent/model/test_polar.py b/source/tests/consistent/model/test_polar.py
index 93e696596e..80d75edfae 100644
--- a/source/tests/consistent/model/test_polar.py
+++ b/source/tests/consistent/model/test_polar.py
@@ -1340,6 +1340,7 @@ def setUp(self) -> None:
             "polarizability": polar_stat,
             "find_polarizability": np.float32(1.0),
             "aparam": aparam_stat,
+            "find_aparam": np.float32(1.0),
         }
         # pt sample (torch tensors)
         pt_sample = {
@@ -1351,6 +1352,7 @@ def setUp(self) -> None:
             "polarizability": numpy_to_torch(polar_stat),
             "find_polarizability": np.float32(1.0),
             "aparam": numpy_to_torch(aparam_stat),
+            "find_aparam": np.float32(1.0),
         }
 
         if self.fparam_in_data:
@@ -1359,9 +1361,19 @@ def setUp(self) -> None:
             )
             np_sample["fparam"] = fparam_stat
             pt_sample["fparam"] = numpy_to_torch(fparam_stat)
+            np_sample["find_fparam"] = np.float32(1.0)
+            pt_sample["find_fparam"] = np.float32(1.0)
             self.expected_fparam_avg = np.mean(fparam_stat, axis=0)
         else:
-            # No fparam → _make_wrapped_sampler injects default_fparam
+            # No fparam in data.  dpmodel keeps zero-padded fparam with
+            # find_fparam=0; _make_wrapped_sampler injects default_fparam.
+            np_sample["fparam"] = np.zeros(
+                (nframes, 2), dtype=GLOBAL_NP_FLOAT_PRECISION
+            )
+            np_sample["find_fparam"] = np.float32(0.0)
+            # pt pipeline pops fparam/find_fparam (stat.py), then
+            # wrapped_sampler injects default_fparam when keys are absent.
+            # pt_sample has no fparam/find_fparam keys.
             self.expected_fparam_avg = np.array([0.5, -0.3])
 
         self.np_sampled = [np_sample]

From 429bae64bd450b4a48b0d6a98b22285426515af1 Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Sun, 1 Mar 2026 23:38:28 +0800
Subject: [PATCH 57/63] fix ut

---
 source/tests/consistent/common.py | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/source/tests/consistent/common.py b/source/tests/consistent/common.py
index 1d08fe67c9..ed4e2caab9 100644
--- a/source/tests/consistent/common.py
+++ b/source/tests/consistent/common.py
@@ -286,7 +286,9 @@ def _compare_ret(self, ret1, ret2) -> None:
             for rr1, rr2 in zip(ret1, ret2, strict=True):
                 if rr1 is SKIP_FLAG or rr2 is SKIP_FLAG:
                     continue
-                np.testing.assert_allclose(rr1, rr2, rtol=self.rtol, atol=self.atol)
+                np.testing.assert_allclose(
+                    rr1.ravel(), rr2.ravel(), rtol=self.rtol, atol=self.atol
+                )
                 assert rr1.dtype == rr2.dtype, f"{rr1.dtype} != {rr2.dtype}"
 
     def build_eval_tf(

From fb2eb428126a0d784218ee99c3a85ce08fa679be Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Mon, 2 Mar 2026 09:08:48 +0800
Subject: [PATCH 58/63] fix bug

---
 source/tests/common/dpmodel/test_fitting_stat.py | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/source/tests/common/dpmodel/test_fitting_stat.py b/source/tests/common/dpmodel/test_fitting_stat.py
index 101d2a9ad7..498124bd43 100644
--- a/source/tests/common/dpmodel/test_fitting_stat.py
+++ b/source/tests/common/dpmodel/test_fitting_stat.py
@@ -33,7 +33,9 @@ def _make_fake_data_pt(sys_natoms, sys_nframes, avgs, stds):
         tmp_data_f = np.transpose(tmp_data_f, (1, 2, 0))
         tmp_data_a = np.transpose(tmp_data_a, (1, 2, 0))
         sys_dict["fparam"] = tmp_data_f
+        sys_dict["find_fparam"] = np.float32(1.0)
         sys_dict["aparam"] = tmp_data_a
+        sys_dict["find_aparam"] = np.float32(1.0)
         merged_output_stat.append(sys_dict)
     return merged_output_stat
 

From 9b430a457fab32e79ae7bac19d9e86a8a262bc19 Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Mon, 2 Mar 2026 16:16:08 +0800
Subject: [PATCH 59/63] add training ut for dpa3 model

---
 source/tests/pt_expt/test_training.py | 118 ++++++++++++++++++++++++++
 1 file changed, 118 insertions(+)

diff --git a/source/tests/pt_expt/test_training.py b/source/tests/pt_expt/test_training.py
index 4db9c09af1..5d22f3463b 100644
--- a/source/tests/pt_expt/test_training.py
+++ b/source/tests/pt_expt/test_training.py
@@ -374,5 +374,123 @@ def test_batch_shapes(self) -> None:
             shutil.rmtree(tmpdir, ignore_errors=True)
 
 
+def _make_dpa3_config(data_dir: str, numb_steps: int = 5) -> dict:
+    """Build a minimal DPA3 config dict pointing at *data_dir*."""
+    config = {
+        "model": {
+            "type_map": ["O", "H"],
+            "descriptor": {
+                "type": "dpa3",
+                "repflow": {
+                    "n_dim": 8,
+                    "e_dim": 4,
+                    "a_dim": 4,
+                    "nlayers": 2,
+                    "e_rcut": 3.0,
+                    "e_rcut_smth": 0.5,
+                    "e_sel": 18,
+                    "a_rcut": 2.5,
+                    "a_rcut_smth": 0.5,
+                    "a_sel": 10,
+                    "axis_neuron": 4,
+                    "fix_stat_std": 0.3,
+                },
+                "seed": 1,
+            },
+            "fitting_net": {
+                "neuron": [8, 8],
+                "resnet_dt": True,
+                "seed": 1,
+            },
+            "data_stat_nbatch": 1,
+        },
+        "learning_rate": {
+            "type": "exp",
+            "decay_steps": 500,
+            "start_lr": 0.001,
+            "stop_lr": 3.51e-8,
+        },
+        "loss": {
+            "type": "ener",
+            "start_pref_e": 0.02,
+            "limit_pref_e": 1,
+            "start_pref_f": 1000,
+            "limit_pref_f": 1,
+            "start_pref_v": 0,
+            "limit_pref_v": 0,
+        },
+        "training": {
+            "training_data": {
+                "systems": [
+                    os.path.join(data_dir, "data_0"),
+                ],
+                "batch_size": 1,
+            },
+            "validation_data": {
+                "systems": [
+                    os.path.join(data_dir, "data_3"),
+                ],
+                "batch_size": 1,
+                "numb_btch": 1,
+            },
+            "numb_steps": numb_steps,
+            "seed": 10,
+            "disp_file": "lcurve.out",
+            "disp_freq": 5,
+            "save_freq": numb_steps,
+        },
+    }
+    return config
+
+
+class TestTrainingDPA3(unittest.TestCase):
+    """Smoke test for the pt_expt training loop with DPA3 descriptor."""
+
+    @classmethod
+    def setUpClass(cls) -> None:
+        data_dir = os.path.join(EXAMPLE_DIR, "data")
+        if not os.path.isdir(data_dir):
+            raise unittest.SkipTest(f"Example data not found: {data_dir}")
+        cls.data_dir = data_dir
+
+    def test_get_model(self) -> None:
+        """Test that get_model constructs a DPA3 model from config."""
+        config = _make_dpa3_config(self.data_dir)
+        config = update_deepmd_input(config, warning=False)
+        config = normalize(config)
+        model = get_model(config["model"])
+        self.assertIsInstance(model, torch.nn.Module)
+        nparams = sum(p.numel() for p in model.parameters())
+        self.assertGreater(nparams, 0)
+
+    def test_training_loop(self) -> None:
+        """Run a few DPA3 training steps and verify outputs."""
+        config = _make_dpa3_config(self.data_dir, numb_steps=5)
+        config = update_deepmd_input(config, warning=False)
+        config = normalize(config)
+
+        tmpdir = tempfile.mkdtemp(prefix="pt_expt_dpa3_train_")
+        try:
+            old_cwd = os.getcwd()
+            os.chdir(tmpdir)
+            try:
+                trainer = get_trainer(config)
+                trainer.run()
+
+                lcurve_path = os.path.join(tmpdir, "lcurve.out")
+                self.assertTrue(os.path.exists(lcurve_path), "lcurve.out not created")
+
+                with open(lcurve_path) as f:
+                    lines = [l for l in f.readlines() if not l.startswith("#")]
+                self.assertGreater(len(lines), 0, "lcurve.out is empty")
+
+                ckpt_files = [f for f in os.listdir(tmpdir) if f.endswith(".pt")]
+                self.assertGreater(len(ckpt_files), 0, "No checkpoint files saved")
+            finally:
+                os.chdir(old_cwd)
+        finally:
+            shutil.rmtree(tmpdir, ignore_errors=True)
+
+
 if __name__ == "__main__":
     unittest.main()

From cb9f55b2e47044218b7455d403423e7c3c071e0c Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Mon, 2 Mar 2026 18:30:06 +0800
Subject: [PATCH 60/63] fix: load checkpoint before torch.compile to support
 restart

  _compile_model() wraps self.wrapper.model with _CompiledModel, changing
  state_dict keys from model.* to model.original_model.*. When this ran
  before the resume block, load_state_dict would fail on checkpoints saved
  from uncompiled training. Move the compile block after resume so
  checkpoint keys always match, then wrap the restored model.

  Add restart/init_model/restart+compile tests and DPA3 training test.
---
 deepmd/pt_expt/train/training.py      |  28 +++---
 source/tests/pt_expt/test_training.py | 121 ++++++++++++++++++++++++++
 2 files changed, 135 insertions(+), 14 deletions(-)

diff --git a/deepmd/pt_expt/train/training.py b/deepmd/pt_expt/train/training.py
index 5b80556197..03aa586b31 100644
--- a/deepmd/pt_expt/train/training.py
+++ b/deepmd/pt_expt/train/training.py
@@ -467,20 +467,6 @@ def get_sample() -> list[dict[str, np.ndarray]]:
             last_epoch=self.start_step - 1,
         )
 
-        # torch.compile -------------------------------------------------------
-        # The model's forward uses torch.autograd.grad (for forces) with
-        # create_graph=True so the loss backward can differentiate through
-        # forces.  torch.compile does not support this "double backward".
-        #
-        # Solution: use make_fx to trace the model forward, which decomposes
-        # torch.autograd.grad into primitive ops.  The resulting traced
-        # module is then compiled by torch.compile — no double backward.
-        self.enable_compile = training_params.get("enable_compile", False)
-        if self.enable_compile:
-            compile_opts = training_params.get("compile_options", {})
-            log.info("Compiling model with torch.compile (%s)", compile_opts)
-            self._compile_model(compile_opts)
-
         # Resume --------------------------------------------------------------
         if resuming:
             log.info(f"Resuming from {resume_model}.")
@@ -512,6 +498,20 @@ def get_sample() -> list[dict[str, np.ndarray]]:
                     last_epoch=self.start_step - 1,
                 )
 
+        # torch.compile -------------------------------------------------------
+        # The model's forward uses torch.autograd.grad (for forces) with
+        # create_graph=True so the loss backward can differentiate through
+        # forces.  torch.compile does not support this "double backward".
+        #
+        # Solution: use make_fx to trace the model forward, which decomposes
+        # torch.autograd.grad into primitive ops.  The resulting traced
+        # module is then compiled by torch.compile — no double backward.
+        self.enable_compile = training_params.get("enable_compile", False)
+        if self.enable_compile:
+            compile_opts = training_params.get("compile_options", {})
+            log.info("Compiling model with torch.compile (%s)", compile_opts)
+            self._compile_model(compile_opts)
+
     # ------------------------------------------------------------------
     # torch.compile helpers
     # ------------------------------------------------------------------
diff --git a/source/tests/pt_expt/test_training.py b/source/tests/pt_expt/test_training.py
index 5d22f3463b..5a17ca316f 100644
--- a/source/tests/pt_expt/test_training.py
+++ b/source/tests/pt_expt/test_training.py
@@ -374,6 +374,127 @@ def test_batch_shapes(self) -> None:
             shutil.rmtree(tmpdir, ignore_errors=True)
 
 
+class TestRestart(unittest.TestCase):
+    """Test restart and init_model resume paths."""
+
+    @classmethod
+    def setUpClass(cls) -> None:
+        data_dir = os.path.join(EXAMPLE_DIR, "data")
+        if not os.path.isdir(data_dir):
+            raise unittest.SkipTest(f"Example data not found: {data_dir}")
+        cls.data_dir = data_dir
+
+    def _train_and_get_ckpt(self, config: dict, tmpdir: str) -> str:
+        """Train and return the path to the final checkpoint."""
+        trainer = get_trainer(config)
+        trainer.run()
+        # find the latest checkpoint symlink
+        ckpt = os.path.join(tmpdir, "model.ckpt.pt")
+        self.assertTrue(os.path.exists(ckpt), "Checkpoint not created")
+        return ckpt
+
+    def test_restart(self) -> None:
+        """Train 5 steps, restart from checkpoint, train 5 more."""
+        tmpdir = tempfile.mkdtemp(prefix="pt_expt_restart_")
+        try:
+            old_cwd = os.getcwd()
+            os.chdir(tmpdir)
+            try:
+                # Phase 1: train 5 steps
+                config = _make_config(self.data_dir, numb_steps=5)
+                config = update_deepmd_input(config, warning=False)
+                config = normalize(config)
+                ckpt_path = self._train_and_get_ckpt(config, tmpdir)
+
+                # Phase 2: restart from checkpoint, train to step 10
+                config2 = _make_config(self.data_dir, numb_steps=10)
+                config2 = update_deepmd_input(config2, warning=False)
+                config2 = normalize(config2)
+                trainer2 = get_trainer(config2, restart_model=ckpt_path)
+
+                # start_step should be restored
+                self.assertEqual(trainer2.start_step, 5)
+                trainer2.run()
+
+                # lcurve should have entries appended (restart opens in append mode)
+                with open(os.path.join(tmpdir, "lcurve.out")) as f:
+                    lines = [l for l in f.readlines() if not l.startswith("#")]
+                self.assertGreater(len(lines), 0, "lcurve.out is empty after restart")
+            finally:
+                os.chdir(old_cwd)
+        finally:
+            shutil.rmtree(tmpdir, ignore_errors=True)
+
+    def test_init_model(self) -> None:
+        """Train 5 steps, init_model from checkpoint (reset step), train 5 more."""
+        tmpdir = tempfile.mkdtemp(prefix="pt_expt_init_model_")
+        try:
+            old_cwd = os.getcwd()
+            os.chdir(tmpdir)
+            try:
+                # Phase 1: train 5 steps
+                config = _make_config(self.data_dir, numb_steps=5)
+                config = update_deepmd_input(config, warning=False)
+                config = normalize(config)
+                ckpt_path = self._train_and_get_ckpt(config, tmpdir)
+
+                # Phase 2: init_model — weights loaded but step reset to 0
+                config2 = _make_config(self.data_dir, numb_steps=5)
+                config2 = update_deepmd_input(config2, warning=False)
+                config2 = normalize(config2)
+                trainer2 = get_trainer(config2, init_model=ckpt_path)
+
+                # init_model resets step to 0
+                self.assertEqual(trainer2.start_step, 0)
+                trainer2.run()
+
+                with open(os.path.join(tmpdir, "lcurve.out")) as f:
+                    lines = [l for l in f.readlines() if not l.startswith("#")]
+                self.assertGreater(
+                    len(lines), 0, "lcurve.out is empty after init_model"
+                )
+            finally:
+                os.chdir(old_cwd)
+        finally:
+            shutil.rmtree(tmpdir, ignore_errors=True)
+
+    def test_restart_with_compile(self) -> None:
+        """Train uncompiled, restart with compile enabled."""
+        from deepmd.pt_expt.train.training import (
+            _CompiledModel,
+        )
+
+        tmpdir = tempfile.mkdtemp(prefix="pt_expt_restart_compile_")
+        try:
+            old_cwd = os.getcwd()
+            os.chdir(tmpdir)
+            try:
+                # Phase 1: train 5 steps without compile
+                config = _make_config(self.data_dir, numb_steps=5)
+                config = update_deepmd_input(config, warning=False)
+                config = normalize(config)
+                ckpt_path = self._train_and_get_ckpt(config, tmpdir)
+
+                # Phase 2: restart with compile enabled
+                config2 = _make_config(self.data_dir, numb_steps=10)
+                config2["training"]["enable_compile"] = True
+                config2 = update_deepmd_input(config2, warning=False)
+                config2 = normalize(config2)
+                trainer2 = get_trainer(config2, restart_model=ckpt_path)
+
+                self.assertEqual(trainer2.start_step, 5)
+                self.assertIsInstance(trainer2.wrapper.model, _CompiledModel)
+                trainer2.run()
+
+                with open(os.path.join(tmpdir, "lcurve.out")) as f:
+                    lines = [l for l in f.readlines() if not l.startswith("#")]
+                self.assertGreater(len(lines), 0)
+            finally:
+                os.chdir(old_cwd)
+        finally:
+            shutil.rmtree(tmpdir, ignore_errors=True)
+
+
 def _make_dpa3_config(data_dir: str, numb_steps: int = 5) -> dict:
     """Build a minimal DPA3 config dict pointing at *data_dir*."""
     config = {

From 9793548f81a43907c91fd6fb7045af7aab25a613 Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Mon, 2 Mar 2026 18:37:47 +0800
Subject: [PATCH 61/63] fix: remove + self.start_step from both lambdas, since
 last_epoch already handles the offset.

---
 deepmd/pt_expt/train/training.py | 10 +++++-----
 1 file changed, 5 insertions(+), 5 deletions(-)

diff --git a/deepmd/pt_expt/train/training.py b/deepmd/pt_expt/train/training.py
index 03aa586b31..f8730ed271 100644
--- a/deepmd/pt_expt/train/training.py
+++ b/deepmd/pt_expt/train/training.py
@@ -463,7 +463,7 @@ def get_sample() -> list[dict[str, np.ndarray]]:
 
         self.scheduler = torch.optim.lr_scheduler.LambdaLR(
             self.optimizer,
-            lambda step: self.lr_schedule.value(step + self.start_step) / initial_lr,
+            lambda step: self.lr_schedule.value(step) / initial_lr,
             last_epoch=self.start_step - 1,
         )
 
@@ -489,12 +489,12 @@ def get_sample() -> list[dict[str, np.ndarray]]:
             self.wrapper.load_state_dict(state_dict)
             if optimizer_state_dict is not None:
                 self.optimizer.load_state_dict(optimizer_state_dict)
-                # rebuild scheduler from the resumed step
+                # rebuild scheduler from the resumed step.
+                # last_epoch handles the step offset; the lambda must NOT
+                # add self.start_step again (that would double-count).
                 self.scheduler = torch.optim.lr_scheduler.LambdaLR(
                     self.optimizer,
-                    lambda step: (
-                        self.lr_schedule.value(step + self.start_step) / initial_lr
-                    ),
+                    lambda step: self.lr_schedule.value(step) / initial_lr,
                     last_epoch=self.start_step - 1,
                 )
 

From 99c02213908d887c18e3fe4b133daa64efe8226c Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Mon, 2 Mar 2026 18:38:40 +0800
Subject: [PATCH 62/63] add ut

---
 source/tests/pt_expt/test_training.py | 13 +++++++++++++
 1 file changed, 13 insertions(+)

diff --git a/source/tests/pt_expt/test_training.py b/source/tests/pt_expt/test_training.py
index 5a17ca316f..3b3ab247bb 100644
--- a/source/tests/pt_expt/test_training.py
+++ b/source/tests/pt_expt/test_training.py
@@ -414,6 +414,19 @@ def test_restart(self) -> None:
 
                 # start_step should be restored
                 self.assertEqual(trainer2.start_step, 5)
+
+                # LR should match the schedule at the resumed step,
+                # not double-count start_step.
+                expected_lr = trainer2.lr_schedule.value(trainer2.start_step)
+                actual_lr = trainer2.scheduler.get_last_lr()[0]
+                self.assertAlmostEqual(
+                    actual_lr,
+                    expected_lr,
+                    places=10,
+                    msg=f"LR after restart should be lr_schedule({trainer2.start_step})"
+                    f"={expected_lr}, got {actual_lr}",
+                )
+
                 trainer2.run()
 
                 # lcurve should have entries appended (restart opens in append mode)

From f0f260d873698a9cc5232221b25b8de402ab2504 Mon Sep 17 00:00:00 2001
From: Han Wang <wang_han@iapcm.ac.cn>
Date: Tue, 3 Mar 2026 15:44:11 +0800
Subject: [PATCH 63/63] feat(pt_expt): run update_sel neighbor statistics on
 GPU

  Introduce a _update_sel_cls class variable on dpmodel descriptors so
  that each backend can supply its own UpdateSel / NeighborStat.  The
  dpmodel default stays on CPU (numpy); pt_expt overrides the class
  variable with a GPU-aware UpdateSel backed by a @torch_module-wrapped
  NeighborStatOP, so array_api_compat dispatches to torch on DEVICE.
---
 deepmd/dpmodel/descriptor/dpa1.py        |  4 +-
 deepmd/dpmodel/descriptor/dpa2.py        |  4 +-
 deepmd/dpmodel/descriptor/dpa3.py        |  4 +-
 deepmd/dpmodel/descriptor/se_e2_a.py     |  4 +-
 deepmd/dpmodel/descriptor/se_r.py        |  4 +-
 deepmd/dpmodel/descriptor/se_t.py        |  4 +-
 deepmd/dpmodel/descriptor/se_t_tebd.py   |  4 +-
 deepmd/pt_expt/descriptor/dpa1.py        |  5 +-
 deepmd/pt_expt/descriptor/dpa2.py        |  5 +-
 deepmd/pt_expt/descriptor/dpa3.py        |  5 +-
 deepmd/pt_expt/descriptor/se_atten_v2.py |  5 +-
 deepmd/pt_expt/descriptor/se_e2_a.py     |  5 +-
 deepmd/pt_expt/descriptor/se_r.py        |  5 +-
 deepmd/pt_expt/descriptor/se_t.py        |  5 +-
 deepmd/pt_expt/descriptor/se_t_tebd.py   |  5 +-
 deepmd/pt_expt/utils/neighbor_stat.py    | 88 ++++++++++++++++++++++++
 deepmd/pt_expt/utils/update_sel.py       | 14 ++++
 17 files changed, 155 insertions(+), 15 deletions(-)
 create mode 100644 deepmd/pt_expt/utils/neighbor_stat.py
 create mode 100644 deepmd/pt_expt/utils/update_sel.py

diff --git a/deepmd/dpmodel/descriptor/dpa1.py b/deepmd/dpmodel/descriptor/dpa1.py
index 34dcba6335..e0a9d47cac 100644
--- a/deepmd/dpmodel/descriptor/dpa1.py
+++ b/deepmd/dpmodel/descriptor/dpa1.py
@@ -242,6 +242,8 @@ class DescrptDPA1(NativeOP, BaseDescriptor):
        arXiv preprint arXiv:2208.08236.
     """
 
+    _update_sel_cls = UpdateSel
+
     def __init__(
         self,
         rcut: float,
@@ -662,7 +664,7 @@ def update_sel(
             The minimum distance between two atoms
         """
         local_jdata_cpy = local_jdata.copy()
-        min_nbor_dist, sel = UpdateSel().update_one_sel(
+        min_nbor_dist, sel = cls._update_sel_cls().update_one_sel(
             train_data, type_map, local_jdata_cpy["rcut"], local_jdata_cpy["sel"], True
         )
         local_jdata_cpy["sel"] = sel[0]
diff --git a/deepmd/dpmodel/descriptor/dpa2.py b/deepmd/dpmodel/descriptor/dpa2.py
index 5ac636c37c..44e88fa38a 100644
--- a/deepmd/dpmodel/descriptor/dpa2.py
+++ b/deepmd/dpmodel/descriptor/dpa2.py
@@ -441,6 +441,8 @@ class DescrptDPA2(NativeOP, BaseDescriptor):
        Comput Mater 10, 293 (2024). https://doi.org/10.1038/s41524-024-01493-2
     """
 
+    _update_sel_cls = UpdateSel
+
     def __init__(
         self,
         ntypes: int,
@@ -1114,7 +1116,7 @@ def update_sel(
             The minimum distance between two atoms
         """
         local_jdata_cpy = local_jdata.copy()
-        update_sel = UpdateSel()
+        update_sel = cls._update_sel_cls()
         min_nbor_dist, repinit_sel = update_sel.update_one_sel(
             train_data,
             type_map,
diff --git a/deepmd/dpmodel/descriptor/dpa3.py b/deepmd/dpmodel/descriptor/dpa3.py
index e385ae5dda..956607b114 100644
--- a/deepmd/dpmodel/descriptor/dpa3.py
+++ b/deepmd/dpmodel/descriptor/dpa3.py
@@ -337,6 +337,8 @@ class DescrptDPA3(NativeOP, BaseDescriptor):
        arXiv preprint arXiv:2506.01686 (2025).
     """
 
+    _update_sel_cls = UpdateSel
+
     def __init__(
         self,
         ntypes: int,
@@ -729,7 +731,7 @@ def update_sel(
             The minimum distance between two atoms
         """
         local_jdata_cpy = local_jdata.copy()
-        update_sel = UpdateSel()
+        update_sel = cls._update_sel_cls()
         min_nbor_dist, repflow_e_sel = update_sel.update_one_sel(
             train_data,
             type_map,
diff --git a/deepmd/dpmodel/descriptor/se_e2_a.py b/deepmd/dpmodel/descriptor/se_e2_a.py
index 4710987f54..3abdfe750f 100644
--- a/deepmd/dpmodel/descriptor/se_e2_a.py
+++ b/deepmd/dpmodel/descriptor/se_e2_a.py
@@ -149,6 +149,8 @@ class DescrptSeA(NativeOP, BaseDescriptor):
        Systems (NIPS'18). Curran Associates Inc., Red Hook, NY, USA, 4441-4451.
     """
 
+    _update_sel_cls = UpdateSel
+
     def __init__(
         self,
         rcut: float,
@@ -582,7 +584,7 @@ def update_sel(
             The minimum distance between two atoms
         """
         local_jdata_cpy = local_jdata.copy()
-        min_nbor_dist, local_jdata_cpy["sel"] = UpdateSel().update_one_sel(
+        min_nbor_dist, local_jdata_cpy["sel"] = cls._update_sel_cls().update_one_sel(
             train_data, type_map, local_jdata_cpy["rcut"], local_jdata_cpy["sel"], False
         )
         return local_jdata_cpy, min_nbor_dist
diff --git a/deepmd/dpmodel/descriptor/se_r.py b/deepmd/dpmodel/descriptor/se_r.py
index 5ea9ef525f..2fb0414633 100644
--- a/deepmd/dpmodel/descriptor/se_r.py
+++ b/deepmd/dpmodel/descriptor/se_r.py
@@ -128,6 +128,8 @@ class DescrptSeR(NativeOP, BaseDescriptor):
        Systems (NIPS'18). Curran Associates Inc., Red Hook, NY, USA, 4441-4451.
     """
 
+    _update_sel_cls = UpdateSel
+
     def __init__(
         self,
         rcut: float,
@@ -505,7 +507,7 @@ def update_sel(
             The minimum distance between two atoms
         """
         local_jdata_cpy = local_jdata.copy()
-        min_nbor_dist, local_jdata_cpy["sel"] = UpdateSel().update_one_sel(
+        min_nbor_dist, local_jdata_cpy["sel"] = cls._update_sel_cls().update_one_sel(
             train_data, type_map, local_jdata_cpy["rcut"], local_jdata_cpy["sel"], False
         )
         return local_jdata_cpy, min_nbor_dist
diff --git a/deepmd/dpmodel/descriptor/se_t.py b/deepmd/dpmodel/descriptor/se_t.py
index 7877a1e9ab..6e1e30ab1e 100644
--- a/deepmd/dpmodel/descriptor/se_t.py
+++ b/deepmd/dpmodel/descriptor/se_t.py
@@ -116,6 +116,8 @@ class DescrptSeT(NativeOP, BaseDescriptor):
             Not used in this descriptor, only to be compat with input.
     """
 
+    _update_sel_cls = UpdateSel
+
     def __init__(
         self,
         rcut: float,
@@ -505,7 +507,7 @@ def update_sel(
             The minimum distance between two atoms
         """
         local_jdata_cpy = local_jdata.copy()
-        min_nbor_dist, local_jdata_cpy["sel"] = UpdateSel().update_one_sel(
+        min_nbor_dist, local_jdata_cpy["sel"] = cls._update_sel_cls().update_one_sel(
             train_data, type_map, local_jdata_cpy["rcut"], local_jdata_cpy["sel"], False
         )
         return local_jdata_cpy, min_nbor_dist
diff --git a/deepmd/dpmodel/descriptor/se_t_tebd.py b/deepmd/dpmodel/descriptor/se_t_tebd.py
index 994fa63b30..1687ff5ca7 100644
--- a/deepmd/dpmodel/descriptor/se_t_tebd.py
+++ b/deepmd/dpmodel/descriptor/se_t_tebd.py
@@ -141,6 +141,8 @@ class DescrptSeTTebd(NativeOP, BaseDescriptor):
 
     """
 
+    _update_sel_cls = UpdateSel
+
     def __init__(
         self,
         rcut: float,
@@ -500,7 +502,7 @@ def update_sel(
             The minimum distance between two atoms
         """
         local_jdata_cpy = local_jdata.copy()
-        min_nbor_dist, sel = UpdateSel().update_one_sel(
+        min_nbor_dist, sel = cls._update_sel_cls().update_one_sel(
             train_data, type_map, local_jdata_cpy["rcut"], local_jdata_cpy["sel"], True
         )
         local_jdata_cpy["sel"] = sel[0]
diff --git a/deepmd/pt_expt/descriptor/dpa1.py b/deepmd/pt_expt/descriptor/dpa1.py
index 3cef4ef78c..1bab33af8f 100644
--- a/deepmd/pt_expt/descriptor/dpa1.py
+++ b/deepmd/pt_expt/descriptor/dpa1.py
@@ -7,10 +7,13 @@
 from deepmd.pt_expt.descriptor.base_descriptor import (
     BaseDescriptor,
 )
+from deepmd.pt_expt.utils.update_sel import (
+    UpdateSel,
+)
 
 
 @BaseDescriptor.register("se_atten")
 @BaseDescriptor.register("dpa1")
 @torch_module
 class DescrptDPA1(DescrptDPA1DP):
-    pass
+    _update_sel_cls = UpdateSel
diff --git a/deepmd/pt_expt/descriptor/dpa2.py b/deepmd/pt_expt/descriptor/dpa2.py
index db60accaa1..ba7f03e9e6 100644
--- a/deepmd/pt_expt/descriptor/dpa2.py
+++ b/deepmd/pt_expt/descriptor/dpa2.py
@@ -7,9 +7,12 @@
 from deepmd.pt_expt.descriptor.base_descriptor import (
     BaseDescriptor,
 )
+from deepmd.pt_expt.utils.update_sel import (
+    UpdateSel,
+)
 
 
 @BaseDescriptor.register("dpa2")
 @torch_module
 class DescrptDPA2(DescrptDPA2DP):
-    pass
+    _update_sel_cls = UpdateSel
diff --git a/deepmd/pt_expt/descriptor/dpa3.py b/deepmd/pt_expt/descriptor/dpa3.py
index 82dc46a57f..7119f043bd 100644
--- a/deepmd/pt_expt/descriptor/dpa3.py
+++ b/deepmd/pt_expt/descriptor/dpa3.py
@@ -7,9 +7,12 @@
 from deepmd.pt_expt.descriptor.base_descriptor import (
     BaseDescriptor,
 )
+from deepmd.pt_expt.utils.update_sel import (
+    UpdateSel,
+)
 
 
 @BaseDescriptor.register("dpa3")
 @torch_module
 class DescrptDPA3(DescrptDPA3DP):
-    pass
+    _update_sel_cls = UpdateSel
diff --git a/deepmd/pt_expt/descriptor/se_atten_v2.py b/deepmd/pt_expt/descriptor/se_atten_v2.py
index b0ae833075..5be8b94ea2 100644
--- a/deepmd/pt_expt/descriptor/se_atten_v2.py
+++ b/deepmd/pt_expt/descriptor/se_atten_v2.py
@@ -7,9 +7,12 @@
 from deepmd.pt_expt.descriptor.base_descriptor import (
     BaseDescriptor,
 )
+from deepmd.pt_expt.utils.update_sel import (
+    UpdateSel,
+)
 
 
 @BaseDescriptor.register("se_atten_v2")
 @torch_module
 class DescrptSeAttenV2(DescrptSeAttenV2DP):
-    pass
+    _update_sel_cls = UpdateSel
diff --git a/deepmd/pt_expt/descriptor/se_e2_a.py b/deepmd/pt_expt/descriptor/se_e2_a.py
index fea695ebd9..d65682c200 100644
--- a/deepmd/pt_expt/descriptor/se_e2_a.py
+++ b/deepmd/pt_expt/descriptor/se_e2_a.py
@@ -7,10 +7,13 @@
 from deepmd.pt_expt.descriptor.base_descriptor import (
     BaseDescriptor,
 )
+from deepmd.pt_expt.utils.update_sel import (
+    UpdateSel,
+)
 
 
 @BaseDescriptor.register("se_e2_a")
 @BaseDescriptor.register("se_a")
 @torch_module
 class DescrptSeA(DescrptSeADP):
-    pass
+    _update_sel_cls = UpdateSel
diff --git a/deepmd/pt_expt/descriptor/se_r.py b/deepmd/pt_expt/descriptor/se_r.py
index a449614f47..a2456ff58e 100644
--- a/deepmd/pt_expt/descriptor/se_r.py
+++ b/deepmd/pt_expt/descriptor/se_r.py
@@ -7,10 +7,13 @@
 from deepmd.pt_expt.descriptor.base_descriptor import (
     BaseDescriptor,
 )
+from deepmd.pt_expt.utils.update_sel import (
+    UpdateSel,
+)
 
 
 @BaseDescriptor.register("se_e2_r")
 @BaseDescriptor.register("se_r")
 @torch_module
 class DescrptSeR(DescrptSeRDP):
-    pass
+    _update_sel_cls = UpdateSel
diff --git a/deepmd/pt_expt/descriptor/se_t.py b/deepmd/pt_expt/descriptor/se_t.py
index de76b4ecf7..9706f0ceb4 100644
--- a/deepmd/pt_expt/descriptor/se_t.py
+++ b/deepmd/pt_expt/descriptor/se_t.py
@@ -7,6 +7,9 @@
 from deepmd.pt_expt.descriptor.base_descriptor import (
     BaseDescriptor,
 )
+from deepmd.pt_expt.utils.update_sel import (
+    UpdateSel,
+)
 
 
 @BaseDescriptor.register("se_e3")
@@ -14,4 +17,4 @@
 @BaseDescriptor.register("se_a_3be")
 @torch_module
 class DescrptSeT(DescrptSeTDP):
-    pass
+    _update_sel_cls = UpdateSel
diff --git a/deepmd/pt_expt/descriptor/se_t_tebd.py b/deepmd/pt_expt/descriptor/se_t_tebd.py
index 995dc24c3b..37c872ec64 100644
--- a/deepmd/pt_expt/descriptor/se_t_tebd.py
+++ b/deepmd/pt_expt/descriptor/se_t_tebd.py
@@ -7,9 +7,12 @@
 from deepmd.pt_expt.descriptor.base_descriptor import (
     BaseDescriptor,
 )
+from deepmd.pt_expt.utils.update_sel import (
+    UpdateSel,
+)
 
 
 @BaseDescriptor.register("se_e3_tebd")
 @torch_module
 class DescrptSeTTebd(DescrptSeTTebdDP):
-    pass
+    _update_sel_cls = UpdateSel
diff --git a/deepmd/pt_expt/utils/neighbor_stat.py b/deepmd/pt_expt/utils/neighbor_stat.py
new file mode 100644
index 0000000000..cf9d9f3c18
--- /dev/null
+++ b/deepmd/pt_expt/utils/neighbor_stat.py
@@ -0,0 +1,88 @@
+# SPDX-License-Identifier: LGPL-3.0-or-later
+from collections.abc import (
+    Iterator,
+)
+
+import numpy as np
+import torch
+
+from deepmd.dpmodel.utils.neighbor_stat import NeighborStatOP as NeighborStatOPDP
+from deepmd.pt_expt.common import (
+    torch_module,
+)
+from deepmd.pt_expt.utils.env import (
+    DEVICE,
+)
+from deepmd.utils.data_system import (
+    DeepmdDataSystem,
+)
+from deepmd.utils.neighbor_stat import NeighborStat as BaseNeighborStat
+
+
+@torch_module
+class NeighborStatOP(NeighborStatOPDP):
+    pass
+
+
+class NeighborStat(BaseNeighborStat):
+    """Neighbor statistics using torch on DEVICE.
+
+    Parameters
+    ----------
+    ntypes : int
+        The num of atom types
+    rcut : float
+        The cut-off radius
+    mixed_type : bool, optional, default=False
+        Treat all types as a single type.
+    """
+
+    def __init__(
+        self,
+        ntypes: int,
+        rcut: float,
+        mixed_type: bool = False,
+    ) -> None:
+        super().__init__(ntypes, rcut, mixed_type)
+        self.op = NeighborStatOP(ntypes, rcut, mixed_type)
+
+    def iterator(
+        self, data: DeepmdDataSystem
+    ) -> Iterator[tuple[np.ndarray, float, str]]:
+        """Produce neighbor statistics for each data set.
+
+        Yields
+        ------
+        np.ndarray
+            The maximal number of neighbors
+        float
+            The squared minimal distance between two atoms
+        str
+            The directory of the data system
+        """
+        for ii in range(len(data.system_dirs)):
+            for jj in data.data_systems[ii].dirs:
+                data_set = data.data_systems[ii]
+                data_set_data = data_set._load_set(jj)
+                minrr2, max_nnei = self._execute(
+                    data_set_data["coord"],
+                    data_set_data["type"],
+                    data_set_data["box"] if data_set.pbc else None,
+                )
+                yield np.max(max_nnei, axis=0), np.min(minrr2), jj
+
+    def _execute(
+        self,
+        coord: np.ndarray,
+        atype: np.ndarray,
+        cell: np.ndarray | None,
+    ) -> tuple[np.ndarray, np.ndarray]:
+        """Execute the operation on DEVICE."""
+        minrr2, max_nnei = self.op(
+            torch.from_numpy(coord).to(DEVICE),
+            torch.from_numpy(atype).to(DEVICE),
+            torch.from_numpy(cell).to(DEVICE) if cell is not None else None,
+        )
+        minrr2 = minrr2.detach().cpu().numpy()
+        max_nnei = max_nnei.detach().cpu().numpy()
+        return minrr2, max_nnei
diff --git a/deepmd/pt_expt/utils/update_sel.py b/deepmd/pt_expt/utils/update_sel.py
new file mode 100644
index 0000000000..20d3ef9da1
--- /dev/null
+++ b/deepmd/pt_expt/utils/update_sel.py
@@ -0,0 +1,14 @@
+# SPDX-License-Identifier: LGPL-3.0-or-later
+
+from deepmd.pt_expt.utils.neighbor_stat import (
+    NeighborStat,
+)
+from deepmd.utils.update_sel import (
+    BaseUpdateSel,
+)
+
+
+class UpdateSel(BaseUpdateSel):
+    @property
+    def neighbor_stat(self) -> type[NeighborStat]:
+        return NeighborStat