
Commit 4b58c91

Merge branch 'devel' into add_random_fit_finetune
2 parents: 4a8a109 + 4e72a97

50 files changed

Lines changed: 4745 additions & 528 deletions


.github/workflows/test_cuda.yml

Lines changed: 1 addition & 0 deletions
@@ -60,6 +60,7 @@ jobs:
       - run: python -m pytest source/tests --durations=0
         env:
           NUM_WORKERS: 0
+          CUDA_VISIBLE_DEVICES: 0
       - name: Download libtorch
         run: |
           wget https://download.pytorch.org/libtorch/cu121/libtorch-cxx11-abi-shared-with-deps-2.2.1%2Bcu121.zip -O libtorch.zip
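The new env entry pins the test job to a single GPU. A minimal illustration of the effect (not part of the commit; assumes a multi-GPU runner):

# CUDA_VISIBLE_DEVICES must be set before CUDA is initialized in the process.
import os
os.environ["CUDA_VISIBLE_DEVICES"] = "0"

import torch

if torch.cuda.is_available():
    print(torch.cuda.device_count())  # prints 1 even on a multi-GPU machine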

deepmd/dpmodel/atomic_model/linear_atomic_model.py

Lines changed: 10 additions & 3 deletions
@@ -196,11 +196,11 @@ def forward_atomic(
             ]
         ener_list = []
         for i, model in enumerate(self.models):
-            mapping = self.mapping_list[i]
+            type_map_model = self.mapping_list[i]
             ener_list.append(
                 model.forward_atomic(
                     extended_coord,
-                    mapping[extended_atype],
+                    type_map_model[extended_atype],
                     nlists_[i],
                     mapping,
                     fparam,
@@ -414,7 +414,12 @@ def _compute_weight(
         )

         numerator = np.sum(
-            pairwise_rr * np.exp(-pairwise_rr / self.smin_alpha), axis=-1
+            np.where(
+                nlist_larger != -1,
+                pairwise_rr * np.exp(-pairwise_rr / self.smin_alpha),
+                np.zeros_like(nlist_larger),
+            ),
+            axis=-1,
         )  # masked nnei will be zero, no need to handle
         denominator = np.sum(
             np.where(
@@ -436,5 +441,7 @@ def _compute_weight(
         smooth = -6 * u**5 + 15 * u**4 - 10 * u**3 + 1
         coef[mid_mask] = smooth[mid_mask]
         coef[right_mask] = 0
+        # to handle masked atoms
+        coef = np.where(sigma != 0, coef, np.zeros_like(coef))
         self.zbl_weight = coef
         return [1 - np.expand_dims(coef, -1), np.expand_dims(coef, -1)]
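The numerator now zeroes the contributions of padded neighbor slots (index -1) instead of summing whatever stale distances they hold, and coef is forced to zero for masked atoms (sigma == 0). A toy reproduction of the masking pattern, with made-up values:

import numpy as np

# Padded neighbor slots hold -1; their (garbage) distances must not
# contribute to the sum. Values below are made up for illustration.
nlist_larger = np.array([[0, 2, -1, -1]])        # two real neighbors, two pads
pairwise_rr = np.array([[1.0, 2.0, 7.5, 7.5]])   # pad distances are garbage
smin_alpha = 0.1
numerator = np.sum(
    np.where(
        nlist_larger != -1,
        pairwise_rr * np.exp(-pairwise_rr / smin_alpha),
        np.zeros_like(pairwise_rr),
    ),
    axis=-1,
)  # pads contribute exactly zero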

deepmd/dpmodel/common.py

Lines changed: 2 additions & 0 deletions
@@ -24,6 +24,7 @@
     "double": np.float64,
     "int32": np.int32,
     "int64": np.int64,
+    "bool": bool,
     "default": GLOBAL_NP_FLOAT_PRECISION,
     # NumPy doesn't have bfloat16 (and doesn't plan to add)
     # ml_dtypes is a solution, but it seems not supporting np.save/np.load
@@ -39,6 +40,7 @@
     np.int32: "int32",
     np.int64: "int64",
     ml_dtypes.bfloat16: "bfloat16",
+    bool: "bool",
 }
 assert set(RESERVED_PRECISON_DICT.keys()) == set(PRECISION_DICT.values())
 DEFAULT_PRECISION = "float64"
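With bool registered in both tables, a precision name now round-trips through the dtype maps. A minimal sketch assuming the two dicts above (keeping the code base's historical spelling of RESERVED_PRECISON_DICT):

dtype = PRECISION_DICT["bool"]            # -> bool
assert RESERVED_PRECISON_DICT[dtype] == "bool"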

deepmd/dpmodel/descriptor/dpa1.py

Lines changed: 1 addition & 0 deletions
@@ -61,6 +61,7 @@


 def np_softmax(x, axis=-1):
+    x = np.nan_to_num(x)  # to avoid value warning
     e_x = np.exp(x - np.max(x, axis=axis, keepdims=True))
     return e_x / np.sum(e_x, axis=axis, keepdims=True)

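Without the added nan_to_num call, a NaN logit (e.g. from a fully masked attention row) propagates through exp and poisons the whole softmax row while emitting runtime warnings. An illustrative check, not from the commit:

import numpy as np

x = np.array([[1.0, 2.0, np.nan]])
x = np.nan_to_num(x)  # NaN -> 0.0, +/-inf -> large finite values
e_x = np.exp(x - np.max(x, axis=-1, keepdims=True))
print(e_x / np.sum(e_x, axis=-1, keepdims=True))  # finite probabilities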

deepmd/dpmodel/model/__init__.py

Lines changed: 4 additions & 0 deletions
@@ -15,6 +15,9 @@
 from .dp_model import (
     DPModelCommon,
 )
+from .ener_model import (
+    EnergyModel,
+)
 from .make_model import (
     make_model,
 )
@@ -23,6 +26,7 @@
 )

 __all__ = [
+    "EnergyModel",
     "DPModelCommon",
     "SpinModel",
     "make_model",

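With the re-export in place, the native-backend energy model can be imported directly from the package (per the __all__ change above):

from deepmd.dpmodel.model import EnergyModel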
deepmd/dpmodel/model/spin_model.py

Lines changed: 66 additions & 9 deletions
@@ -10,15 +10,21 @@
 from deepmd.dpmodel.atomic_model.dp_atomic_model import (
     DPAtomicModel,
 )
+from deepmd.dpmodel.common import (
+    NativeOP,
+)
 from deepmd.dpmodel.model.make_model import (
     make_model,
 )
+from deepmd.dpmodel.output_def import (
+    ModelOutputDef,
+)
 from deepmd.utils.spin import (
     Spin,
 )


-class SpinModel:
+class SpinModel(NativeOP):
     """A spin model wrapper, with spin input preprocess and output split."""

     def __init__(
@@ -152,15 +158,20 @@ def extend_nlist(extended_atype, nlist):
         nlist_shift = nlist + nall
         nlist[~nlist_mask] = -1
         nlist_shift[~nlist_mask] = -1
-        self_spin = np.arange(0, nloc, dtype=nlist.dtype) + nall
-        self_spin = self_spin.reshape(1, -1, 1).repeat(nframes, axis=0)
-        # self spin + real neighbor + virtual neighbor
+        self_real = (
+            np.arange(0, nloc, dtype=nlist.dtype)
+            .reshape(1, -1, 1)
+            .repeat(nframes, axis=0)
+        )
+        self_spin = self_real + nall
+        # real atom's neighbors: self spin + real neighbor + virtual neighbor
+        # nf x nloc x (1 + nnei + nnei)
+        real_nlist = np.concatenate([self_spin, nlist, nlist_shift], axis=-1)
+        # spin atom's neighbors: real + real neighbor + virtual neighbor
         # nf x nloc x (1 + nnei + nnei)
-        extended_nlist = np.concatenate([self_spin, nlist, nlist_shift], axis=-1)
+        spin_nlist = np.concatenate([self_real, nlist, nlist_shift], axis=-1)
         # nf x (nloc + nloc) x (1 + nnei + nnei)
-        extended_nlist = np.concatenate(
-            [extended_nlist, -1 * np.ones_like(extended_nlist)], axis=-2
-        )
+        extended_nlist = np.concatenate([real_nlist, spin_nlist], axis=-2)
         # update the index for switch
         first_part_index = (nloc <= extended_nlist) & (extended_nlist < nall)
         second_part_index = (nall <= extended_nlist) & (extended_nlist < (nall + nloc))
@@ -187,12 +198,40 @@ def concat_switch_virtual(extended_tensor, extended_tensor_virtual, nloc: int):
         extended_tensor_updated[:, nloc + nall :] = extended_tensor_virtual[:, nloc:]
         return extended_tensor_updated.reshape(out_shape)

+    @staticmethod
+    def expand_aparam(aparam, nloc: int):
+        """Expand the atom parameters for virtual atoms if necessary."""
+        nframes, natom, numb_aparam = aparam.shape
+        if natom == nloc:  # good
+            pass
+        elif natom < nloc:  # for spin with virtual atoms
+            aparam = np.concatenate(
+                [
+                    aparam,
+                    np.zeros(
+                        [nframes, nloc - natom, numb_aparam],
+                        dtype=aparam.dtype,
+                    ),
+                ],
+                axis=1,
+            )
+        else:
+            raise ValueError(
+                f"get an input aparam with {aparam.shape[1]} inputs, "
+                f"which is larger than {nloc} atoms."
+            )
+        return aparam
+
     def get_type_map(self) -> List[str]:
         """Get the type map."""
         tmap = self.backbone_model.get_type_map()
         ntypes = len(tmap) // 2  # ignore the virtual type
         return tmap[:ntypes]

+    def get_ntypes(self):
+        """Returns the number of element types."""
+        return len(self.get_type_map())
+
     def get_rcut(self):
         """Get the cut-off radius."""
         return self.backbone_model.get_rcut()
@@ -251,6 +290,16 @@ def has_spin() -> bool:
         """Returns whether it has spin input and output."""
         return True

+    def model_output_def(self):
+        """Get the output def for the model."""
+        model_output_type = self.backbone_model.model_output_type()
+        if "mask" in model_output_type:
+            model_output_type.pop(model_output_type.index("mask"))
+        var_name = model_output_type[0]
+        backbone_model_atomic_output_def = self.backbone_model.atomic_output_def()
+        backbone_model_atomic_output_def[var_name].magnetic = True
+        return ModelOutputDef(backbone_model_atomic_output_def)
+
     def __getattr__(self, name):
         """Get attribute from the wrapped model."""
         if name in self.__dict__:
@@ -313,8 +362,12 @@ def call(
         The keys are defined by the `ModelOutputDef`.

         """
-        nframes, nloc = coord.shape[:2]
+        nframes, nloc = atype.shape[:2]
+        coord = coord.reshape(nframes, nloc, 3)
+        spin = spin.reshape(nframes, nloc, 3)
         coord_updated, atype_updated = self.process_spin_input(coord, atype, spin)
+        if aparam is not None:
+            aparam = self.expand_aparam(aparam, nloc * 2)
         model_predict = self.backbone_model.call(
             coord_updated,
             atype_updated,
@@ -383,6 +436,8 @@ def call_lower(
         ) = self.process_spin_input_lower(
             extended_coord, extended_atype, extended_spin, nlist, mapping=mapping
         )
+        if aparam is not None:
+            aparam = self.expand_aparam(aparam, nloc * 2)
         model_predict = self.backbone_model.call_lower(
             extended_coord_updated,
             extended_atype_updated,
@@ -401,3 +456,5 @@ def call_lower(
         )[0]
         # for now omit the grad output
         return model_predict
+
+    forward_lower = call_lower
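The new expand_aparam hook exists because the spin wrapper doubles the local atoms with virtual spin atoms, so per-atom parameters supplied for the nloc real atoms must be zero-padded to 2 * nloc before reaching the backbone. A standalone sketch of the padding, with made-up shapes:

import numpy as np

nframes, nloc, numb_aparam = 2, 3, 1
aparam = np.ones([nframes, nloc, numb_aparam])   # given for real atoms only
padded = np.concatenate(
    [aparam, np.zeros([nframes, nloc, numb_aparam], dtype=aparam.dtype)],
    axis=1,
)  # zeros fill the slots of the virtual (spin) atoms
assert padded.shape == (nframes, 2 * nloc, numb_aparam)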

deepmd/dpmodel/output_def.py

Lines changed: 15 additions & 1 deletion
@@ -228,6 +228,11 @@ def __init__(
     def size(self):
         return self.output_size

+    def squeeze(self, dim):
+        # squeeze the shape on the given dimension
+        if -len(self.shape) <= dim < len(self.shape) and self.shape[dim] == 1:
+            self.shape.pop(dim)
+

 class FittingOutputDef:
     """Defines the shapes and other properties of the fitting network outputs.
@@ -306,7 +311,6 @@ def __getitem__(

     def get_data(
         self,
-        key: str,
     ) -> Dict[str, OutputVariableDef]:
         return self.var_defs

@@ -402,6 +406,16 @@ def check_operation_applied(
     return var_def.category & op.value == op.value


+def check_deriv(var_def: OutputVariableDef) -> bool:
+    """Check if a variable is obtained by derivative."""
+    deriv = (
+        check_operation_applied(var_def, OutputVariableOperation.DERV_R)
+        or check_operation_applied(var_def, OutputVariableOperation._SEC_DERV_R)
+        or check_operation_applied(var_def, OutputVariableOperation.DERV_C)
+    )
+    return deriv
+
+
 def do_reduce(
     def_outp_data: Dict[str, OutputVariableDef],
 ) -> Dict[str, OutputVariableDef]:
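check_deriv folds the three derivative flags into a single test on top of check_operation_applied, which is a plain bit-field check. A minimal sketch of that flag test (flag values are illustrative, not the library's):

def applied(category: int, op: int) -> bool:
    # an operation applies iff all of its bits are set in the category
    return category & op == op

REDU, DERV_R, DERV_C = 1, 2, 4           # illustrative flag values
assert applied(REDU | DERV_R, DERV_R)    # a force-like, derived output
assert not applied(REDU, DERV_R)         # a plain reduced output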

deepmd/pt/model/atomic_model/linear_atomic_model.py

Lines changed: 6 additions & 3 deletions
@@ -224,12 +224,12 @@ def forward_atomic(
         ener_list = []

         for i, model in enumerate(self.models):
-            mapping = self.mapping_list[i]
+            type_map_model = self.mapping_list[i].to(extended_atype.device)
             # apply bias to each individual model
             ener_list.append(
                 model.forward_common_atomic(
                     extended_coord,
-                    mapping[extended_atype],
+                    type_map_model[extended_atype],
                     nlists_[i],
                     mapping,
                     fparam,
@@ -239,7 +239,10 @@ def forward_atomic(
         weights = self._compute_weight(extended_coord, extended_atype, nlists_)

         fit_ret = {
-            "energy": torch.sum(torch.stack(ener_list) * torch.stack(weights), dim=0),
+            "energy": torch.sum(
+                torch.stack(ener_list) * torch.stack(weights).to(extended_atype.device),
+                dim=0,
+            ),
         }  # (nframes, nloc, 1)
         return fit_ret
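Both fixes follow the same rule: buffers created on CPU at construction time (the per-model type maps, the stacked weights) must be moved to the device of the tensors they are combined with. A toy reproduction of the failure mode, not from the commit:

import torch

# Indexing a CPU tensor with a CUDA index tensor raises a device-mismatch
# error, hence the explicit .to(...) before indexing.
device = "cuda" if torch.cuda.is_available() else "cpu"
extended_atype = torch.tensor([0, 1, 1, 0], device=device)
type_map_model = torch.tensor([0, 0, 1])  # created on CPU at init time
mapped = type_map_model.to(extended_atype.device)[extended_atype]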

deepmd/pt/model/atomic_model/polar_atomic_model.py

Lines changed: 2 additions & 1 deletion
@@ -49,7 +49,8 @@ def apply_out_stat(

         # (nframes, nloc, 1)
         modified_bias = (
-            modified_bias.unsqueeze(-1) * self.fitting_net.scale[atype]
+            modified_bias.unsqueeze(-1)
+            * (self.fitting_net.scale.to(atype.device))[atype]
         )

         eye = torch.eye(3, dtype=dtype, device=device)

deepmd/pt/model/descriptor/hybrid.py

Lines changed: 6 additions & 2 deletions
@@ -43,6 +43,8 @@ class DescrptHybrid(BaseDescriptor, torch.nn.Module):
     The descriptor can be either an object or a dictionary.
     """

+    nlist_cut_idx: List[torch.Tensor]
+
     def __init__(
         self,
         list: List[Union[BaseDescriptor, Dict[str, Any]]],
@@ -278,11 +280,13 @@ def forward(
         for ii, descrpt in enumerate(self.descrpt_list):
             # cut the nlist to the correct length
             if self.mixed_types() == descrpt.mixed_types():
-                nl = nlist[:, :, self.nlist_cut_idx[ii]]
+                nl = nlist[:, :, self.nlist_cut_idx[ii].to(atype_ext.device)]
             else:
                 # mixed_types is True, but descrpt.mixed_types is False
                 assert nl_distinguish_types is not None
-                nl = nl_distinguish_types[:, :, self.nlist_cut_idx[ii]]
+                nl = nl_distinguish_types[
+                    :, :, self.nlist_cut_idx[ii].to(atype_ext.device)
+                ]
             odescriptor, gr, g2, h2, sw = descrpt(coord_ext, atype_ext, nl, mapping)
             out_descriptor.append(odescriptor)
             if gr is not None:
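The class-level annotation nlist_cut_idx: List[torch.Tensor] is there for TorchScript: a plain list of tensors held as a module attribute must be typed on the class to be scriptable. A minimal sketch of the pattern (hypothetical Holder class, not from the commit):

from typing import List

import torch


class Holder(torch.nn.Module):
    idx_list: List[torch.Tensor]  # required for torch.jit.script

    def __init__(self):
        super().__init__()
        self.idx_list = [torch.tensor([0, 1]), torch.tensor([2])]

    def forward(self, x: torch.Tensor) -> torch.Tensor:
        return x[:, self.idx_list[0]]


scripted = torch.jit.script(Holder())  # scriptable thanks to the annotation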
