Refactor to use functors like fix_nve_kokkos for proper member variable handling

Copilot · frostedoyster · Copilot · commit c6be45f7d01b · 2025-11-11T11:05:23.000Z
Co-authored-by: frostedoyster <98903385+frostedoyster@users.noreply.github.com>
diff --git a/src/KOKKOS/fix_metatomic_kokkos.cpp b/src/KOKKOS/fix_metatomic_kokkos.cpp
@@ -68,6 +68,15 @@ FixMetatomicKokkos<DeviceType>::~FixMetatomicKokkos() {}
 
 /* ---------------------------------------------------------------------- */
 
+template<class DeviceType>
+void FixMetatomicKokkos<DeviceType>::cleanup_copy()
+{
+  // As in FixNVEKokkos: a functor's copy must not free the Fix-owned id/style/vatom.
+  id = style = nullptr; vatom = nullptr;
+}
+
+/* ---------------------------------------------------------------------- */
+
 template<class DeviceType>
 void FixMetatomicKokkos<DeviceType>::init()
 {
@@ -146,28 +155,13 @@ void FixMetatomicKokkos<DeviceType>::initial_integrate(int /*vflag*/)
   atomKK->sync(execution_space,datamask_read);
   atomKK->modified(execution_space,datamask_modify);
 
-  auto x = atomKK->k_x.view<DeviceType>();
-  auto v = atomKK->k_v.view<DeviceType>();
-  auto f = atomKK->k_f.view<DeviceType>();
-  auto rmass = atomKK->k_rmass.view<DeviceType>();
-  auto mass = atomKK->k_mass.view<DeviceType>();
-  auto type = atomKK->k_type.view<DeviceType>();
-  auto mask = atomKK->k_mask.view<DeviceType>();
-
-  // print the first few entries of v for debugging
-  Kokkos::parallel_for(
-      1,
-      KOKKOS_LAMBDA(int i) {
-        printf("Beginning of initial integrate: v[%d] = (%f, %f, %f)\n",
-                i,
-                v(i, 0),
-                v(i, 1),
-                v(i, 2));
-      }
-  );
-  Kokkos::fence();
-
-  std::cout << "In initial_integrate of fix_metatomic/kk" << std::endl;
+  x = atomKK->k_x.view<DeviceType>();
+  v = atomKK->k_v.view<DeviceType>();
+  f = atomKK->k_f.view<DeviceType>();
+  rmass = atomKK->k_rmass.view<DeviceType>();
+  mass = atomKK->k_mass.view<DeviceType>();
+  type = atomKK->k_type.view<DeviceType>();
+  mask = atomKK->k_mask.view<DeviceType>();
 
   int nlocal = atomKK->nlocal;
   int nghost = atomKK->nghost;
@@ -379,40 +373,69 @@ void FixMetatomicKokkos<DeviceType>::initial_integrate(int /*vflag*/)
     // );
 
   // Apply ML predictions to LAMMPS atoms using Kokkos parallel operations on device
-  int groupbit_copy = groupbit;
-  Kokkos::parallel_for(
-      nlocal,
-      KOKKOS_LAMBDA(int i) {
-          if (mask[i] & groupbit_copy) {
-              // Update positions with ML predictions
-              x(i, 0) = positions_kk(i, 0);
-              x(i, 1) = positions_kk(i, 1);
-              x(i, 2) = positions_kk(i, 2);
-
-              // Update velocities from predicted momenta: v = p / m
-              double mass_i = masses_kk[i];
-              v(i, 0) = momenta_kk(i, 0) / mass_i;
-              v(i, 1) = momenta_kk(i, 1) / mass_i;
-              v(i, 2) = momenta_kk(i, 2) / mass_i;
-          }
-      }
-  );
+  if (rmass.data()) {
+    FixMetatomicKokkosApplyPredictionsFunctor<DeviceType,1> functor(this, positions_kk, momenta_kk, masses_kk);
+    Kokkos::parallel_for(nlocal, functor);
+  } else {
+    FixMetatomicKokkosApplyPredictionsFunctor<DeviceType,0> functor(this, positions_kk, momenta_kk, masses_kk);
+    Kokkos::parallel_for(nlocal, functor);
+  }
+  
+  Kokkos::fence();
+}
+
+/* ---------------------------------------------------------------------- */
+
+template<class DeviceType>
+KOKKOS_INLINE_FUNCTION
+void FixMetatomicKokkos<DeviceType>::apply_predictions_item(
+    int i,
+    const Kokkos::View<double**, DeviceType>& positions_kk,
+    const Kokkos::View<double**, DeviceType>& momenta_kk,
+    const Kokkos::View<double*, DeviceType>& masses_kk) const
+{
+  // Body of the apply-predictions kernel for the RMass == 0 case (see
+  // FixMetatomicKokkosApplyPredictionsFunctor): stores the predicted position
+  // and velocity of atom i, taking its mass from masses_kk[i]. Atoms whose
+  // mask does not contain this fix's groupbit are left unchanged.
+  if (!(mask[i] & groupbit)) return;
+
+  // Positions are overwritten component by component.
+  for (int d = 0; d < 3; ++d) x(i, d) = positions_kk(i, d);
+
+  // Momenta become velocities through v = p / m.
+  const double m = masses_kk[i];
+  for (int d = 0; d < 3; ++d) v(i, d) = momenta_kk(i, d) / m;
+}
 
-    // debug print
-        // Kokkos::parallel_for(
-        //     std::min(nlocal, 1),
-        //     KOKKOS_LAMBDA(int i) {
-        //         printf("Debug initial_integrate after ML update: x[%d] = (%f, %f, %f), v[%d] = (%f, %f, %f)\n",
-        //                 i,
-        //                 x(i, 0),
-        //                 x(i, 1),
-        //                 x(i, 2),
-        //                 i,
-        //                 v(i, 0),
-        //                 v(i, 1),
-        //                 v(i, 2));
-        //     }
-        // );
+template<class DeviceType>
+KOKKOS_INLINE_FUNCTION
+void FixMetatomicKokkos<DeviceType>::apply_predictions_rmass_item(
+    int i,
+    const Kokkos::View<double**, DeviceType>& positions_kk,
+    const Kokkos::View<double**, DeviceType>& momenta_kk) const
+{
+  // Body of the apply-predictions kernel for the RMass != 0 case (see
+  // FixMetatomicKokkosApplyPredictionsFunctor): stores the predicted position
+  // and velocity of atom i, taking its mass from rmass[i]. Atoms whose mask
+  // does not contain this fix's groupbit are left unchanged.
+  if (!(mask[i] & groupbit)) return;
+
+  // Positions are overwritten component by component.
+  for (int d = 0; d < 3; ++d) x(i, d) = positions_kk(i, d);
+
+  // Momenta become velocities through v = p / m.
+  const double m = rmass[i];
+  for (int d = 0; d < 3; ++d) v(i, d) = momenta_kk(i, d) / m;
+}
+
+/* ---------------------------------------------------------------------- */
+
+template<class DeviceType>
+KOKKOS_INLINE_FUNCTION
+void FixMetatomicKokkos<DeviceType>::post_force_item(int) const
+{
+  // Intentionally a no-op: post_force uses deep_copy directly, not a per-atom kernel.
 }
 
 /* ---------------------------------------------------------------------- */
@@ -447,70 +470,60 @@ void FixMetatomicKokkos<DeviceType>::final_integrate()
   // Apply velocity corrections from forces added after post_force
   // This handles stochastic forces from Langevin thermostats
   atomKK->sync(execution_space, V_MASK | F_MASK | MASK_MASK | RMASS_MASK | TYPE_MASK);
-  atomKK->modified(execution_space, V_MASK);
   
-  auto v = atomKK->k_v.template view<DeviceType>();
-  auto f = atomKK->k_f.template view<DeviceType>();
-  auto rmass = atomKK->k_rmass.template view<DeviceType>();
-  auto mass = atomKK->k_mass.template view<DeviceType>();
-  auto type = atomKK->k_type.template view<DeviceType>();
-  auto mask = atomKK->k_mask.template view<DeviceType>();
-
-  auto f_pre_kk = this->f_pre_kk;
-  auto groupbit = this->groupbit;
+  v = atomKK->k_v.template view<DeviceType>();
+  f = atomKK->k_f.template view<DeviceType>();
+  rmass = atomKK->k_rmass.template view<DeviceType>();
+  mass = atomKK->k_mass.template view<DeviceType>();
+  type = atomKK->k_type.template view<DeviceType>();
+  mask = atomKK->k_mask.template view<DeviceType>();
   
   int nlocal = atomKK->nlocal;
   if (igroup == atomKK->firstgroup) nlocal = atomKK->nfirst;
 
   double dtf = update->dt * force->ftm2v;
-  bool use_rmass = rmass.data() != nullptr;
-
-  // print the first few entries of v for debugging
-//   Kokkos::parallel_for(
-//       std::min(nlocal, 1),
-//       KOKKOS_LAMBDA(int i) {
-//         printf("Debug final_integrate before correction: v[%d] = (%f, %f, %f)\n",
-//                 i,
-//                 v(i, 0),
-//                 v(i, 1),
-//                 v(i, 2));
-//       }
-//   );
-
-  // Apply force corrections using Kokkos parallel operation
-  Kokkos::parallel_for(
-      nlocal,
-      KOKKOS_LAMBDA(int i) {
-          if (mask[i] & groupbit) {
-              double mass_i = use_rmass ? rmass[i] : mass[type[i]];
-              double dtfm = dtf / mass_i;
-              
-              // Apply only the incremental force (f - f_pre) to velocities
-              v(i, 0) += (f(i, 0) - f_pre_kk(i, 0)) * dtfm;
-              v(i, 1) += (f(i, 1) - f_pre_kk(i, 1)) * dtfm;
-              v(i, 2) += (f(i, 2) - f_pre_kk(i, 2)) * dtfm;
-          }
-      }
-  );
 
-//   auto v = atomKK->k_v.template view<DeviceType>();
-
-  // Print the first few entries of v for debugging
-    // Kokkos::parallel_for(
-    //     std::min(nlocal, 1),
-    //     KOKKOS_LAMBDA(int i) {
-    //         printf("Debug final_integrate after correction: v[%d] = (%f, %f, %f)\n",
-    //                 i,
-    //                 v(i, 0),
-    //                 v(i, 1),
-    //                 v(i, 2));
-    //     }
-    // );
+  // Apply force corrections using Kokkos functor
+  if (rmass.data()) {
+    FixMetatomicKokkosFinalIntegrateFunctor<DeviceType,1> functor(this, dtf);
+    Kokkos::parallel_for(nlocal, functor);
+  } else {
+    FixMetatomicKokkosFinalIntegrateFunctor<DeviceType,0> functor(this, dtf);
+    Kokkos::parallel_for(nlocal, functor);
+  }
+  
+  Kokkos::fence();
+  atomKK->modified(execution_space, V_MASK);
+}
 
-    // atomKK->modified(execution_space, ALL_MASK);
+template<class DeviceType>
+KOKKOS_INLINE_FUNCTION
+void FixMetatomicKokkos<DeviceType>::final_integrate_item(int i, double dtf) const
+{
+  // Per-atom velocity correction using the per-type mass, mass[type[i]].
+  // Only the difference between the current force f and the stored f_pre_kk
+  // is applied; atoms whose mask lacks this fix's groupbit are skipped.
+  if (!(mask[i] & groupbit)) return;
+
+  const double m = mass[type[i]];
+  const double scale = dtf / m;
+  // v += (f - f_pre) * dtf / m, one component at a time
+  for (int d = 0; d < 3; ++d) v(i, d) += (f(i, d) - f_pre_kk(i, d)) * scale;
+}
 
-    // atomKK->sync(execution_space, ALL_MASK);
-    // atomKK->modified(execution_space, ALL_MASK);
+template<class DeviceType>
+KOKKOS_INLINE_FUNCTION
+void FixMetatomicKokkos<DeviceType>::final_integrate_rmass_item(int i, double dtf) const
+{
+  // Per-atom velocity correction using the per-atom mass, rmass[i].
+  // Only the difference between the current force f and the stored f_pre_kk
+  // is applied; atoms whose mask lacks this fix's groupbit are skipped.
+  if (!(mask[i] & groupbit)) return;
+
+  const double m = rmass[i];
+  const double scale = dtf / m;
+  // v += (f - f_pre) * dtf / m, one component at a time
+  for (int d = 0; d < 3; ++d) v(i, d) += (f(i, d) - f_pre_kk(i, d)) * scale;
 }
 
 /* ---------------------------------------------------------------------- */
diff --git a/src/KOKKOS/fix_metatomic_kokkos.h b/src/KOKKOS/fix_metatomic_kokkos.h
@@ -28,6 +28,15 @@ namespace LAMMPS_NS {
 template<class DeviceType>
 class MetatomicSystemAdaptorKokkos;
 
+template<class DeviceType, int RMass>
+struct FixMetatomicKokkosApplyPredictionsFunctor;
+
+template<class DeviceType>
+struct FixMetatomicKokkosPostForceFunctor;
+
+template<class DeviceType, int RMass>
+struct FixMetatomicKokkosFinalIntegrateFunctor;
+
 template<class DeviceType>
 class FixMetatomicKokkos : public FixMetatomic {
  public:
@@ -41,6 +50,22 @@ class FixMetatomicKokkos : public FixMetatomic {
   void post_force(int) override;
   void final_integrate() override;
 
+  KOKKOS_INLINE_FUNCTION
+  void apply_predictions_item(int, const Kokkos::View<double**, DeviceType>&,
+                               const Kokkos::View<double**, DeviceType>&,
+                               const Kokkos::View<double*, DeviceType>&) const;
+  KOKKOS_INLINE_FUNCTION
+  void apply_predictions_rmass_item(int, const Kokkos::View<double**, DeviceType>&,
+                                     const Kokkos::View<double**, DeviceType>&) const;
+  KOKKOS_INLINE_FUNCTION
+  void post_force_item(int) const;
+  KOKKOS_INLINE_FUNCTION
+  void final_integrate_item(int, double) const;
+  KOKKOS_INLINE_FUNCTION
+  void final_integrate_rmass_item(int, double) const;
+
+  void cleanup_copy();
+
  private:
   void pick_device(torch::Device* device, const char* requested);
 
@@ -64,6 +89,57 @@ class FixMetatomicKokkos : public FixMetatomic {
   int datamask_read, datamask_modify;
 };
 
+template<class DeviceType, int RMass>
+struct FixMetatomicKokkosApplyPredictionsFunctor {
+  // Kernel functor: copies the fix and the prediction views, then routes index i by RMass.
+  using device_type = DeviceType;
+  FixMetatomicKokkos<DeviceType> c;
+  Kokkos::View<double**, DeviceType> positions_kk;
+  Kokkos::View<double**, DeviceType> momenta_kk;
+  Kokkos::View<double*, DeviceType> masses_kk;
+
+  FixMetatomicKokkosApplyPredictionsFunctor(FixMetatomicKokkos<DeviceType>* fix,
+      const Kokkos::View<double**, DeviceType>& pos, const Kokkos::View<double**, DeviceType>& mom,
+      const Kokkos::View<double*, DeviceType>& mass)
+    : c(*fix), positions_kk(pos), momenta_kk(mom), masses_kk(mass) { c.cleanup_copy(); }
+
+  KOKKOS_INLINE_FUNCTION
+  void operator()(const int i) const {
+    if (RMass) { c.apply_predictions_rmass_item(i, positions_kk, momenta_kk); return; }
+    c.apply_predictions_item(i, positions_kk, momenta_kk, masses_kk);
+  }
+};
+
+template<class DeviceType>
+struct FixMetatomicKokkosPostForceFunctor {
+  // Kernel functor: copies the fix and forwards each index to post_force_item().
+  using device_type = DeviceType;
+  FixMetatomicKokkos<DeviceType> c;
+
+  FixMetatomicKokkosPostForceFunctor(FixMetatomicKokkos<DeviceType>* fix) : c(*fix) {
+    c.cleanup_copy();
+  }
+
+  KOKKOS_INLINE_FUNCTION
+  void operator()(const int i) const { c.post_force_item(i); }
+};
+
+template<class DeviceType, int RMass>
+struct FixMetatomicKokkosFinalIntegrateFunctor {
+  // Kernel functor: copies the fix, stores dtf, and routes index i by RMass.
+  using device_type = DeviceType;
+  FixMetatomicKokkos<DeviceType> c;
+  double dtf;
+
+  FixMetatomicKokkosFinalIntegrateFunctor(FixMetatomicKokkos<DeviceType>* fix, double dtf_in)
+    : c(*fix), dtf(dtf_in) { c.cleanup_copy(); }
+
+  KOKKOS_INLINE_FUNCTION
+  void operator()(const int i) const {
+    RMass ? c.final_integrate_rmass_item(i, dtf) : c.final_integrate_item(i, dtf);
+  }
+};
+
 }    // namespace LAMMPS_NS
 
 #endif