Working Jarzynski equality (JE) for the entropic spring; code still needs to be cleaned up

kocimil1 · kocimil1 · commit 58bc55bd07d9 · 2026-02-19T14:22:51.000+01:00
diff --git a/cpp/common/OpenCL/OCL_MM.h b/cpp/common/OpenCL/OCL_MM.h
@@ -78,15 +78,14 @@ class OCL_MM: public OCLsystem { public:
     int ibuff_atoms=-1,ibuff_aforces=-1,ibuff_neighs=-1,ibuff_neighCell=-1;
     int ibuff_avel=-1,ibuff_cvf=-1, ibuff_neighForce=-1,  ibuff_bkNeighs=-1, ibuff_bkNeighs_new=-1;
     int ibuff_REQs=-1, ibuff_MMpars=-1, ibuff_BLs=-1,ibuff_BKs=-1,ibuff_Ksp=-1, ibuff_Kpp=-1;   // MMFFf4 params
-    int ibuff_lvecs=-1, ibuff_ilvecs=-1,ibuff_MDpars=-1,ibuff_TDrive=-1, ibuff_pbcshifts=-1; 
+    int ibuff_lvecs=-1, ibuff_ilvecs=-1,ibuff_MDpars=-1,ibuff_TDrive=-1, ibuff_pbcshifts=-1, ibuff_jeParams=-1; 
     int ibuff_constr=-1;
     int ibuff_constrK=-1;
     int ibuff_bboxes=-1;
     int ibuff_sysneighs=-1;
     int ibuff_sysbonds=-1;
     int ibuff_averageForces=-1;
     int ibuff_work=-1;
-    int4 jeParams{0,0,0,0};
 
     int ibuff_samp_ps=-1;
     int ibuff_samp_fs=-1;
@@ -233,6 +232,8 @@ class OCL_MM: public OCLsystem { public:
 
         // Buffer for thermodynamic integration - stores accumulated force differences
         ibuff_averageForces   = newBuffer( "averageForces",   nSystems, sizeof(float4), 0, CL_MEM_READ_WRITE );
+        ibuff_work            = newBuffer( "work",            nSystems, sizeof(float),  0, CL_MEM_READ_WRITE );
+        ibuff_jeParams        = newBuffer( "jeParams",        nSystems, sizeof(int4),   0, CL_MEM_READ_WRITE  );
         ibuff_BKs        = newBuffer( "BKs",        nSystems*nnode,  sizeof(float4), 0, CL_MEM_READ_ONLY  );
         ibuff_Ksp        = newBuffer( "Ksp",        nSystems*nnode,  sizeof(float4), 0, CL_MEM_READ_ONLY  );
         ibuff_Kpp        = newBuffer( "Kpp",        nSystems*nnode,  sizeof(float4), 0, CL_MEM_READ_ONLY  );
@@ -606,7 +607,7 @@ class OCL_MM: public OCLsystem { public:
         err |= useArgBuff( ibuff_sysbonds   ); // 14
         err |= useArgBuff( ibuff_averageForces);// 15
         err |= useArgBuff( ibuff_work       ); // 16
-        err |= _useArg( jeParams            ); // 17
+        err |= useArgBuff( ibuff_jeParams   ); // 17
         OCL_checkError(err, "setup_updateAtomsMMFFf4");
         return task;
         // const int4        n,            // 1 // (natoms,nnode) dimensions of the system
diff --git a/cpp/common/molecular/MMFFBuilder.h b/cpp/common/molecular/MMFFBuilder.h
@@ -4186,6 +4186,7 @@ void toMMFFsp3_loc( MMFFsp3_loc& ff, bool bRealloc=true, bool bEPairs=true, bool
             const Atom& A =  atoms[ia];
             ff.apos  [ia] = A.pos;
             ff.atypes[ia] = A.type;
+            ff.REQs  [ia] = A.REQ;
             AtomType& atyp = params->atypes[A.type];
 
             if(A.iconf>=0){
diff --git a/cpp/common/molecular/MolWorld_sp3_multi.h b/cpp/common/molecular/MolWorld_sp3_multi.h
@@ -122,6 +122,7 @@ class MolWorld_sp3_multi : public MolWorld_sp3, public MultiSolverInterface { pu
     Quat4f* MDpars     =0;  // Molecular dynamics params
     Quat4f* TDrive     =0;  // temperature and drived dynamics
     Quat4f* averageForces =0;  // accumulated force differences for thermodynamic integration
+    Quat4i*   jeParams   = 0;  // parameters for Jarzynski Equality [ nSystems ]
 
     Quat4f* constr     =0;
     Quat4f* constrK    =0;
@@ -389,8 +390,8 @@ void TI_step(double lambda, double dE, double sigma, double dLambda, int nMDstep
                 for(int ia=0; ia<ffls[isys].natoms; ia++){
                     if(ffls[isys].atypes[ia]==params.getAtomType("Si")){
                         if(si_count < nCVs){
-                            Quat4f acon  = Quat4f{initial_positions[si_count].x, initial_positions[si_count].y, initial_positions[si_count].z, 1e2f}; 
-                            Quat4f aconK = Quat4f{final_positions[si_count].x,   final_positions[si_count].y,   final_positions[si_count].z,   (float)nLambda}; 
+                            Quat4f acon  = Quat4f{initial_positions[si_count].x, initial_positions[si_count].y, initial_positions[si_count].z, 5.0f}; 
+                            Quat4f aconK = Quat4f{final_positions[si_count].x,   final_positions[si_count].y,   final_positions[si_count].z,   0.0f}; 
                             constr [isys*ocl.nAtoms + ia] = acon;
                             constrK[isys*ocl.nAtoms + ia] = aconK;
                         }
@@ -402,6 +403,7 @@ void TI_step(double lambda, double dE, double sigma, double dLambda, int nMDstep
             upload( ocl.ibuff_constrK, constrK );
 
             double beta = 1.0 / (const_kB * go.T_target);
+            double dLambda = 1.0 / (double)(nLambda - 1);
             nPerVFs = nPerVFs_;
             int nBatches = nMDsteps / (nLambda * nPerVFs);
             if( nBatches < 1 ) nBatches = 1;
@@ -416,20 +418,15 @@ void TI_step(double lambda, double dE, double sigma, double dLambda, int nMDstep
                 printf("  Equilibrating %d steps...\n", nEQsteps);
                 bSaveTrajectory = false;
                 nPerVFs = nEQsteps;                
-                for(int isys=0; isys<nSystems; isys++){
-                    TDrive[isys].z = -1;
-                }
-                ocl.upload( ocl.ibuff_TDrive, TDrive );
+                for(int isys=0; isys<nSystems; isys++){ jeParams[isys].x = -1; }
+                ocl.upload( ocl.ibuff_jeParams, jeParams );
                 run_ocl_opt( nEQsteps, Fconv );
 
                 // 2. Pulling
                 bSaveTrajectory = true;
-                nPerVFs = nPerVFs_; // High resolution pulling
-                std::vector<bool> bExploring_old(nSystems);
-                for(int isys=0; isys<nSystems; isys++){
-                    TDrive[isys].z = 0;
-                }
-                ocl.upload( ocl.ibuff_TDrive, TDrive );
+                nPerVFs = nPerVFs_;
+                for(int isys=0; isys<nSystems; isys++){ jeParams[isys].x = 0; jeParams[isys].y = nLambda; jeParams[isys].z = nPerVFs; jeParams[isys].w = 0; }
+                ocl.upload( ocl.ibuff_jeParams, jeParams );
                 // Clear work buffer
                 float* zero_work = new float[nSystems * nLambda];
                 for(int i=0; i<nSystems * nLambda; i++) zero_work[i] = 0;
@@ -438,16 +435,24 @@ void TI_step(double lambda, double dE, double sigma, double dLambda, int nMDstep
 
                 printf("  Pulling for %d * %d = %d steps...\n", nLambda, nPerVFs, nLambda*nPerVFs);
                 run_ocl_opt( nLambda*nPerVFs, Fconv );
-                for(int isys=0; isys<nSystems; isys++) gopts[isys].bExploring = bExploring_old[isys];
 
                 // 3. Download work and accumulate
                 ocl.download( ocl.ibuff_work, gpu_work );
                 ocl.finishRaw();
+                // DEBUG: Print first few work values for system 0 in first batch
+                if(batch==0){
+                    printf("DEBUG gpu_work[sys=0]: ");
+                    for(int i=0; i<5; i++) printf("[%d]=%g ", i, gpu_work[i]);
+                    printf(" dLambda=%g\n", dLambda);
+                    printf("DEBUG gpu_work[sys=0] dW: ");
+                    for(int i=0; i<5; i++) printf("[%d]=%g ", i, gpu_work[i]*dLambda);
+                    printf("\n");
+                }
                    
                 for(int isys=0; isys<nSystems; isys++){
                     double W_traj = 0;
                     for(int i=0; i<nLambda; i++){
-                        float dW = gpu_work[ isys * nLambda + i ];
+                        float dW = gpu_work[ isys * nLambda + i ]*dLambda;
                         W_traj += (double)dW;
                         //if(isys==0 && i==0) printf("batch %d, isys %d, i %d, W %f\n", batch, isys, i, W);
                         sum_exp_W[i] += exp(-beta * W_traj);
@@ -526,6 +531,7 @@ void realloc( int nSystems_ ){
 
     // Initialize averageForces buffer for thermodynamic integration
     _realloc0( averageForces, nSystems, Quat4fZero );
+    _realloc0( jeParams, nSystems, Quat4iMinusOnes );
 
     _realloc( pbcshifts, ocl.npbc*nSystems );
 
@@ -1180,7 +1186,8 @@ double evalVFs( double Fconv=1e-6 ){
             //     TDrive[isys].z = 0;
             // }
             // printf("evalVFs() TDrive[isys].z = %f\n", TDrive[isys].z);
-            TDrive[isys].z += 1;
+            jeParams[isys].x += 1;
+            jeParams[isys].w = 0;
             // printf("evalVFs() TDrive[isys].z = %f\n", TDrive[isys].z);
             TDrive[isys].w = randf(-1.0,1.0); 
         }else{
@@ -1193,6 +1200,7 @@ double evalVFs( double Fconv=1e-6 ){
     //printf( "MDpars{%g,%g,%g,%g}\n", MDpars[0].x,MDpars[0].y,MDpars[0].z,MDpars[0].w );
     err |= ocl.upload( ocl.ibuff_MDpars, MDpars );
     err |= ocl.upload( ocl.ibuff_TDrive, TDrive );
+    if(jeParams)err |= ocl.upload( ocl.ibuff_jeParams, jeParams );
     err |= ocl.upload( ocl.ibuff_cvf   , cvfs   );
     // //printf("MolWorld_sp3_multi::evalVFs() bGroupUpdate=%i \n", bGroupUpdate );
     // if(bGroupUpdate){
diff --git a/cpp/common_resources/cl/relax_multi.cl b/cpp/common_resources/cl/relax_multi.cl
@@ -915,7 +915,7 @@ __kernel void updateAtomsMMFFf4(
     __global float4*  sysbonds,      // 14 // // contains parameters of bonds (constrains) with neighbor systems   {Lmin,Lmax,Kpres,Ktens}
     __global float4*  averageForces, // 15 // contains average forces on atoms for Thermodynamic Integration
     __global float*   work,          // 16 // contains work recorded at each step for Jarzynski Equality
-    const int4    jeParams
+    __global int4*    jeParams       // 17 // parameters for Jarzynski Equality per system
 ){
     const int natoms=n.x;           // number of atoms
     const int nnode =n.y;           // number of node atoms
@@ -1004,45 +1004,59 @@ __kernel void updateAtomsMMFFf4(
         float4 cons = constr[ iaa ]; // constraints (x,y,z,K)
 
 
-        // if(iS==0 && iG==0)printf("GPU: iS=%i iG=%i cons.w=%g TDrive.z=%g \n", iS, iG, cons.w, TDrive.z );
-        if( work && (cons.w > 0.f) && (TDrive.z >= 0.f) ){
-             float4 consEnd = constrK[ iaa ];
-             int nLambda    = (int)consEnd.w;
-             float lambda   = TDrive.z/(float)(nLambda-1);
-             float k        = cons.w; // Stiffness stored in .w
-             
-             // Interpolate position
-             float3 p0 = cons.xyz;
-             float3 p1 = consEnd.xyz;
-             float3 target = p0 + (p1 - p0) * lambda;
-             
-             // Compute Force (Harmonic)
-             // Force on atom = k * (target - pe)
-             float3 fc = (target - pe.xyz) * (float3){k,k,k};
-             fe.xyz += fc;
-             
-             // Accumulate Work
-             // Work done ON system = integral of (dH/dLambda) dLambda
-             // H_spring = 0.5 * k * (x - x0(lambda))^2
-             // dH/dLambda = k * (x - x0) * (-dx0/dLambda)
-             //            = k * (x - x0) * -(p1 - p0)
-             //            = k * (x0 - x) * (p1 - p0)  = fc * (p1 - p0)
-             // So we accumulate dot(fc, dir).
-             
-             float3 dir = p1 - p0;
-             float work_term = dot(fc, dir);
-             work_term *= 1.0f/(float)(nLambda-1);
-             
-             // Record work at this step if buffer provided
-            {
-                volatile __global float* addr = &work[ nLambda * iS + (int)(TDrive.z) ];
-                float old_val, new_val;
-                do {
-                    old_val = *addr;
-                    new_val = old_val + work_term;
-                } while (atomic_cmpxchg((volatile __global int*)addr, as_int(old_val), as_int(new_val)) != as_int(old_val));
+        // if(iS==0 && iG==0)printf("GPU: iS=%i iG=%i jeParams(%i,%i,%i,%i) \n", iS, iG, jeParams[iS].x, jeParams[iS].y, jeParams[iS].z, jeParams[iS].w );
+        if( (cons.w > 0.f) && (jeParams[iS].x >= -1) ){
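+            // Jarzynski equality / thermodynamic integration restraint
+            // "constr".xyz holds the initial position and "constrK".xyz the final position of the restraint
+            // "cons.w" is used as the spring stiffness; jeParams[iS].x < 0 keeps the restraint at the initial position (lambda=0)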
+            
+            float4 consEnd = constrK[ iaa ];
+            int nLambda    = jeParams[iS].y;
+            float k = cons.w;
+            
+            float lambda;
+            if(jeParams[iS].x < 0){
+                lambda = 0.0f;
+            }else{
+                lambda = (float)jeParams[iS].x/(float)(nLambda-1);
+            }
+            
+            float3 p0 = cons.xyz;
+            float3 p1 = consEnd.xyz;
+            
+            float3 target = p0 + (p1 - p0) * lambda;
+            
+            // Compute Force (Harmonic)
+            // Force on atom = k * (target - pe)
+            float3 fc = (target - pe.xyz) * (float3){k,k,k};
+            fe.xyz += fc;
+            
+            // Accumulate Work
+            // Work done ON system = integral of (dH/dLambda) dLambda
+            // H_spring = 0.5 * k * (x - x0(lambda))^2
+            // dH/dLambda = k * (x - x0) * (-dx0/dLambda)
+            //            = k * (x - x0) * -(p1 - p0)
+            //            = k * (x0 - x) * (p1 - p0)  = fc * (p1 - p0)
+            // So we accumulate dot(fc, dir).
+            
+            float3 dir = p1 - p0;
+            float work_term = dot(fc, dir);
+            if( (jeParams[iS].w >= jeParams[iS].z - 1) && (jeParams[iS].x >= 0) ){
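+                // Record work for the current lambda index once the per-window step counter (jeParams.w) has reached jeParams.z-1; the work buffer is not null-checked here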
+                {
+                    volatile __global float* addr = &work[ nLambda * iS + jeParams[iS].x ];
+                    float old_val, new_val;
+                    do {
+                        old_val = *addr;
+                        new_val = old_val + work_term;
+                    } while (atomic_cmpxchg((volatile __global int*)addr, as_int(old_val), as_int(new_val)) != as_int(old_val));
+
+                }                    
+            }
+            else if(iG==0){
+                jeParams[iS].w += 1;
             }
-             cons.w = 0.0f; // Disable standard logic
+            cons.w = 0.0f; // Disable standard logic
         }
 
         if( cons.w>0.f && (cons.w<1e3f) ){            // if stiffness is positive, we have constraint
diff --git a/cpp/common_resources/xyz/DA.xyz b/cpp/common_resources/xyz/DA.xyz
@@ -0,0 +1,48 @@
+46
+*****
+C         -4.65120        3.04710       -3.84360
+C         -3.28410        3.28530       -3.99840
+N         -2.40600        2.76310       -3.10520
+C         -2.84070        2.01120       -2.06220
+H         -1.38350        2.94170       -3.22170    +0.5
+C         -4.20780        1.77020       -1.90350
+N         -5.10890        2.29170       -2.79860
+H         -2.13080        1.59950       -1.35570
+H         -4.51570        1.16740       -1.06160
+H         -5.34170        3.47030       -4.56440
+H         -2.92740        3.88370       -4.82730
+C         -6.57120        2.08830       -2.70790
+C         -7.03990        1.23320       -1.51740
+H         -6.91820        1.59760       -3.64470
+H         -7.06190        3.08440       -2.63310
+C         -8.56180        1.08550       -1.51490
+H         -6.72840        1.71970       -0.56730
+H         -6.58440        0.22110       -1.58710
+Si        -9.13340       -0.00000        0.00000
+H         -8.90030        0.59210       -2.45070
+H         -9.04310        2.08360       -1.43570
+H         -8.48770       -1.40530       -0.10220
+H        -10.67720       -0.13500       -0.01720
+H         -8.68590        0.68140        1.31820
+C          2.61800        2.00310       -0.26920
+C          4.54350        3.38240       -0.13910
+C          1.78880        3.12720       -0.28380
+C          3.74330        4.52820       -0.15140
+C          2.35740        4.39800       -0.22430
+H          4.20280        5.50830       -0.10450
+H          0.71370        3.00530       -0.34100
+N          3.98010        2.12990       -0.19780
+H          5.61230        3.52730       -0.08190
+H          2.15940        1.02180       -0.31600
+C          4.76620        0.87660       -0.18910
+C          6.29220        1.05990       -0.11040
+H          4.53420        0.30840       -1.11750
+H          4.44580        0.26500        0.68390
+H          6.64260        1.64330       -0.98950
+C          7.00740       -0.28990       -0.10880
+H          6.55470        1.59910        0.82570
+H          6.77500       -0.84990       -1.03970
+H          6.68820       -0.89380        0.76710
+Si         9.13340       -0.00000       -0.00000 
+O          1.6481         5.3886        -0.2359 
+E          0.6481         5.3886        -0.2359   -0.5
diff --git a/examples/tFreeEnergy_multi/constraints_DA.txt b/examples/tFreeEnergy_multi/constraints_DA.txt
@@ -1,13 +1,2 @@
-# Constraint positions for DA (dimer) thermodynamic integration
-#
-# Format: atom_index  initial_x  initial_y  initial_z  final_x  final_y  final_z
-#
-# CV: Distance between the two Si atoms (indices 18 and 43 in 0-indexed)
-# Si atoms from DA.mol2:
-#   Atom 19 (index 18): Si at (-12.0498, -6.8896, 1.7148)
-#   Atom 44 (index 43): Si at (3.1486, -10.9881, 10.9822)
-#
-# Initial distance ~18Å, pulling from 1Å to 20Å on x-axis
-
-18   0.5   0.0   0.0   10.0   0.0   0.0
-43  -0.5   0.0   0.0  -10.0   0.0   0.0
+18   5.5   0.0   0.0   30.0   0.0   0.0
+43  -5.5   0.0   0.0  -30.0   0.0   0.0
diff --git a/examples/tFreeEnergy_multi/run_DA.sh b/examples/tFreeEnergy_multi/run_DA.sh
@@ -23,7 +23,7 @@ echo "Step 2: Running Thermodynamic Integration for DA..."
 echo "----------------------------------------"
 python3 run_ES.py \
     --nSys 100 \
-    --xyz_name "../../cpp/common_resources/DA.mol2" \
+    --xyz_name "../../cpp/common_resources/xyz/DA.xyz" \
     --system_name "DA" \
     --nLambda 100 \
     --nMDsteps 2000000 \
diff --git a/examples/tFreeEnergy_multi/run_ES.sh b/examples/tFreeEnergy_multi/run_ES.sh
@@ -18,7 +18,7 @@ while [[ "$#" -gt 0 ]]; do
     shift
 done
 
-N=20
+N=30
 
 # Ensure we are in the script directory
 cd "$(dirname "$0")"
@@ -46,12 +46,12 @@ python3 run_ES.py \
     --nSys 100 \
     --xyz_name "../tMMFF/data/entropic_spring_$N.xyz" \
     --system_name "entropic_spring_$N" \
-    --nLambda 50000 \
-    --nMDsteps 1000000 \
-    --nEQsteps 5000 \
+    --nLambda 100000 \
+    --nMDsteps 100000 \
+    --nEQsteps 50000 \
     --Fconv 1e-6 \
     --constraints "constraints_ES.txt" \
-    --nPerVFs 10
+    --nPerVFs 1
 
 if [ $? -ne 0 ]; then
     echo "ERROR: Calculation failed!"
diff --git a/examples/tMolGUIapp_multi/run.sh b/examples/tMolGUIapp_multi/run.sh
@@ -211,6 +211,7 @@ touch minima.dat
 #./$name -m 2000    -x common_resources/xyz/xylitol_WO_gridFF                 -iParalel 3 -T 300 0.2   -gopt 1000,100000 0.25,1.0 -verb 0 -perframe 100 -grid_nPBC 2,2,0 # -nogridff
 
 
-./$name -m 50 -x common_resources/DA.mol2 -iParalel 3 -T 300 0.2 -gopt 1000,100000 0.25,1.0
-# ./$name -m 50 -x common_resources/entropic_spring_30.xyz -iParalel 3 -T 300 0.2 -gopt 1000,100000 0.25,1.0
+# ./$name -m 50 -x common_resources/DA.mol2 -iParalel 3 -T 300 0.2 -gopt 1000,100000 0.25,1.0
+# ./$name -m 50 -x common_resources/xyz/DA.xyz -iParalel 3 -T 300 0.2 -gopt 1000,100000 0.25,1.0
+./$name -m 50 -x common_resources/entropic_spring_30.xyz -iParalel 3 -T 300 0.2 -gopt 1000,100000 0.25,1.0
 # ./$name -m 2 -x common_resources/xyz/nHexadecan.xyz -iParalel 3 -T 300 0.2 -gopt 1000,100000 0.25,1.0