LCOV - code coverage report
Current view: top level - src/grid/cpu - grid_cpu_integrate.c (source / functions) Hit Total Coverage
Test: CP2K Regtests (git:2fce0f8) Lines: 63 63 100.0 %
Date: 2024-12-21 06:28:57 Functions: 2 2 100.0 %

          Line data    Source code
       1             : /*----------------------------------------------------------------------------*/
       2             : /*  CP2K: A general program to perform molecular dynamics simulations         */
       3             : /*  Copyright 2000-2024 CP2K developers group <https://cp2k.org>              */
       4             : /*                                                                            */
       5             : /*  SPDX-License-Identifier: BSD-3-Clause                                     */
       6             : /*----------------------------------------------------------------------------*/
       7             : 
       8             : #include <assert.h>
       9             : #include <limits.h>
      10             : #include <math.h>
      11             : #include <stdio.h>
      12             : #include <stdlib.h>
      13             : #include <string.h>
      14             : 
      15             : #define GRID_DO_COLLOCATE 0
      16             : #include "../common/grid_common.h"
      17             : #include "grid_cpu_collint.h"
      18             : #include "grid_cpu_integrate.h"
      19             : 
      20             : /*******************************************************************************
      21             :  * \brief Cab matrix container to be passed through get_force/virial to cab_get.
      22             :  * \author Ole Schuett
      23             :  ******************************************************************************/
      24             : typedef struct {
      25             :   const double *data;
      26             :   const int m1;
      27             : } cab_store;
      28             : 
      29             : /*******************************************************************************
      30             :  * \brief Returns matrix element cab[idx(b)][idx(a)].
      31             :  * \author Ole Schuett
      32             :  ******************************************************************************/
      33  5167456236 : static inline double cab_get(const cab_store *cab, const orbital a,
      34             :                              const orbital b) {
      35  5167456236 :   return cab->data[idx(b) * cab->m1 + idx(a)];
      36             : }
      37             : 
      38             : #include "../common/grid_process_vab.h"
      39             : 
      40             : /*******************************************************************************
      41             :  * \brief Integrates a single task. See grid_cpu_integrate.h for details.
      42             :  * \author Ole Schuett
      43             :  ******************************************************************************/
      44    87562462 : void grid_cpu_integrate_pgf_product(
      45             :     const bool orthorhombic, const bool compute_tau, const int border_mask,
      46             :     const int la_max, const int la_min, const int lb_max, const int lb_min,
      47             :     const double zeta, const double zetb, const double dh[3][3],
      48             :     const double dh_inv[3][3], const double ra[3], const double rab[3],
      49             :     const int npts_global[3], const int npts_local[3], const int shift_local[3],
      50             :     const int border_width[3], const double radius, const int o1, const int o2,
      51    87562462 :     const int n1, const int n2, const double *grid, double hab[n2][n1],
      52             :     const double pab[n2][n1], double forces[2][3], double virials[2][3][3],
      53             :     double hdab[n2][n1][3], double hadb[n2][n1][3],
      54    87562462 :     double a_hdab[n2][n1][3][3]) {
      55             : 
      56    87562462 :   const bool calculate_forces = (forces != NULL || hdab != NULL);
      57    87562462 :   const bool calculate_virial = (virials != NULL || a_hdab != NULL);
      58    87562462 :   assert(!calculate_virial || calculate_forces);
      59    87562462 :   const process_ldiffs ldiffs =
      60    87562462 :       process_get_ldiffs(calculate_forces, calculate_virial, compute_tau);
      61    87562462 :   int la_max_local = la_max + ldiffs.la_max_diff;
      62    87562462 :   int lb_max_local = lb_max + ldiffs.lb_max_diff;
      63    87562462 :   int la_min_local = imax(0, la_min + ldiffs.la_min_diff);
      64    87562462 :   int lb_min_local = imax(0, lb_min + ldiffs.lb_min_diff);
      65             : 
      66    87562462 :   const int m1 = ncoset(la_max_local);
      67    87562462 :   const int m2 = ncoset(lb_max_local);
      68    87562462 :   double cab[m2 * m1];
      69    87562462 :   memset(cab, 0, m2 * m1 * sizeof(double));
      70             : 
      71    87562462 :   const cab_store cab_obj = {.data = cab, .m1 = m1};
      72             : 
      73    87562462 :   const double rscale = 1.0; // TODO: remove rscale from cab_to_grid
      74    87562462 :   cab_to_grid(orthorhombic, border_mask, la_max_local, la_min_local,
      75             :               lb_max_local, lb_min_local, zeta, zetb, rscale, dh, dh_inv, ra,
      76             :               rab, npts_global, npts_local, shift_local, border_width, radius,
      77             :               cab, grid);
      78             : 
      79             :   //  cab contains all the information needed to find the elements of hab
      80             :   //  and optionally of derivatives of these elements
      81   210157596 :   for (int la = la_min; la <= la_max; la++) {
      82   301932155 :     for (int ax = 0; ax <= la; ax++) {
      83   424126643 :       for (int ay = 0; ay <= la - ax; ay++) {
      84   244789622 :         const int az = la - ax - ay;
      85   244789622 :         const orbital a = {{ax, ay, az}};
      86   645688761 :         for (int lb = lb_min; lb <= lb_max; lb++) {
      87  1037806048 :           for (int bx = 0; bx <= lb; bx++) {
      88  1560171623 :             for (int by = 0; by <= lb - bx; by++) {
      89   923264714 :               const int bz = lb - bx - by;
      90   923264714 :               const orbital b = {{bx, by, bz}};
      91             : 
      92             :               // Update hab block.
      93   923264714 :               hab[o2 + idx(b)][o1 + idx(a)] +=
      94   923264714 :                   get_hab(a, b, zeta, zetb, &cab_obj, compute_tau);
      95             : 
      96             :               // Update forces.
      97   923264714 :               if (forces != NULL) {
      98   140312426 :                 const double pabval = pab[o2 + idx(b)][o1 + idx(a)];
      99   561249704 :                 for (int i = 0; i < 3; i++) {
     100   420937278 :                   forces[0][i] += pabval * get_force_a(a, b, i, zeta, zetb,
     101             :                                                        &cab_obj, compute_tau);
     102   420937278 :                   forces[1][i] += pabval * get_force_b(a, b, i, zeta, zetb, rab,
     103             :                                                        &cab_obj, compute_tau);
     104             :                 }
     105             :               }
     106             : 
     107             :               // Update virials.
     108   923264714 :               if (virials != NULL) {
     109    22034459 :                 const double pabval = pab[o2 + idx(b)][o1 + idx(a)];
     110    88137836 :                 for (int i = 0; i < 3; i++) {
     111   264413508 :                   for (int j = 0; j < 3; j++) {
     112   198310131 :                     virials[0][i][j] +=
     113   198310131 :                         pabval * get_virial_a(a, b, i, j, zeta, zetb, &cab_obj,
     114             :                                               compute_tau);
     115   198310131 :                     virials[1][i][j] +=
     116   198310131 :                         pabval * get_virial_b(a, b, i, j, zeta, zetb, rab,
     117             :                                               &cab_obj, compute_tau);
     118             :                   }
     119             :                 }
     120             :               }
     121             : 
     122             :               // Update hdab, hadb, and a_hdab (not used in batch mode).
     123   923264714 :               if (hdab != NULL) {
     124       16590 :                 assert(!compute_tau);
     125       66360 :                 for (int i = 0; i < 3; i++) {
     126       49770 :                   hdab[o2 + idx(b)][o1 + idx(a)][i] +=
     127       49770 :                       get_force_a(a, b, i, zeta, zetb, &cab_obj, false);
     128             :                 }
     129             :               }
     130   923264714 :               if (hadb != NULL) {
     131        7902 :                 assert(!compute_tau);
     132       31608 :                 for (int i = 0; i < 3; i++) {
     133       23706 :                   hadb[o2 + idx(b)][o1 + idx(a)][i] +=
     134       23706 :                       get_force_b(a, b, i, zeta, zetb, rab, &cab_obj, false);
     135             :                 }
     136             :               }
     137   923264714 :               if (a_hdab != NULL) {
     138         360 :                 assert(!compute_tau);
     139        1440 :                 for (int i = 0; i < 3; i++) {
     140        4320 :                   for (int j = 0; j < 3; j++) {
     141        3240 :                     a_hdab[o2 + idx(b)][o1 + idx(a)][i][j] +=
     142        3240 :                         get_virial_a(a, b, i, j, zeta, zetb, &cab_obj, false);
     143             :                   }
     144             :                 }
     145             :               }
     146             :             }
     147             :           }
     148             :         }
     149             :       }
     150             :     }
     151             :   }
     152    87562462 : }
     153             : 
     154             : // EOF

Generated by: LCOV version 1.15