doxygen_doc/html/VectorizedCellProcessor_8h_source.html

#ifndef VECTORIZEDCELLPROCESSOR_H_

#define VECTORIZEDCELLPROCESSOR_H_


#include "CellProcessor.h"

#include "utils/AlignedArray.h"

#include <iostream>

#include <vector>

#include <cmath>

#include "vectorization/SIMD_TYPES.h"

#include "vectorization/SIMD_VectorizedCellProcessorHelpers.h"

#include "WrapOpenMP.h"


#include "molecules/MoleculeForwardDeclaration.h"

// Forward declarations. Within this header these types are only named:
// Component appears in the ComponentList typedef, Domain and CellDataSoA are
// used by reference, and Comp2Param is not referenced by the class below.
class Component;

class Domain;

class Comp2Param;

class CellDataSoA;


/**
 * @brief Vectorized calculation of the force.
 *
 * CellProcessor implementation whose pair kernels operate on SIMD vector types
 * (RealCalcVec / RealAccumVec / MaskCalcVec). Only declarations live in this
 * header; the out-of-line members are defined elsewhere.
 */
class VectorizedCellProcessor : public CellProcessor {
    friend class VCP1CLJRMMTest;

public:
    using ComponentList = std::vector<Component>;

    /** Copy assignment is disabled. */
    // NOTE(review): the copy constructor is not deleted although _threadData
    // holds raw pointers; confirm ownership in the destructor and consider
    // deleting the copy constructor as well.
    VectorizedCellProcessor& operator=(const VectorizedCellProcessor&) = delete;

    /**
     * @brief Construct and set up the internal parameter table.
     * @param domain         Domain this processor is bound to (stored by reference).
     * @param cutoffRadius   cutoff radius (presumably for the non-LJ interactions; confirm).
     * @param LJcutoffRadius cutoff radius for the Lennard-Jones interaction.
     */
    VectorizedCellProcessor(Domain & domain, double cutoffRadius, double LJcutoffRadius);

    /** @brief Destructor (defined out of line). */
    ~VectorizedCellProcessor();

    /** @brief Reset macroscopic values to 0.0. */
    void initTraversal();

    /** @brief Intentionally empty: nothing is done per cell before processing. */
    void preprocessCell(ParticleCell& /*cell*/) {}

    /**
     * @brief Single-molecule interaction is not computed by this processor.
     * @return always 0.0.
     */
    double processSingleMolecule(Molecule* /*m1*/, ParticleCell& /*cell2*/) {
        return 0.0;
    }

    /** @brief Calculate forces between pairs of Molecules in cell. */
    void processCell(ParticleCell& cell);

    /**
     * @brief Process the interactions between two cells.
     * @param cell1  first cell of the pair.
     * @param cell2  second cell of the pair.
     * @param sumAll defaults to false; semantics are defined by the out-of-line
     *               implementation (not visible here).
     */
    void processCellPair(ParticleCell& cell1, ParticleCell& cell2, bool sumAll = false);

    /** @brief Intentionally empty: nothing is done per cell after processing. */
    void postprocessCell(ParticleCell& /*cell*/) {}

    /** @brief Store macroscopic values in the Domain. */
    void endTraversal();

private:
    using MoleculeList = std::vector<Molecule *>;

    /** Domain passed to the constructor. */
    Domain & _domain;

    //const double _cutoffRadiusSquare;

    //const double _LJcutoffRadiusSquare;

    /** Constant passed to the dipole kernel as epsRFInvrc3 (presumably a
     *  reaction-field prefactor; confirm against the constructor). */
    const double _epsRFInvrc3;

    /** Per-component parameter tables (presumably LJ epsilon/sigma pairs; confirm). */
    std::vector<AlignedArray<vcp_real_calc> > _eps_sig;

    /** Per-component parameter tables (presumably LJ potential shifts; confirm). */
    std::vector<AlignedArray<vcp_real_calc> > _shift6;

    // Scalar accumulators; judging by the kernel parameter names these collect
    // the LJ potential, the multipole potential, the virial and the
    // reaction-field contribution (confirm against the implementation).
    double _upot6lj;

    double _upotXpoles;

    double _virial;

    double _myRF;

    /**
     * Scratch data kept once per entry of _threadData: distance lookup
     * storage plus vector-wide accumulators.
     */
    struct VLJCPThreadData {
        /**
         * Null the four lookup pointers, size every accumulator array to
         * _numVectorElements and set each of its entries to 0.0.
         */
        VLJCPThreadData(): _ljc_dist_lookup(nullptr), _charges_dist_lookup(nullptr), _dipoles_dist_lookup(nullptr), _quadrupoles_dist_lookup(nullptr){
            _upot6ljV.resize(_numVectorElements);
            _upotXpolesV.resize(_numVectorElements);
            _virialV.resize(_numVectorElements);
            _myRFV.resize(_numVectorElements);

            for (size_t j = 0; j < _numVectorElements; ++j) {
                _upot6ljV[j] = 0.0;
                _upotXpolesV[j] = 0.0;
                _virialV[j] = 0.0;
                _myRFV[j] = 0.0;
            }
        }

        /** Lookup/mask storage for the centers. */
        AlignedArray<vcp_lookupOrMask_single> _centers_dist_lookup;

        // Lookup pointers, one per site type; all start out as nullptr.
        // NOTE(review): presumably these point into _centers_dist_lookup; confirm.
        vcp_lookupOrMask_single* _ljc_dist_lookup;

        vcp_lookupOrMask_single* _charges_dist_lookup;

        vcp_lookupOrMask_single* _dipoles_dist_lookup;

        vcp_lookupOrMask_single* _quadrupoles_dist_lookup;

        /** Vector-wide accumulators, each holding _numVectorElements zero-initialised entries. */
        AlignedArray<vcp_real_accum> _upot6ljV, _upotXpolesV, _virialV, _myRFV;
    };

    /** One VLJCPThreadData pointer per entry (presumably one per thread; confirm). */
    std::vector<VLJCPThreadData *> _threadData;

    /** Number of elements in one vector, taken from VCP_VEC_SIZE. */
    static const size_t _numVectorElements = VCP_VEC_SIZE;

    size_t _numThreads;

    // ---------------------------------------------------------------------
    // Interaction kernels (declarations only; defined elsewhere).
    // Common parameter pattern, as far as the names indicate (confirm against
    // the definitions): m*_r_* are molecule positions, r*_* are site
    // positions, e*_* are orientation vectors, f_* receive the force, V_* the
    // virial contribution, M*_* the torque, sum_* are running accumulators
    // and forceMask selects the active vector lanes. The template flag
    // calculateMacroscopic presumably toggles accumulation into sum_*.
    // ---------------------------------------------------------------------

    /** Kernel for the Lennard-Jones interaction between two LJ sites. */
    template<bool calculateMacroscopic>
    inline void _loopBodyLJ(
            const RealCalcVec& m1_r_x, const RealCalcVec& m1_r_y, const RealCalcVec& m1_r_z,
            const RealCalcVec& r1_x, const RealCalcVec& r1_y, const RealCalcVec& r1_z,
            const RealCalcVec& m2_r_x, const RealCalcVec& m2_r_y, const RealCalcVec& m2_r_z,
            const RealCalcVec& r2_x, const RealCalcVec& r2_y, const RealCalcVec& r2_z,
            RealCalcVec& f_x, RealCalcVec& f_y, RealCalcVec& f_z,
            RealAccumVec& V_x, RealAccumVec& V_y, RealAccumVec& V_z,
            RealAccumVec& sum_upot6lj, RealAccumVec& sum_virial,
            const MaskCalcVec& forceMask,
            const RealCalcVec& eps_24, const RealCalcVec& sig2,
            const RealCalcVec& shift6);

    /** Kernel for the charge-charge interaction (qii, qjj). */
    template<bool calculateMacroscopic>
    inline void _loopBodyCharge(
        const RealCalcVec& m1_r_x, const RealCalcVec& m1_r_y, const RealCalcVec& m1_r_z,
        const RealCalcVec& r1_x, const RealCalcVec& r1_y, const RealCalcVec& r1_z,
        const RealCalcVec& qii,
        const RealCalcVec& m2_r_x, const RealCalcVec& m2_r_y, const RealCalcVec& m2_r_z,
        const RealCalcVec& r2_x, const RealCalcVec& r2_y, const RealCalcVec& r2_z,
        const RealCalcVec& qjj,
        RealCalcVec& f_x, RealCalcVec& f_y, RealCalcVec& f_z,
        RealAccumVec& V_x, RealAccumVec& V_y, RealAccumVec& V_z,
        RealAccumVec& sum_upotXpoles, RealAccumVec& sum_virial,
        const MaskCalcVec& forceMask);

    /** Kernel for the charge-dipole interaction (charge q, dipole e/p). */
    template<bool calculateMacroscopic>
    inline void _loopBodyChargeDipole(
        const RealCalcVec& m1_r_x, const RealCalcVec& m1_r_y, const RealCalcVec& m1_r_z,
        const RealCalcVec& r1_x, const RealCalcVec& r1_y, const RealCalcVec& r1_z,
        const RealCalcVec& q,
        const RealCalcVec& m2_r_x, const RealCalcVec& m2_r_y, const RealCalcVec& m2_r_z,
        const RealCalcVec& r2_x, const RealCalcVec& r2_y, const RealCalcVec& r2_z,
        const RealCalcVec& e_x, const RealCalcVec& e_y, const RealCalcVec& e_z,
        const RealCalcVec& p,
        RealCalcVec& f_x, RealCalcVec& f_y, RealCalcVec& f_z,
        RealAccumVec& V_x, RealAccumVec& V_y, RealAccumVec& V_z,
        RealAccumVec& M_x, RealAccumVec& M_y, RealAccumVec& M_z,
        RealAccumVec& sum_upotXpoles, RealAccumVec& sum_virial,
        const MaskCalcVec& forceMask);

    /** Kernel for the dipole-dipole interaction; additionally accumulates sum_myRF. */
    template<bool calculateMacroscopic>
    inline void _loopBodyDipole(
        const RealCalcVec& m1_r_x, const RealCalcVec& m1_r_y, const RealCalcVec& m1_r_z,
        const RealCalcVec& r1_x, const RealCalcVec& r1_y, const RealCalcVec& r1_z,
        const RealCalcVec& eii_x, const RealCalcVec& eii_y, const RealCalcVec& eii_z,
        const RealCalcVec& pii,
        const RealCalcVec& m2_r_x, const RealCalcVec& m2_r_y, const RealCalcVec& m2_r_z,
        const RealCalcVec& r2_x, const RealCalcVec& r2_y, const RealCalcVec& r2_z,
        const RealCalcVec& ejj_x, const RealCalcVec& ejj_y, const RealCalcVec& ejj_z,
        const RealCalcVec& pjj,
        RealCalcVec& f_x, RealCalcVec& f_y, RealCalcVec& f_z,
        RealAccumVec& V_x, RealAccumVec& V_y, RealAccumVec& V_z,
        RealAccumVec& M1_x, RealAccumVec& M1_y, RealAccumVec& M1_z,
        RealAccumVec& M2_x, RealAccumVec& M2_y, RealAccumVec& M2_z,
        RealAccumVec& sum_upotXpoles, RealAccumVec& sum_virial, RealAccumVec& sum_myRF,
        const MaskCalcVec& forceMask,
        const RealCalcVec& epsRFInvrc3);

    /** Kernel for the charge-quadrupole interaction (charge q, quadrupole ejj/m). */
    template<bool calculateMacroscopic>
    inline void _loopBodyChargeQuadrupole(
        const RealCalcVec& m1_r_x, const RealCalcVec& m1_r_y, const RealCalcVec& m1_r_z,
        const RealCalcVec& r1_x, const RealCalcVec& r1_y, const RealCalcVec& r1_z,
        const RealCalcVec& q,
        const RealCalcVec& m2_r_x, const RealCalcVec& m2_r_y, const RealCalcVec& m2_r_z,
        const RealCalcVec& r2_x, const RealCalcVec& r2_y, const RealCalcVec& r2_z,
        const RealCalcVec& ejj_x, const RealCalcVec& ejj_y, const RealCalcVec& ejj_z,
        const RealCalcVec& m,
        RealCalcVec& f_x, RealCalcVec& f_y, RealCalcVec& f_z,
        RealAccumVec& V_x, RealAccumVec& V_y, RealAccumVec& V_z,
        RealAccumVec& M_x, RealAccumVec& M_y, RealAccumVec& M_z,
        RealAccumVec& sum_upotXpoles, RealAccumVec& sum_virial,
        const MaskCalcVec& forceMask);

    /** Kernel for the dipole-quadrupole interaction (dipole eii/p, quadrupole ejj/m). */
    template<bool calculateMacroscopic>
    inline void _loopBodyDipoleQuadrupole(
        const RealCalcVec& m1_r_x, const RealCalcVec& m1_r_y, const RealCalcVec& m1_r_z,
        const RealCalcVec& r1_x, const RealCalcVec& r1_y, const RealCalcVec& r1_z,
        const RealCalcVec& eii_x, const RealCalcVec& eii_y, const RealCalcVec& eii_z,
        const RealCalcVec& p,
        const RealCalcVec& m2_r_x, const RealCalcVec& m2_r_y, const RealCalcVec& m2_r_z,
        const RealCalcVec& r2_x, const RealCalcVec& r2_y, const RealCalcVec& r2_z,
        const RealCalcVec& ejj_x, const RealCalcVec& ejj_y, const RealCalcVec& ejj_z,
        const RealCalcVec& m,
        RealCalcVec& f_x, RealCalcVec& f_y, RealCalcVec& f_z,
        RealAccumVec& V_x, RealAccumVec& V_y, RealAccumVec& V_z,
        RealAccumVec& M1_x, RealAccumVec& M1_y, RealAccumVec& M1_z,
        RealAccumVec& M2_x, RealAccumVec& M2_y, RealAccumVec& M2_z,
        RealAccumVec& sum_upotXpoles, RealAccumVec& sum_virial,
        const MaskCalcVec& forceMask);

    /** Kernel for the quadrupole-quadrupole interaction (eii/mii, ejj/mjj). */
    template<bool calculateMacroscopic>
    inline void _loopBodyQuadrupole(
        const RealCalcVec& m1_r_x, const RealCalcVec& m1_r_y, const RealCalcVec& m1_r_z,
        const RealCalcVec& r1_x, const RealCalcVec& r1_y, const RealCalcVec& r1_z,
        const RealCalcVec& eii_x, const RealCalcVec& eii_y, const RealCalcVec& eii_z,
        const RealCalcVec& mii,
        const RealCalcVec& m2_r_x, const RealCalcVec& m2_r_y, const RealCalcVec& m2_r_z,
        const RealCalcVec& r2_x, const RealCalcVec& r2_y, const RealCalcVec& r2_z,
        const RealCalcVec& ejj_x, const RealCalcVec& ejj_y, const RealCalcVec& ejj_z,
        const RealCalcVec& mjj,
        RealCalcVec& f_x, RealCalcVec& f_y, RealCalcVec& f_z,
        RealAccumVec& V_x, RealAccumVec& V_y, RealAccumVec& V_z,
        RealAccumVec& Mii_x, RealAccumVec& Mii_y, RealAccumVec& Mii_z,
        RealAccumVec& Mjj_x, RealAccumVec& Mjj_y, RealAccumVec& Mjj_z,
        RealAccumVec& sum_upotXpoles, RealAccumVec& sum_virial,
        const MaskCalcVec& forceMask);

    /**
     * Pair driver over two structure-of-arrays cell representations.
     * ForcePolicy, CalculateMacroscopic and MaskGatherChooser are compile-time
     * policies whose meaning is fixed by the out-of-line definition.
     */
    template<class ForcePolicy, bool CalculateMacroscopic, class MaskGatherChooser>
    void _calculatePairs(CellDataSoA & soa1, CellDataSoA & soa2);

}; /* end of class VectorizedCellProcessor */


#endif /* VECTORIZEDCELLPROCESSOR_H_ */

AlignedArray.h
AlignedArray.h.

SIMD_TYPES.h
Defines the length of the vectors and the corresponding functions.

AlignedArray
An aligned array.
Definition: AlignedArray.h:75

CellDataSoA
Structure of Arrays for vectorized force calculation.
Definition: CellDataSoA.h:22

CellProcessor
Definition: CellProcessor.h:29

Comp2Param
Definition: Comp2Param.h:15

Component
Class implementing molecules as rigid rotators consisting of different interaction sites (LJcente...
Definition: Component.h:14

Domain
This class is used to read in the phasespace and to handle macroscopic values.
Definition: Domain.h:47

FullMolecule
FullMolecule modeled as LJ sphere with point polarities.
Definition: FullMolecule.h:18

FullParticleCell
FullParticleCell data structure. Renamed from ParticleCell.
Definition: FullParticleCell.h:49

VectorizedCellProcessor
Vectorized calculation of the force.
Definition: VectorizedCellProcessor.h:29

VectorizedCellProcessor::preprocessCell
void preprocessCell(ParticleCell &)
Load the CellDataSoA for cell.
Definition: VectorizedCellProcessor.h:51

VectorizedCellProcessor::postprocessCell
void postprocessCell(ParticleCell &)
Free the LennardJonesSoA for cell.
Definition: VectorizedCellProcessor.h:67

VectorizedCellProcessor::processCellPair
void processCellPair(ParticleCell &cell1, ParticleCell &cell2, bool sumAll=false)
Definition: VectorizedCellProcessor.cpp:2746

VectorizedCellProcessor::endTraversal
void endTraversal()
Store macroscopic values in the Domain.
Definition: VectorizedCellProcessor.cpp:124

VectorizedCellProcessor::processCell
void processCell(ParticleCell &cell)
Calculate forces between pairs of Molecules in cell.
Definition: VectorizedCellProcessor.cpp:2734

VectorizedCellProcessor::initTraversal
void initTraversal()
Reset macroscopic values to 0.0.
Definition: VectorizedCellProcessor.cpp:111

VectorizedCellProcessor::VectorizedCellProcessor
VectorizedCellProcessor(Domain &domain, double cutoffRadius, double LJcutoffRadius)
Construct and set up the internal parameter table.
Definition: VectorizedCellProcessor.cpp:21

vcp::MaskVec
Definition: MaskVec.h:16

vcp::RealVec
Definition: RealVec.h:22