simple.C
/*---------------------------------------------------------------------------*\
  =========                 |
  \\      /  F ield         | OpenFOAM: The Open Source CFD Toolbox
   \\    /   O peration     | Website:  https://openfoam.org
    \\  /    A nd           | Copyright (C) 2011-2024 OpenFOAM Foundation
     \\/     M anipulation  |
-------------------------------------------------------------------------------
License
    This file is part of OpenFOAM.

    OpenFOAM is free software: you can redistribute it and/or modify it
    under the terms of the GNU General Public License as published by
    the Free Software Foundation, either version 3 of the License, or
    (at your option) any later version.

    OpenFOAM is distributed in the hope that it will be useful, but WITHOUT
    ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
    FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
    for more details.

    You should have received a copy of the GNU General Public License
    along with OpenFOAM.  If not, see <http://www.gnu.org/licenses/>.

\*---------------------------------------------------------------------------*/

#include "simple.H"
#include "addToRunTimeSelectionTable.H"
#include "SortableList.H"
#include "globalIndex.H"
#include "SubField.H"

// * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * //

namespace Foam
{
namespace decompositionMethods
{
    defineTypeNameAndDebug(simple, 0);

    addToRunTimeSelectionTable
    (
        decompositionMethod,
        simple,
        decomposer
    );

    addToRunTimeSelectionTable
    (
        decompositionMethod,
        simple,
        distributor
    );
}
}


// * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * //

// assignToProcessorGroup : given nCells cells and nProcGroup processor
// groups to share them, how do we share them out?  Answer: each group
// gets nCells/nProcGroup cells, and the first few get one
// extra to make up the numbers.  This should produce almost
// perfect load balancing.
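//
// Worked example (for illustration): with nCells = 10 and nProcGroup = 3,
// jump = 10/3 = 3 and fstProcessorGroup = 10 - 3*3 = 1, so group 0
// receives jump + 1 = 4 cells and groups 1 and 2 receive 3 cells each.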

void Foam::decompositionMethods::simple::assignToProcessorGroup
(
    labelList& processorGroup,
    const label nProcGroup
) const
{
    label jump = processorGroup.size()/nProcGroup;
    label jumpb = jump + 1;
    label fstProcessorGroup = processorGroup.size() - jump*nProcGroup;

    label ind = 0;
    label j = 0;

    // assign cells to the first few processor groups (those with
    // one extra cell each)
    for (j=0; j<fstProcessorGroup; j++)
    {
        for (label k=0; k<jumpb; k++)
        {
            processorGroup[ind++] = j;
        }
    }

    // and now to the `normal' processor groups
    for (; j<nProcGroup; j++)
    {
        for (label k=0; k<jump; k++)
        {
            processorGroup[ind++] = j;
        }
    }
}


void Foam::decompositionMethods::simple::assignToProcessorGroup
(
    labelList& processorGroup,
    const label nProcGroup,
    const labelList& indices,
    const scalarField& weights,
    const scalar summedWeights
) const
{
    // This routine receives the points pre-sorted along one direction,
    // via the indices list.
    // Easiest to explain with an example.
    // E.g. 400 points, sum of weights : 513.
    // With the number of divisions in this direction (nProcGroup) : 4,
    // the split comes at 513/4 ~ 128.
    // So summed weight from 0..128 goes into bin 0,
    // summed weight from 128..256 goes into bin 1,
    // etc.
    // Finally any remaining points go into the last bin (3).

    const scalar jump = summedWeights/nProcGroup;
    const label nProcGroupM1 = nProcGroup - 1;
    scalar sumWeights = 0;
    label ind = 0;
    label j = 0;

    // assign cells to all except last group.
    for (j=0; j<nProcGroupM1; j++)
    {
        const scalar limit = jump*scalar(j + 1);
        while (sumWeights < limit)
        {
            sumWeights += weights[indices[ind]];
            processorGroup[ind++] = j;
        }
    }

    // Assign whatever remains to the last group; this also guards
    // against round-off in the accumulated weights.
    while (ind < processorGroup.size())
    {
        processorGroup[ind++] = nProcGroupM1;
    }
}


Foam::labelList Foam::decompositionMethods::simple::decomposeOneProc
(
    const pointField& points
) const
{
    // construct a list for the final result
    labelList finalDecomp(points.size());

    // and one to take the processor group ids
    labelList processorGroups(points.size());

    labelList pointIndices(points.size());
    forAll(pointIndices, i)
    {
        pointIndices[i] = i;
    }

    const pointField rotatedPoints(rotDelta_ & points);

    // For each direction we assign the points to groups of processors
    // labelled 0..nX-1 to give a banded structure on the mesh.  Then we
    // construct the actual processor number by treating this as
    // the units part of the processor number.
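    //
    // E.g. with n_ = (nx ny nz), a point in x-band gx, y-band gy and
    // z-band gz ends up on processor gx + nx*gy + nx*ny*gz, which is
    // exactly how the three accumulation loops below build it.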
    sort
    (
        pointIndices,
        UList<scalar>::less(rotatedPoints.component(vector::X))
    );

    assignToProcessorGroup(processorGroups, n_.x());

    forAll(points, i)
    {
        finalDecomp[pointIndices[i]] = processorGroups[i];
    }


    // now do the same thing in the Y direction. These processor group
    // numbers add multiples of nX to the proc. number (columns)
    sort
    (
        pointIndices,
        UList<scalar>::less(rotatedPoints.component(vector::Y))
    );

    assignToProcessorGroup(processorGroups, n_.y());

    forAll(points, i)
    {
        finalDecomp[pointIndices[i]] += n_.x()*processorGroups[i];
    }


    // finally in the Z direction. Now we add multiples of nX*nY to give
    // layers
    sort
    (
        pointIndices,
        UList<scalar>::less(rotatedPoints.component(vector::Z))
    );

    assignToProcessorGroup(processorGroups, n_.z());

    forAll(points, i)
    {
        finalDecomp[pointIndices[i]] += n_.x()*n_.y()*processorGroups[i];
    }

    return finalDecomp;
}
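
// The processor indices built above span 0 .. n_.x()*n_.y()*n_.z() - 1,
// so the product of the three subdivisions must match the number of
// processors requested.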


Foam::labelList Foam::decompositionMethods::simple::decomposeOneProc
(
    const pointField& points,
    const scalarField& weights
) const
{
    // construct a list for the final result
    labelList finalDecomp(points.size());

    // and one to take the processor group ids
    labelList processorGroups(points.size());

    labelList pointIndices(points.size());
    forAll(pointIndices, i)
    {
        pointIndices[i] = i;
    }

    const pointField rotatedPoints(rotDelta_ & points);

    // For each direction we assign the points to groups of processors
    // labelled 0..nX-1 to give a banded structure on the mesh.  Then we
    // construct the actual processor number by treating this as
    // the units part of the processor number.
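    //
    // Unlike the unweighted overload above, the split positions here
    // are chosen on cumulative point weight rather than point count.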
    sort
    (
        pointIndices,
        UList<scalar>::less(rotatedPoints.component(vector::X))
    );

    const scalar summedWeights = sum(weights);
    assignToProcessorGroup
    (
        processorGroups,
        n_.x(),
        pointIndices,
        weights,
        summedWeights
    );

    forAll(points, i)
    {
        finalDecomp[pointIndices[i]] = processorGroups[i];
    }


    // now do the same thing in the Y direction. These processor group
    // numbers add multiples of nX to the proc. number (columns)
    sort
    (
        pointIndices,
        UList<scalar>::less(rotatedPoints.component(vector::Y))
    );

    assignToProcessorGroup
    (
        processorGroups,
        n_.y(),
        pointIndices,
        weights,
        summedWeights
    );

    forAll(points, i)
    {
        finalDecomp[pointIndices[i]] += n_.x()*processorGroups[i];
    }


    // finally in the Z direction. Now we add multiples of nX*nY to give
    // layers
    sort
    (
        pointIndices,
        UList<scalar>::less(rotatedPoints.component(vector::Z))
    );

    assignToProcessorGroup
    (
        processorGroups,
        n_.z(),
        pointIndices,
        weights,
        summedWeights
    );

    forAll(points, i)
    {
        finalDecomp[pointIndices[i]] += n_.x()*n_.y()*processorGroups[i];
    }

    return finalDecomp;
}


// * * * * * * * * * * * * * * * * Constructors  * * * * * * * * * * * * * * //

Foam::decompositionMethods::simple::simple
(
    const dictionary& decompositionDict,
    const dictionary& methodDict
)
:
    geometric(decompositionDict, methodDict)
{}


// * * * * * * * * * * * * * * * Member Functions  * * * * * * * * * * * * * //

Foam::labelList Foam::decompositionMethods::simple::decompose
(
    const pointField& points
)
{
    if (!Pstream::parRun())
    {
        return decomposeOneProc(points);
    }
    else
    {
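        // In parallel the points are gathered onto the master,
        // decomposed there in a single pass, and the resulting
        // per-point processor labels are scattered back.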
        globalIndex globalNumbers(points.size());

        // Collect all points on master
        if (Pstream::master())
        {
            pointField allPoints(globalNumbers.size());

            label nTotalPoints = 0;
            // Master first
            SubField<point>(allPoints, points.size()) = points;
            nTotalPoints += points.size();

            // Add slaves
            for (int slave=1; slave<Pstream::nProcs(); slave++)
            {
                IPstream fromSlave(Pstream::commsTypes::scheduled, slave);
                pointField nbrPoints(fromSlave);
                SubField<point>
                (
                    allPoints,
                    nbrPoints.size(),
                    nTotalPoints
                ) = nbrPoints;
                nTotalPoints += nbrPoints.size();
            }

            // Decompose
            labelList finalDecomp(decomposeOneProc(allPoints));

            // Send back
            for (int slave=1; slave<Pstream::nProcs(); slave++)
            {
                OPstream toSlave(Pstream::commsTypes::scheduled, slave);
                toSlave << SubField<label>
                (
                    finalDecomp,
                    globalNumbers.localSize(slave),
                    globalNumbers.offset(slave)
                );
            }

            // Get my own part (the master's points were copied in first,
            // so truncating keeps the master's own slice)
            finalDecomp.setSize(points.size());

            return finalDecomp;
        }
        else
        {
            // Send my points
            {
                OPstream toMaster
                (
                    Pstream::commsTypes::scheduled,
                    Pstream::masterNo()
                );
                toMaster << points;
            }

            // Receive back decomposition
            IPstream fromMaster
            (
                Pstream::commsTypes::scheduled,
                Pstream::masterNo()
            );
            labelList finalDecomp(fromMaster);

            return finalDecomp;
        }
    }
}


Foam::labelList Foam::decompositionMethods::simple::decompose
(
    const pointField& points,
    const scalarField& weights
)
{
    checkWeights(points, weights);

    if (!Pstream::parRun())
    {
        return decomposeOneProc(points, weights);
    }
    else
    {
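        // Same gather/decompose/scatter pattern as the unweighted
        // decompose above, with the point weights streamed alongside
        // the points.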
        globalIndex globalNumbers(points.size());

        // Collect all points on master
        if (Pstream::master())
        {
            pointField allPoints(globalNumbers.size());
            scalarField allWeights(allPoints.size());

            label nTotalPoints = 0;
            // Master first
            SubField<point>(allPoints, points.size()) = points;
            SubField<scalar>(allWeights, points.size()) = weights;
            nTotalPoints += points.size();

            // Add slaves
            for (int slave=1; slave<Pstream::nProcs(); slave++)
            {
                IPstream fromSlave(Pstream::commsTypes::scheduled, slave);
                pointField nbrPoints(fromSlave);
                scalarField nbrWeights(fromSlave);
                SubField<point>
                (
                    allPoints,
                    nbrPoints.size(),
                    nTotalPoints
                ) = nbrPoints;
                SubField<scalar>
                (
                    allWeights,
                    nbrWeights.size(),
                    nTotalPoints
                ) = nbrWeights;
                nTotalPoints += nbrPoints.size();
            }

            // Decompose
            labelList finalDecomp(decomposeOneProc(allPoints, allWeights));

            // Send back
            for (int slave=1; slave<Pstream::nProcs(); slave++)
            {
                OPstream toSlave(Pstream::commsTypes::scheduled, slave);
                toSlave << SubField<label>
                (
                    finalDecomp,
                    globalNumbers.localSize(slave),
                    globalNumbers.offset(slave)
                );
            }

            // Get my own part
            finalDecomp.setSize(points.size());

            return finalDecomp;
        }
        else
        {
            // Send my points
            {
                OPstream toMaster
                (
                    Pstream::commsTypes::scheduled,
                    Pstream::masterNo()
                );
                toMaster << points << weights;
            }

            // Receive back decomposition
            IPstream fromMaster
            (
                Pstream::commsTypes::scheduled,
                Pstream::masterNo()
            );
            labelList finalDecomp(fromMaster);

            return finalDecomp;
        }
    }
}


// ************************************************************************* //
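
How this decomposer is typically selected (a minimal sketch, not part of this
file): the run-time selection table entries above register simple as both a
decomposer and a distributor, so a system/decomposeParDict along the lines
below would select it.  The coefficients subdictionary name and its entries
are assumed from the geometric base class and common OpenFOAM conventions;
exact keywords may differ between versions.

    numberOfSubdomains  8;

    decomposer          simple;
    distributor         simple;

    simpleCoeffs
    {
        // Subdivisions in x, y and z; their product must equal
        // numberOfSubdomains (here 2*2*2 = 8)
        n               (2 2 2);
    }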