double_vector_with_halo.cc
1 // LIC// ====================================================================
2 // LIC// This file forms part of oomph-lib, the object-oriented,
3 // LIC// multi-physics finite-element library, available
4 // LIC// at http://www.oomph-lib.org.
5 // LIC//
6 // LIC// Copyright (C) 2006-2023 Matthias Heil and Andrew Hazel
7 // LIC//
8 // LIC// This library is free software; you can redistribute it and/or
9 // LIC// modify it under the terms of the GNU Lesser General Public
10 // LIC// License as published by the Free Software Foundation; either
11 // LIC// version 2.1 of the License, or (at your option) any later version.
12 // LIC//
13 // LIC// This library is distributed in the hope that it will be useful,
14 // LIC// but WITHOUT ANY WARRANTY; without even the implied warranty of
15 // LIC// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16 // LIC// Lesser General Public License for more details.
17 // LIC//
18 // LIC// You should have received a copy of the GNU Lesser General Public
19 // LIC// License along with this library; if not, write to the Free Software
20 // LIC// Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
21 // LIC// 02110-1301 USA.
22 // LIC//
23 // LIC// The authors may be contacted at oomph-lib@maths.man.ac.uk.
24 // LIC//
25 // LIC//====================================================================
 26 #include "double_vector_with_halo.h"
 27 
28 namespace oomph
29 {
30  //============================================================================
 31  /// Constructor that sets up the information required for communication
32  /// between all processors. Requires two "all to all" communications.
33  /// Arguments are the distribution of the DoubleVector and a
34  /// Vector of global unknowns required on this processor.
35  //===========================================================================
 36  DoubleVectorHaloScheme::DoubleVectorHaloScheme(
 37  LinearAlgebraDistribution* const& dist_pt,
38  const Vector<unsigned>& required_global_eqn)
39  : Distribution_pt(dist_pt)
40  {
41 #ifdef OOMPH_HAS_MPI
42  // Only bother to do anything if the vector is distributed
43  if (dist_pt->distributed())
44  {
45  // First create temporary maps for halo requests.
46  // Using the map structure ensures that the data will be sorted
 47  // into processor order, because the keys are the processor ranks
48 
49  // These are the halo requests indexed by master processor and the
50  // local equation number that is to be haloed on that processor
51  std::map<unsigned, Vector<unsigned>> to_be_haloed;
52  // These are the halo requests indexed by master processor and the
53  // index in the additional storage
54  // that corresponds to the halo data on this processor
55  std::map<unsigned, Vector<unsigned>> halo_entries;
56 
57  // Find rank of current processor
58  const unsigned my_rank =
59  static_cast<int>(dist_pt->communicator_pt()->my_rank());
60  // Loop over the desired equations (on this processor)
61  // and work out whether we need to halo them according to the
62  // given distribution
63  const unsigned n_global_eqn = required_global_eqn.size();
64  // Index for the locally stored halo values
65  unsigned index = 0;
66  for (unsigned n = 0; n < n_global_eqn; n++)
67  {
68  // Cache the required GLOBAL equation number
69  const unsigned i_global = required_global_eqn[n];
70  // Where is it stored?
71  unsigned rank_of_global = dist_pt->rank_of_global_row(i_global);
72  // If the equation is not stored locally then
73  // populate the two maps
74  if (my_rank != rank_of_global)
75  {
76  // Work out the local entry on the appropriate processor
77  unsigned i_local = i_global - dist_pt->first_row(rank_of_global);
78  // Mark the local storage index as halo with rank_of_global as master
79  halo_entries[rank_of_global].push_back(index);
80  // Mark the local equation of the rank_of_global as to be
81  // haloed
82  to_be_haloed[rank_of_global].push_back(i_local);
83  // Store the local index corresponding to the global equation
84  Local_index[i_global] = index;
85  // Increment the index
86  ++index;
87  }
88  }
89 
90  // We now need to tell the other processors which of their data are
91  // haloed on this processor
92 
93  // First find out how many processors there are!
94  const int n_proc = dist_pt->communicator_pt()->nproc();
95 
96  // Setup storage for number of data to be sent to each processor
97  Vector<int> send_n(n_proc, 0);
98  Vector<int> send_displacement(n_proc, 0);
99  int send_data_count = 0;
100 
101  // Iterate over the entries in the map
102  // This will be in rank order because of the ordering of the map
103  for (std::map<unsigned, Vector<unsigned>>::iterator it =
104  to_be_haloed.begin();
105  it != to_be_haloed.end();
106  ++it)
107  {
108  const unsigned rank = it->first;
109  const unsigned size_ = it->second.size();
110  // The displacement is the current number of data
111  send_displacement[rank] = send_data_count;
112  // The number to send is just the size of the array
113  send_n[rank] = static_cast<int>(size_);
114  send_data_count += size_;
115  }
116 
117  // Now send the number of haloed entries from every processor
118  // to every processor
119 
 120  // Receive the data directly into the storage for haloed data
121  Haloed_n.resize(n_proc, 0);
122  MPI_Alltoall(&send_n[0],
123  1,
124  MPI_INT,
125  &Haloed_n[0],
126  1,
127  MPI_INT,
128  dist_pt->communicator_pt()->mpi_comm());
129 
130  // Prepare the data to be sent
131  // Always resize to at least one
132  if (send_data_count == 0)
133  {
134  ++send_data_count;
135  }
136  Vector<unsigned> send_data(send_data_count);
137  // Iterate over the entries in the map
138  unsigned count = 0;
139  for (std::map<unsigned, Vector<unsigned>>::iterator it =
140  to_be_haloed.begin();
141  it != to_be_haloed.end();
142  ++it)
143  {
144  // Iterate over the vector
145  for (Vector<unsigned>::iterator it2 = it->second.begin();
146  it2 != it->second.end();
147  ++it2)
148  {
149  send_data[count] = (*it2);
150  ++count;
151  }
152  }
153 
154  // Prepare the data to be received,
155  // Again this can go directly into Haloed storage
156  int receive_data_count = 0;
157  Haloed_displacement.resize(n_proc);
158  for (int d = 0; d < n_proc; d++)
159  {
160  // The displacement is the amount of data received so far
161  Haloed_displacement[d] = receive_data_count;
162  receive_data_count += Haloed_n[d];
163  }
164 
165  // Now resize the receive buffer
166  // Always make sure that it has size of at least one
167  if (receive_data_count == 0)
168  {
169  ++receive_data_count;
170  }
171  Haloed_eqns.resize(receive_data_count);
172  // Send the data between all the processors
173  MPI_Alltoallv(&send_data[0],
174  &send_n[0],
175  &send_displacement[0],
176  MPI_UNSIGNED,
177  &Haloed_eqns[0],
178  &Haloed_n[0],
 179  &Haloed_displacement[0],
 180  MPI_UNSIGNED,
181  dist_pt->communicator_pt()->mpi_comm());
182 
183  // Finally, we translate the map of halo entries into the permanent
184  // storage
185  Halo_n.resize(n_proc, 0);
186  Halo_displacement.resize(n_proc, 0);
187 
188  // Loop over all the entries in the map
189  unsigned receive_haloed_count = 0;
190  for (int d = 0; d < n_proc; d++)
191  {
192  // Pointer to the map entry
193  std::map<unsigned, Vector<unsigned>>::iterator it =
194  halo_entries.find(d);
195  // If we don't have it in the map, skip
196  if (it == halo_entries.end())
197  {
198  Halo_displacement[d] = receive_haloed_count;
199  Halo_n[d] = 0;
200  }
201  else
202  {
203  Halo_displacement[d] = receive_haloed_count;
204  const int size_ = it->second.size();
205  Halo_n[d] = size_;
206  // Resize the equations to be sent
207  Halo_eqns.resize(receive_haloed_count + size_);
208  for (int i = 0; i < size_; i++)
209  {
210  Halo_eqns[receive_haloed_count + i] = it->second[i];
211  }
212  receive_haloed_count += size_;
213  }
214  }
215  }
216 #endif
217  }
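
To illustrate the first of the two "all to all" communications in isolation, here is a minimal standalone sketch in plain MPI (no oomph-lib types): each processor tells every other processor how many of its rows it needs to halo, which is the role played by the MPI_Alltoall call in the constructor above. The buffer names loosely mirror those in the constructor but are otherwise hypothetical.

#include <mpi.h>
#include <vector>

int main(int argc, char** argv)
{
  MPI_Init(&argc, &argv);
  int n_proc = 0;
  int my_rank = 0;
  MPI_Comm_size(MPI_COMM_WORLD, &n_proc);
  MPI_Comm_rank(MPI_COMM_WORLD, &my_rank);

  // Pretend this rank needs one entry from every other rank
  std::vector<int> send_n(n_proc, 1);
  send_n[my_rank] = 0;

  // After the call, receive_n[p] holds the number of entries that rank p
  // will request from this rank (the role played by Haloed_n above)
  std::vector<int> receive_n(n_proc, 0);
  MPI_Alltoall(
    &send_n[0], 1, MPI_INT, &receive_n[0], 1, MPI_INT, MPI_COMM_WORLD);

  MPI_Finalize();
  return 0;
}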
218 
219  //=====================================================================
220  /// Function that sets up a vector of pointers to halo
 221  /// data, indexed using the scheme in Local_index. The first argument
 222  /// is a map of pointers to all halo data, indexed by the global
 223  /// equation number
224  //====================================================================
 225  void DoubleVectorHaloScheme::setup_halo_dofs(
 226  const std::map<unsigned, double*>& halo_data_pt,
227  Vector<double*>& halo_dof_pt)
228  {
229  // How many entries are there in the map
230  unsigned n_halo = Local_index.size();
231  // Resize the vector
232  halo_dof_pt.resize(n_halo);
233 
234  // Loop over all the entries in the map
235  for (std::map<unsigned, unsigned>::iterator it = Local_index.begin();
236  it != Local_index.end();
237  ++it)
238  {
239  // Find the pointer in the halo_data_pt map
240  std::map<unsigned, double*>::const_iterator it2 =
241  halo_data_pt.find(it->first);
242  // Did we find it
243  if (it2 != halo_data_pt.end())
244  {
245  // Now set the entry
246  halo_dof_pt[it->second] = it2->second;
247  }
248  else
249  {
250  std::ostringstream error_stream;
251  error_stream << "Global equation " << it->first
 252  << " required as halo is not stored in halo_data_pt\n";
253 
254  throw OomphLibError(
255  error_stream.str(), OOMPH_CURRENT_FUNCTION, OOMPH_EXCEPTION_LOCATION);
256  }
257  }
258  }
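
A brief usage sketch for setup_halo_dofs(): the caller hands over a map from global equation number to a pointer at the corresponding halo datum and gets back a vector ordered by the local halo index stored in Local_index. The variable names below (halo_scheme_pt, halo_storage, my_halo_global_eqn, n_halo_eqns) are placeholders for whatever the calling code actually holds.

// Placeholder set-up: one double of storage per required halo equation
std::map<unsigned, double*> halo_data_pt;
Vector<double> halo_storage(n_halo_eqns);
for (unsigned i = 0; i < n_halo_eqns; i++)
{
  halo_data_pt[my_halo_global_eqn[i]] = &halo_storage[i];
}

// Translate the map into a vector indexed by the scheme's local halo index
Vector<double*> halo_dof_pt;
halo_scheme_pt->setup_halo_dofs(halo_data_pt, halo_dof_pt);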
259 
260  //------------------------------------------------------------------
261  // Member functions for the DoubleVectorWithHaloEntries
262  //-------------------------------------------------------------------
263 
264 
265  //=========================================================================
266  /// Synchronise the halo data within the vector. This requires one
 267  /// "all to all" communication.
268  //====================================================================
 269  void DoubleVectorWithHaloEntries::synchronise()
 270  {
271 #ifdef OOMPH_HAS_MPI
272  // Only need to do anything if the DoubleVector is distributed
273  if (this->distributed())
274  {
275  // Read out the number of entries to send
276  const unsigned n_send = Halo_scheme_pt->Haloed_eqns.size();
277  Vector<double> send_data(n_send);
278  // Read out the data values
279  for (unsigned i = 0; i < n_send; i++)
280  {
281  send_data[i] = (*this)[Halo_scheme_pt->Haloed_eqns[i]];
282  }
283 
284  // Read out the number of entries to receive
285  const unsigned n_receive = Halo_scheme_pt->Halo_eqns.size();
286  Vector<double> receive_data(n_receive);
287 
288  // Make sure that the send and receive data have size at least one
289  if (n_send == 0)
290  {
291  send_data.resize(1);
292  }
293  if (n_receive == 0)
294  {
295  receive_data.resize(1);
296  }
297  // Communicate
 298  MPI_Alltoallv(&send_data[0],
 299  &Halo_scheme_pt->Haloed_n[0],
 300  &Halo_scheme_pt->Haloed_displacement[0],
 301  MPI_DOUBLE,
 302  &receive_data[0],
 303  &Halo_scheme_pt->Halo_n[0],
 304  &Halo_scheme_pt->Halo_displacement[0],
 305  MPI_DOUBLE,
306  this->distribution_pt()->communicator_pt()->mpi_comm());
307 
308 
309  // Now I need simply to update my local values
310  for (unsigned i = 0; i < n_receive; i++)
311  {
312  Halo_value[Halo_scheme_pt->Halo_eqns[i]] = receive_data[i];
313  }
314  }
315 #endif
316  }
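
The variable-length exchange in synchronise() follows the standard MPI_Alltoallv pattern. The standalone plain-MPI sketch below (intended for exactly two processes; all counts, displacements and values are hard-coded, hypothetical numbers) shows how the four count/displacement arrays line up with the two data buffers.

#include <mpi.h>
#include <vector>

int main(int argc, char** argv)
{
  MPI_Init(&argc, &argv);
  int my_rank = 0;
  MPI_Comm_rank(MPI_COMM_WORLD, &my_rank);

  // Rank 0 owns two haloed values required by rank 1; rank 1 owns one
  // haloed value required by rank 0 (run with exactly two processes)
  std::vector<double> send_data;
  std::vector<double> recv_data;
  std::vector<int> send_n(2), send_disp(2), recv_n(2), recv_disp(2);
  if (my_rank == 0)
  {
    send_data = {1.0, 2.0};
    send_n = {0, 2};  send_disp = {0, 0};
    recv_n = {0, 1};  recv_disp = {0, 0};
    recv_data.resize(1);
  }
  else
  {
    send_data = {3.0};
    send_n = {1, 0};  send_disp = {0, 1};
    recv_n = {2, 0};  recv_disp = {0, 2};
    recv_data.resize(2);
  }

  // Same call pattern as synchronise(): per-rank counts and displacements
  MPI_Alltoallv(&send_data[0], &send_n[0], &send_disp[0], MPI_DOUBLE,
                &recv_data[0], &recv_n[0], &recv_disp[0], MPI_DOUBLE,
                MPI_COMM_WORLD);

  MPI_Finalize();
  return 0;
}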
317 
318  //=========================================================================
 319  /// Gather all the data from multiple processors and sum the result,
320  /// which will be stored in the master copy and then synchronised to
321  /// all copies. This requires two "all to all" communications
322  //====================================================================
 323  void DoubleVectorWithHaloEntries::sum_all_halo_and_haloed_values()
 324  {
325 #ifdef OOMPH_HAS_MPI
326  // Only need to do anything if the DoubleVector is distributed
327  if (this->distributed())
328  {
329  // Send the Halo entries to the master processor
330  const unsigned n_send = Halo_scheme_pt->Halo_eqns.size();
331  Vector<double> send_data(n_send);
332  // Read out the data values
333  for (unsigned i = 0; i < n_send; i++)
334  {
335  send_data[i] = Halo_value[Halo_scheme_pt->Halo_eqns[i]];
336  }
337 
338  // Read out the number of entries to receive
339  const unsigned n_receive = Halo_scheme_pt->Haloed_eqns.size();
340  Vector<double> receive_data(n_receive);
341 
342  // Make sure that the send and receive data have size at least one
343  if (n_send == 0)
344  {
345  send_data.resize(1);
346  }
347  if (n_receive == 0)
348  {
349  receive_data.resize(1);
350  }
351  // Communicate
 352  MPI_Alltoallv(&send_data[0],
 353  &Halo_scheme_pt->Halo_n[0],
 354  &Halo_scheme_pt->Halo_displacement[0],
 355  MPI_DOUBLE,
 356  &receive_data[0],
 357  &Halo_scheme_pt->Haloed_n[0],
 358  &Halo_scheme_pt->Haloed_displacement[0],
 359  MPI_DOUBLE,
360  this->distribution_pt()->communicator_pt()->mpi_comm());
361 
362 
363  // Now I need simply to update and sum my local values
364  for (unsigned i = 0; i < n_receive; i++)
365  {
366  (*this)[Halo_scheme_pt->Haloed_eqns[i]] += receive_data[i];
367  }
368 
369  // Then synchronise
370  this->synchronise();
371  }
372 #endif
373  }
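
The function above supports an assemble-then-reduce workflow: every process adds its contributions into whichever copy of an equation it holds, and a single call then produces consistent totals everywhere. The sketch below is hypothetical; it assumes the vector's global_value() accessor (declared in the corresponding header) and uses placeholder names for the element loop and the contributions.

// Hypothetical assembly: add contributions into whichever copy (master
// or halo) of each global equation this process holds
residuals.initialise(0.0);
for (unsigned e = 0; e < n_local_element; e++)
{
  for (unsigned j = 0; j < n_dof_in_element[e]; j++)
  {
    const unsigned i_global = global_eqn_number(e, j);
    residuals.global_value(i_global) += contribution(e, j);
  }
}

// Sum the partial results on the master copies and push the totals
// back out to every halo copy
residuals.sum_all_halo_and_haloed_values();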
374 
375 
376  //===================================================================
377  /// Construct the halo scheme and storage for the halo data
378  //=====================================================================
 379  void DoubleVectorWithHaloEntries::build_halo_scheme(
 380  DoubleVectorHaloScheme* const& halo_scheme_pt)
381  {
 382  Halo_scheme_pt = halo_scheme_pt;
 383 
384  if (Halo_scheme_pt != 0)
385  {
386  // Need to set up the halo data
387  unsigned n_halo_data = halo_scheme_pt->Local_index.size();
388 
389  // Resize the halo storage
390  Halo_value.resize(n_halo_data);
391 
392  // Now let's get the initial values from the other processors
393  this->synchronise();
394  }
395  }
396 
397 
398 } // namespace oomph
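
Finally, a hypothetical sketch of how the pieces fit together; the DoubleVectorWithHaloEntries constructor argument and the choice of required equations are assumptions for illustration, not taken from this file.

// dist_pt is an existing, distributed LinearAlgebraDistribution*
Vector<unsigned> required_global_eqn;
required_global_eqn.push_back(2); // off-processor equations needed locally
required_global_eqn.push_back(3);

// Two "all to all" communications set up the halo bookkeeping
DoubleVectorHaloScheme* halo_scheme_pt =
  new DoubleVectorHaloScheme(dist_pt, required_global_eqn);

// Attach the scheme to a distributed vector (constructor assumed to take
// the distribution); this sizes Halo_value and pulls the current values
// over from their master processors via synchronise()
DoubleVectorWithHaloEntries halo_vector(dist_pt);
halo_vector.build_halo_scheme(halo_scheme_pt);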