Block-Structured AMR Software Framework
Loading...
Searching...
No Matches
AMReX_ParticleTile.H
Go to the documentation of this file.
1#ifndef AMREX_PARTICLETILE_H_
2#define AMREX_PARTICLETILE_H_
3#include <AMReX_Config.H>
4
5#include <AMReX_Extension.H>
6#include <AMReX_Particle.H>
9#include <AMReX_Vector.H>
10#include <AMReX_REAL.H>
11#include <AMReX_RealVect.H>
12
13#include <array>
14#include <atomic>
15#include <string>
16#include <type_traits>
17#include <vector>
18
19
20namespace amrex {
21
22// Forward Declaration
23template <int NArrayReal, int NArrayInt>
24struct ConstSoAParticle;
25template <int NArrayReal, int NArrayInt>
26struct SoAParticle;
27
28template <typename T_ParticleType, int NArrayReal, int NArrayInt>
29struct ConstParticleTileData;
30
32template <typename T_ParticleType, int NArrayReal, int NArrayInt>
34{
35 static constexpr int NAR = NArrayReal;
36 static constexpr int NAI = NArrayInt;
37
38 using ParticleType = T_ParticleType;
39 using ParticleRefType = T_ParticleType&;
42 using IntType = int;
43
44 static constexpr int NStructReal = ParticleType::NReal;
45 static constexpr int NStructInt = ParticleType::NInt;
46
48
49 static constexpr bool is_particle_tile_data = true;
50
52
53 using AOS_PTR = std::conditional_t<T_ParticleType::is_soa_particle,
56
57 uint64_t* m_idcpu;
60
65
67 decltype(auto) pos (const int dir, const int index) const &
68 {
69 if constexpr(!ParticleType::is_soa_particle) {
70 return this->m_aos[index].pos(dir);
71 } else {
72 return this->m_rdata[dir][index];
73 }
74 }
75
77 decltype(auto) id (const int index) const &
78 {
79 if constexpr(!ParticleType::is_soa_particle) {
80 return this->m_aos[index].id();
81 } else {
82 return ParticleIDWrapper(this->m_idcpu[index]);
83 }
84 }
85
87 decltype(auto) cpu (const int index) const &
88 {
89 if constexpr(!ParticleType::is_soa_particle) {
90 return this->m_aos[index].cpu();
91 } else {
92 return ParticleCPUWrapper(this->m_idcpu[index]);
93 }
94 }
95
97 decltype(auto) idcpu (const int index) const &
98 {
99 if constexpr(ParticleType::is_soa_particle) {
100 return this->m_idcpu[index];
101 } else {
102 return this->m_aos[index].idcpu();
103 }
104 }
105
107 ParticleReal * rdata (const int attribute_index) const
108 {
109 return this->m_rdata[attribute_index];
110 }
111
113 int * idata (const int attribute_index) const
114 {
115 return this->m_idata[attribute_index];
116 }
117
119 decltype(auto) operator[] (const int index) const
120 {
121 if constexpr (!ParticleType::is_soa_particle) {
122 return m_aos[index];
123 } else {
124 return SoAParticle<NAR, NAI>(*this, index);
125 }
126 }
127
129 void packParticleData (char* buffer, int src_index, std::size_t dst_offset,
130 const int* comm_real, const int * comm_int) const noexcept
131 {
132 AMREX_ASSERT(src_index < m_size);
133 auto* dst = buffer + dst_offset;
134 if constexpr (!ParticleType::is_soa_particle) {
135 memcpy(dst, m_aos + src_index, sizeof(ParticleType));
136 dst += sizeof(ParticleType);
137 } else {
138 memcpy(dst, m_idcpu + src_index, sizeof(uint64_t));
139 dst += sizeof(uint64_t);
140 }
141 int array_start_index = 0;
142 if constexpr (!ParticleType::is_soa_particle) {
143 array_start_index = AMREX_SPACEDIM + NStructReal;
144 }
145 for (int i = 0; i < NAR; ++i)
146 {
147 if (comm_real[array_start_index + i])
148 {
149 memcpy(dst, m_rdata[i] + src_index, sizeof(ParticleReal));
150 dst += sizeof(ParticleReal);
151 }
152 }
153 int runtime_start_index = array_start_index + NAR;
154 for (int i = 0; i < m_num_runtime_real; ++i)
155 {
156 if (comm_real[runtime_start_index + i])
157 {
158 memcpy(dst, m_runtime_rdata[i] + src_index, sizeof(ParticleReal));
159 dst += sizeof(ParticleReal);
160 }
161 }
162 array_start_index = 2 + NStructInt;
163 for (int i = 0; i < NAI; ++i)
164 {
165 if (comm_int[array_start_index + i])
166 {
167 memcpy(dst, m_idata[i] + src_index, sizeof(int));
168 dst += sizeof(int);
169 }
170 }
171 runtime_start_index = 2 + NStructInt + NAI;
172 for (int i = 0; i < m_num_runtime_int; ++i)
173 {
174 if (comm_int[runtime_start_index + i])
175 {
176 memcpy(dst, m_runtime_idata[i] + src_index, sizeof(int));
177 dst += sizeof(int);
178 }
179 }
180 }
181
183 void unpackParticleData (const char* buffer, Long src_offset, int dst_index,
184 const int* comm_real, const int* comm_int) const noexcept
185 {
186 AMREX_ASSERT(dst_index < m_size);
187 const auto* src = buffer + src_offset;
188 if constexpr (!ParticleType::is_soa_particle) {
189 memcpy(m_aos + dst_index, src, sizeof(ParticleType));
190 src += sizeof(ParticleType);
191 } else {
192 memcpy(m_idcpu + dst_index, src, sizeof(uint64_t));
193 src += sizeof(uint64_t);
194 }
195 int array_start_index = 0;
196 if constexpr (!ParticleType::is_soa_particle) {
197 array_start_index = AMREX_SPACEDIM + NStructReal;
198 }
199 if constexpr (NAR > 0) {
200 for (int i = 0; i < NAR; ++i)
201 {
202 if (comm_real[array_start_index + i])
203 {
204 memcpy(m_rdata[i] + dst_index, src, sizeof(ParticleReal));
205 src += sizeof(ParticleReal);
206 }
207 }
208 }
209 int runtime_start_index = array_start_index + NAR;
210 for (int i = 0; i < m_num_runtime_real; ++i)
211 {
212 if (comm_real[runtime_start_index + i])
213 {
214 memcpy(m_runtime_rdata[i] + dst_index, src, sizeof(ParticleReal));
215 src += sizeof(ParticleReal);
216 }
217 }
218 array_start_index = 2 + NStructInt;
219 if constexpr (NAI > 0) {
220 for (int i = 0; i < NAI; ++i)
221 {
222 if (comm_int[array_start_index + i])
223 {
224 memcpy(m_idata[i] + dst_index, src, sizeof(int));
225 src += sizeof(int);
226 }
227 }
228 }
229 runtime_start_index = 2 + NStructInt + NAI;
230 for (int i = 0; i < m_num_runtime_int; ++i)
231 {
232 if (comm_int[runtime_start_index + i])
233 {
234 memcpy(m_runtime_idata[i] + dst_index, src, sizeof(int));
235 src += sizeof(int);
236 }
237 }
238 }
239
240 template <typename T = ParticleType, std::enable_if_t<!T::is_soa_particle, int> = 0>
242 SuperParticleType getSuperParticle (int index) const noexcept
243 {
244 AMREX_ASSERT(index < m_size);
246 for (int i = 0; i < AMREX_SPACEDIM; ++i) {
247 sp.pos(i) = m_aos[index].pos(i);
248 }
249 for (int i = 0; i < NStructReal; ++i) {
250 sp.rdata(i) = m_aos[index].rdata(i);
251 }
252 if constexpr (NAR >0) {
253 for (int i = 0; i < NAR; ++i) {
254 sp.rdata(NStructReal+i) = m_rdata[i][index];
255 }
256 }
257 sp.id() = m_aos[index].id();
258 sp.cpu() = m_aos[index].cpu();
259 for (int i = 0; i < NStructInt; ++i) {
260 sp.idata(i) = m_aos[index].idata(i);
261 }
262 if constexpr (NAI > 0) {
263 for (int i = 0; i < NAI; ++i) {
264 sp.idata(NStructInt+i) = m_idata[i][index];
265 }
266 }
267 return sp;
268 }
269
270 template <typename T = ParticleType, std::enable_if_t<T::is_soa_particle, int> = 0>
272 SuperParticleType getSuperParticle (int index) const noexcept
273 {
274 AMREX_ASSERT(index < m_size);
276 sp.m_idcpu = m_idcpu[index];
277 for (int i = 0; i < AMREX_SPACEDIM; ++i) {sp.pos(i) = m_rdata[i][index];}
278 for (int i = 0; i < NAR; ++i) {
279 sp.rdata(i) = m_rdata[i][index];
280 }
281 for (int i = 0; i < NAI; ++i) {
282 sp.idata(i) = m_idata[i][index];
283 }
284 return sp;
285 }
286
287 template <typename T = ParticleType, std::enable_if_t<!T::is_soa_particle, int> = 0>
289 void setSuperParticle (const SuperParticleType& sp, int index) const noexcept
290 {
291 for (int i = 0; i < AMREX_SPACEDIM; ++i) {
292 m_aos[index].pos(i) = sp.pos(i);
293 }
294 for (int i = 0; i < NStructReal; ++i) {
295 m_aos[index].rdata(i) = sp.rdata(i);
296 }
297 for (int i = 0; i < NAR; ++i) {
298 m_rdata[i][index] = sp.rdata(NStructReal+i);
299 }
300 m_aos[index].id() = sp.id();
301 m_aos[index].cpu() = sp.cpu();
302 for (int i = 0; i < NStructInt; ++i) {
303 m_aos[index].idata(i) = sp.idata(i);
304 }
305 for (int i = 0; i < NAI; ++i) {
306 m_idata[i][index] = sp.idata(NStructInt+i);
307 }
308 }
309
310 template <typename T = ParticleType, std::enable_if_t<T::is_soa_particle, int> = 0>
312 void setSuperParticle (const SuperParticleType& sp, int index) const noexcept
313 {
314 m_idcpu[index] = sp.m_idcpu;
315 for (int i = 0; i < NAR; ++i) {
316 m_rdata[i][index] = sp.rdata(i);
317 }
318 for (int i = 0; i < NAI; ++i) {
319 m_idata[i][index] = sp.idata(i);
320 }
321 }
322};
323
324// SOA Particle Structure
325template <int T_NArrayReal, int T_NArrayInt>
326struct alignas(sizeof(double)) ConstSoAParticle : SoAParticleBase
327{
328 static constexpr int NArrayReal = T_NArrayReal;
329 static constexpr int NArrayInt = T_NArrayInt;
332 static constexpr bool is_soa_particle = true;
333 static constexpr bool is_rtsoa_particle = false;
334 static constexpr bool is_constsoa_particle = true;
335
337 using IntType = int;
338
340 ConstSoAParticle (ConstPTD const& ptd, long i) : // Note: should this be int instead?
341 m_constparticle_tile_data(ptd), m_index(int(i))
342 {
343 }
344
345 //static Long the_next_id;
346
347 //functions to get id and cpu in the SOA data
348
350 ConstParticleCPUWrapper cpu () const { return this->m_constparticle_tile_data.m_idcpu[m_index]; }
351
353 ConstParticleIDWrapper id () const { return this->m_constparticle_tile_data.m_idcpu[m_index]; }
354
355 //functions to get positions of the particle in the SOA data
356
358 RealVect pos () const & {return RealVect(AMREX_D_DECL(this->m_constparticle_tile_data.m_rdata[0][m_index], this->m_constparticle_tile_data.m_rdata[1][m_index], this->m_constparticle_tile_data.m_rdata[2][m_index]));}
359
361 const RealType& pos (int position_index) const &
362 {
363 AMREX_ASSERT(position_index < AMREX_SPACEDIM);
364 return this->m_constparticle_tile_data.m_rdata[position_index][m_index];
365 }
366
367 static Long NextID ();
368
373
379 static void NextID (Long nextid);
380
381 private :
382
383 static_assert(std::is_trivially_copyable<ConstPTD>(), "ParticleTileData is not trivially copyable");
384
385 ConstPTD m_constparticle_tile_data;
386 int m_index;
387};
388
389template <int T_NArrayReal, int T_NArrayInt>
390struct alignas(sizeof(double)) SoAParticle : SoAParticleBase
391{
392 static constexpr int NArrayReal = T_NArrayReal;
393 static constexpr int NArrayInt = T_NArrayInt;
396 static constexpr bool is_soa_particle = true;
397 static constexpr bool is_rtsoa_particle = false;
398 static constexpr bool is_constsoa_particle = false;
399
402 using IntType = int;
403
405 SoAParticle (PTD const& ptd, long i) : // Note: should this be int instead?
406 m_particle_tile_data(ptd), m_index(int(i))
407 {
408 }
409
411
412 //functions to get id and cpu in the SOA data
413
415 ParticleCPUWrapper cpu () & { return this->m_particle_tile_data.m_idcpu[m_index]; }
416
418 ParticleIDWrapper<> id () & { return this->m_particle_tile_data.m_idcpu[m_index]; }
419
421 uint64_t& idcpu () & { return this->m_particle_tile_data.m_idcpu[m_index]; }
422
424 ConstParticleCPUWrapper cpu () const & { return this->m_particle_tile_data.m_idcpu[m_index]; }
425
427 ConstParticleIDWrapper id () const & { return this->m_particle_tile_data.m_idcpu[m_index]; }
428
430 const uint64_t& idcpu () const & { return this->m_particle_tile_data.m_idcpu[m_index]; }
431
432 //functions to get positions of the particle in the SOA data
433
435 RealVect pos () const & {return RealVect(AMREX_D_DECL(this->m_particle_tile_data.m_rdata[0][m_index], this->m_particle_tile_data.m_rdata[1][m_index], this->m_particle_tile_data.m_rdata[2][m_index]));}
436
438 RealType& pos (int position_index) &
439 {
440 AMREX_ASSERT(position_index < AMREX_SPACEDIM);
441 return this->m_particle_tile_data.m_rdata[position_index][m_index];
442 }
443
445 RealType pos (int position_index) const &
446 {
447 AMREX_ASSERT(position_index < AMREX_SPACEDIM);
448 return this->m_particle_tile_data.m_rdata[position_index][m_index];
449 }
450
451 static Long NextID ();
452
456 static Long UnprotectedNextID ();
457
463 static void NextID (Long nextid);
464
465private :
466
467 static_assert(std::is_trivially_copyable<PTD>(), "ParticleTileData is not trivially copyable");
468
469 PTD m_particle_tile_data;
470 int m_index;
471};
472
473//template <int NArrayReal, int NArrayInt> Long ConstSoAParticle<NArrayReal, NArrayInt>::the_next_id = 1;
474template <int NArrayReal, int NArrayInt> Long SoAParticle<NArrayReal, NArrayInt>::the_next_id = 1;
475
476template <int NArrayReal, int NArrayInt>
477Long
479{
480 Long next;
481// we should be able to test on _OPENMP < 201107 for capture (version 3.1)
482// but we must work around a bug in gcc < 4.9
483#if defined(AMREX_USE_OMP) && defined(_OPENMP) && _OPENMP < 201307
484#pragma omp critical (amrex_particle_nextid)
485#elif defined(AMREX_USE_OMP)
486#pragma omp atomic capture
487#endif
488 next = the_next_id++;
489
491 amrex::Abort("SoAParticle<NArrayReal, NArrayInt>::NextID() -- too many particles");
492 }
493
494 return next;
495}
496
497template <int NArrayReal, int NArrayInt>
498Long
500{
501 Long next = the_next_id++;
503 amrex::Abort("SoAParticle<NArrayReal, NArrayInt>::NextID() -- too many particles");
504 }
505 return next;
506}
507
508template <int NArrayReal, int NArrayInt>
509void
511{
512 the_next_id = nextid;
513}
514
515template <typename T_ParticleType, int NArrayReal, int NArrayInt>
517{
518 static constexpr int NAR = NArrayReal;
519 static constexpr int NAI = NArrayInt;
520 using ParticleType = T_ParticleType;
521 using ParticleRefType = T_ParticleType const&;
523 using IntType = int;
524
525 static constexpr int NStructReal = ParticleType::NReal;
526 static constexpr int NStructInt = ParticleType::NInt;
527
529
530 static constexpr bool is_particle_tile_data = true;
531
533
534 using AOS_PTR = std::conditional_t<T_ParticleType::is_soa_particle,
535 void const * AMREX_RESTRICT, ParticleType const * AMREX_RESTRICT>;
537
538 const uint64_t* m_idcpu;
541
543 decltype(auto) pos (const int dir, const int index) const &
544 {
545 if constexpr(!ParticleType::is_soa_particle) {
546 return this->m_aos[index].pos(dir);
547 } else {
548 return this->m_rdata[dir][index];
549 }
550 }
551
553 decltype(auto) id (const int index) const &
554 {
555 if constexpr(!ParticleType::is_soa_particle) {
556 return this->m_aos[index].id();
557 } else {
558 return ConstParticleIDWrapper(this->m_idcpu[index]);
559 }
560 }
561
563 decltype(auto) cpu (const int index) const &
564 {
565 if constexpr(!ParticleType::is_soa_particle) {
566 return this->m_aos[index].cpu();
567 } else {
568 return ConstParticleCPUWrapper(this->m_idcpu[index]);
569 }
570 }
571
573 decltype(auto) idcpu (const int index) const &
574 {
575 if constexpr(ParticleType::is_soa_particle) {
576 return this->m_idcpu[index];
577 } else {
578 return this->m_aos[index].idcpu();
579 }
580 }
581
583 const ParticleReal * rdata (const int attribute_index) const
584 {
585 return this->m_rdata[attribute_index];
586 }
587
589 const int * idata (const int attribute_index) const
590 {
591 return this->m_idata[attribute_index];
592 }
593
595 decltype(auto) operator[] (const int index) const
596 {
597 if constexpr (!ParticleType::is_soa_particle) {
598 return m_aos[index];
599 } else {
600 return ConstSoAParticle<NAR, NAI>(*this, index);
601 }
602 }
603
608
610 void packParticleData(char* buffer, int src_index, Long dst_offset,
611 const int* comm_real, const int * comm_int) const noexcept
612 {
613 AMREX_ASSERT(src_index < m_size);
614 auto* dst = buffer + dst_offset;
615 if constexpr (!ParticleType::is_soa_particle) {
616 memcpy(dst, m_aos + src_index, sizeof(ParticleType));
617 dst += sizeof(ParticleType);
618 } else {
619 memcpy(dst, m_idcpu + src_index, sizeof(uint64_t));
620 dst += sizeof(uint64_t);
621 }
622 int array_start_index = 0;
623 if constexpr (!ParticleType::is_soa_particle) {
624 array_start_index = AMREX_SPACEDIM + NStructReal;
625 }
626 if constexpr (NArrayReal > 0) {
627 for (int i = 0; i < NArrayReal; ++i)
628 {
629 if (comm_real[array_start_index + i])
630 {
631 memcpy(dst, m_rdata[i] + src_index, sizeof(ParticleReal));
632 dst += sizeof(ParticleReal);
633 }
634 }
635 }
636 int runtime_start_index = array_start_index + NArrayReal;
637 for (int i = 0; i < m_num_runtime_real; ++i)
638 {
639 if (comm_real[runtime_start_index + i])
640 {
641 memcpy(dst, m_runtime_rdata[i] + src_index, sizeof(ParticleReal));
642 dst += sizeof(ParticleReal);
643 }
644 }
645 array_start_index = 2 + NStructInt;
646 if constexpr (NArrayInt > 0) {
647 for (int i = 0; i < NArrayInt; ++i)
648 {
649 if (comm_int[array_start_index + i])
650 {
651 memcpy(dst, m_idata[i] + src_index, sizeof(int));
652 dst += sizeof(int);
653 }
654 }
655 }
656 runtime_start_index = 2 + NStructInt + NArrayInt;
657 for (int i = 0; i < m_num_runtime_int; ++i)
658 {
659 if (comm_int[runtime_start_index + i])
660 {
661 memcpy(dst, m_runtime_idata[i] + src_index, sizeof(int));
662 dst += sizeof(int);
663 }
664 }
665 }
666
667 template <typename T = ParticleType, std::enable_if_t<!T::is_soa_particle, int> = 0>
669 SuperParticleType getSuperParticle (int index) const noexcept
670 {
671 AMREX_ASSERT(index < m_size);
673 for (int i = 0; i < AMREX_SPACEDIM; ++i) {
674 sp.pos(i) = m_aos[index].pos(i);
675 }
676 for (int i = 0; i < NStructReal; ++i) {
677 sp.rdata(i) = m_aos[index].rdata(i);
678 }
679 if constexpr(NArrayReal > 0) {
680 for (int i = 0; i < NArrayReal; ++i) {
681 sp.rdata(NStructReal+i) = m_rdata[i][index];
682 }
683 }
684 sp.id() = m_aos[index].id();
685 sp.cpu() = m_aos[index].cpu();
686 for (int i = 0; i < NStructInt; ++i) {
687 sp.idata(i) = m_aos[index].idata(i);
688 }
689 if constexpr(NArrayInt > 0) {
690 for (int i = 0; i < NArrayInt; ++i) {
691 sp.idata(NStructInt+i) = m_idata[i][index];
692 }
693 }
694 return sp;
695 }
696
697 template <typename T = ParticleType, std::enable_if_t<T::is_soa_particle, int> = 0>
699 SuperParticleType getSuperParticle (int index) const noexcept
700 {
701 AMREX_ASSERT(index < m_size);
703 for (int i = 0; i < AMREX_SPACEDIM; ++i) {sp.pos(i) = m_rdata[i][index];}
704 sp.m_idcpu = m_idcpu[index];
705 for (int i = 0; i < NAR; ++i) {
706 sp.rdata(i) = m_rdata[i][index];
707 }
708 for (int i = 0; i < NAI; ++i) {
709 sp.idata(i) = m_idata[i][index];
710 }
711 return sp;
712 }
713};
714
716
720
722{
723 RuntimePtrCacheDirtyFlag () noexcept = default;
724
726
728 : m_value(true)
729 {}
730
732 : m_value(true)
733 {}
734
736 {
737 m_value.store(true, std::memory_order_relaxed);
738 return *this;
739 }
740
742 {
743 m_value.store(true, std::memory_order_relaxed);
744 return *this;
745 }
746
747 void store (bool value, std::memory_order order = std::memory_order_seq_cst) noexcept
748 {
749 m_value.store(value, order);
750 }
751
752 [[nodiscard]] bool load (std::memory_order order = std::memory_order_seq_cst) const noexcept
753 {
754 return m_value.load(order);
755 }
756
757private:
758 std::atomic<bool> m_value {true};
759};
760
761template <typename T_ParticleType, int NArrayReal, int NArrayInt,
762 template<class> class Allocator=DefaultAllocator>
764{
765 template <typename T>
766 using AllocatorType = Allocator<T>;
767
768 using ParticleType = T_ParticleType;
769 static constexpr int NAR = NArrayReal;
770 static constexpr int NAI = NArrayInt;
771 using RealType = typename ParticleType::RealType;
772
773 static constexpr int NStructReal = ParticleType::NReal;
774 static constexpr int NStructInt = ParticleType::NInt;
775
777
778 using AoS = std::conditional_t<
779 ParticleType::is_soa_particle,
782 using ParticleVector = typename AoS::ParticleVector;
783
784 using SoA = std::conditional_t<
785 ParticleType::is_soa_particle,
788 using RealVector = typename SoA::RealVector;
789 using IntVector = typename SoA::IntVector;
790 using StorageParticleType = typename ParticleType::StorageParticleType;
791
794
795 static constexpr bool has_polymorphic_allocator =
797
798 ParticleTile () = default;
799
800#ifndef _WIN32 // workaround windows compiler bug
801 ~ParticleTile () = default;
802
803 ParticleTile (ParticleTile const&) = delete;
804 ParticleTile (ParticleTile &&) noexcept = default;
805
806 ParticleTile& operator= (ParticleTile const&) = delete;
807 ParticleTile& operator= (ParticleTile &&) noexcept = default;
808#endif
809
810 void define (
811 int a_num_runtime_real,
812 int a_num_runtime_int,
813 std::vector<std::string>* soa_rdata_names=nullptr,
814 std::vector<std::string>* soa_idata_names=nullptr,
815 Arena* a_arena=nullptr
816 )
817 {
818 GetStructOfArrays().define(a_num_runtime_real, a_num_runtime_int, soa_rdata_names, soa_idata_names);
819 m_runtime_r_ptrs.resize(a_num_runtime_real);
820 m_runtime_i_ptrs.resize(a_num_runtime_int);
821 m_runtime_r_cptrs.resize(a_num_runtime_real);
822 m_runtime_i_cptrs.resize(a_num_runtime_int);
823
824 if constexpr (has_polymorphic_allocator) {
825 if (m_defined) {
826 // it is not allowed to change the arena after the tile has been defined
827 if constexpr (ParticleType::is_soa_particle) {
829 a_arena == GetStructOfArrays().GetIdCPUData().arena(),
830 "ParticleTile with PolymorphicArenaAllocator redefined with "
831 "different memory arena");
832 } else {
834 a_arena == m_aos_tile().arena(),
835 "ParticleTile with PolymorphicArenaAllocator redefined with "
836 "different memory arena");
837 }
838 }
839
840 AMREX_ALWAYS_ASSERT_WITH_MESSAGE(a_arena != nullptr,
841 "ParticleTile with PolymorphicArenaAllocator defined with no memory arena! "
842 "Make sure to call setArena() on the ParticleContainer before initialization or "
843 "to pass an Arena to ParticleTile::define()");
844
845 if constexpr (ParticleType::is_soa_particle) {
846 GetStructOfArrays().GetIdCPUData().setArena(a_arena);
847 } else {
848 m_aos_tile().setArena(a_arena);
849 }
850 for (int j = 0; j < NumRealComps(); ++j) {
851 GetStructOfArrays().GetRealData(j).setArena(a_arena);
852 }
853 for (int j = 0; j < NumIntComps(); ++j) {
854 GetStructOfArrays().GetIntData(j).setArena(a_arena);
855 }
856 }
857
858 m_defined = true;
859 invalidateRuntimePtrCaches();
860 }
861
862 // Get id data
863 decltype(auto) id (int index) & {
864 if constexpr (!ParticleType::is_soa_particle) {
865 return m_aos_tile[index].id();
866 } else {
867 return ParticleIDWrapper(m_soa_tile.GetIdCPUData()[index]);
868 }
869 }
870
871 // const
872 decltype(auto) id (int index) const & {
873 if constexpr (!ParticleType::is_soa_particle) {
874 return m_aos_tile[index].id();
875 } else {
876 return ConstParticleIDWrapper(m_soa_tile.GetIdCPUData()[index]);
877 }
878 }
879
880 // Get cpu data
881 decltype(auto) cpu (int index) & {
882 if constexpr (!ParticleType::is_soa_particle) {
883 return m_aos_tile[index].cpu();
884 } else {
885 return ParticleCPUWrapper(m_soa_tile.GetIdCPUData()[index]);
886 }
887 }
888
889 // const
890 decltype(auto) cpu (int index) const & {
891 if constexpr (!ParticleType::is_soa_particle) {
892 return m_aos_tile[index].cpu();
893 } else {
894 return ConstParticleCPUWrapper(m_soa_tile.GetIdCPUData()[index]);
895 }
896 }
897
898 // Get positions data
899 RealType& pos (int index, int position_index) & {
900 if constexpr (!ParticleType::is_soa_particle) {
901 return m_aos_tile[index].pos(position_index);
902 } else {
903 static_assert(NArrayReal == ParticleType::PTD::NAR, "ParticleTile mismatch in R");
904 static_assert(NArrayInt == ParticleType::PTD::NAI, "ParticleTile mismatch in I");
905 static_assert(0 == ParticleType::StorageParticleType::NReal, "ParticleTile 2 mismatch in R");
906 static_assert(0 == ParticleType::StorageParticleType::NInt, "ParticleTile 2 mismatch in I");
907
908 return m_soa_tile.GetRealData(position_index)[index];
909 }
910 }
911
912 // const
913 RealType pos (int index, int position_index) const &
914 {
915 if constexpr (!ParticleType::is_soa_particle) {
916 return m_aos_tile[index].pos(position_index);
917 } else {
918 return m_soa_tile.GetRealData(position_index)[index];
919 }
920 }
921
922 AoS& GetArrayOfStructs () { invalidateRuntimePtrCaches(); return m_aos_tile; }
923 const AoS& GetArrayOfStructs () const { return m_aos_tile; }
924
925 SoA& GetStructOfArrays () { invalidateRuntimePtrCaches(); return m_soa_tile; }
926 const SoA& GetStructOfArrays () const { return m_soa_tile; }
927
928 bool empty () const { return size() == 0; }
929
934 std::size_t size () const
935 {
936 if constexpr (!ParticleType::is_soa_particle) {
937 return m_aos_tile.size();
938 } else {
939 return m_soa_tile.size();
940 }
941 }
942
947 int numParticles () const
948 {
949 if constexpr (!ParticleType::is_soa_particle) {
950 return m_aos_tile.numParticles();
951 } else {
952 return m_soa_tile.numParticles();
953 }
954 }
955
960 int numRealParticles () const
961 {
962 if constexpr (!ParticleType::is_soa_particle) {
963 return m_aos_tile.numRealParticles();
964 } else {
965 return m_soa_tile.numRealParticles();
966 }
967 }
968
974 {
975 if constexpr (!ParticleType::is_soa_particle) {
976 return m_aos_tile.numNeighborParticles();
977 } else {
978 return m_soa_tile.numNeighborParticles();
979 }
980 }
981
986 int numTotalParticles () const
987 {
988 if constexpr (!ParticleType::is_soa_particle) {
989 return m_aos_tile.numTotalParticles();
990 } else {
991 return m_soa_tile.numTotalParticles();
992 }
993 }
994
995 void setNumNeighbors (int num_neighbors)
996 {
997 invalidateRuntimePtrCaches();
998 if constexpr(!ParticleType::is_soa_particle) {
999 m_aos_tile.setNumNeighbors(num_neighbors);
1000 }
1001 m_soa_tile.setNumNeighbors(num_neighbors);
1002 }
1003
1004 int getNumNeighbors () const
1005 {
1006 if constexpr (!ParticleType::is_soa_particle) {
1007 AMREX_ASSERT( m_soa_tile.getNumNeighbors() == m_aos_tile.getNumNeighbors() );
1008 return m_aos_tile.getNumNeighbors();
1009 } else {
1010 return m_soa_tile.getNumNeighbors();
1011 }
1012 }
1013
1014 void resize (std::size_t count, GrowthStrategy strategy = GrowthStrategy::Poisson)
1015 {
1016 invalidateRuntimePtrCaches();
1017 if constexpr (!ParticleType::is_soa_particle) {
1018 m_aos_tile.resize(count, strategy);
1019 }
1020 m_soa_tile.resize(count, strategy);
1021 }
1022
1024 {
1025 invalidateRuntimePtrCaches();
1026 if constexpr (!ParticleType::is_soa_particle) {
1027 m_aos_tile.reserve(capacity, strategy);
1028 }
1029 m_soa_tile.reserve(capacity, strategy);
1030 }
1031
1035 template <typename T = ParticleType, std::enable_if_t<!T::is_soa_particle, int> = 0>
1036 void push_back (const ParticleType& p)
1037 {
1038 invalidateRuntimePtrCaches();
1039 m_aos_tile().push_back(p);
1040 }
1041
1045 template < int NR = NArrayReal, int NI = NArrayInt,
1046 std::enable_if_t<NR != 0 || NI != 0, int> foo = 0>
1048 {
1049 invalidateRuntimePtrCaches();
1050 auto np = numParticles();
1051
1052 if constexpr (!ParticleType::is_soa_particle) {
1053 m_aos_tile.resize(np+1);
1054 for (int i = 0; i < AMREX_SPACEDIM; ++i) {
1055 m_aos_tile[np].pos(i) = sp.pos(i);
1056 }
1057 for (int i = 0; i < NStructReal; ++i) {
1058 m_aos_tile[np].rdata(i) = sp.rdata(i);
1059 }
1060 m_aos_tile[np].id() = sp.id();
1061 m_aos_tile[np].cpu() = sp.cpu();
1062 for (int i = 0; i < NStructInt; ++i) {
1063 m_aos_tile[np].idata(i) = sp.idata(i);
1064 }
1065 }
1066
1067 m_soa_tile.resize(np+1);
1068 if constexpr (ParticleType::is_soa_particle) {
1069 m_soa_tile.GetIdCPUData()[np] = sp.m_idcpu;
1070 }
1071 auto& arr_rdata = m_soa_tile.GetRealData();
1072 auto& arr_idata = m_soa_tile.GetIntData();
1073 for (int i = 0; i < NArrayReal; ++i) {
1074 arr_rdata[i][np] = sp.rdata(NStructReal+i);
1075 }
1076 for (int i = 0; i < NArrayInt; ++i) {
1077 arr_idata[i][np] = sp.idata(NStructInt+i);
1078 }
1079 }
1080
1085 void push_back_real (int comp, ParticleReal v) {
1086 invalidateRuntimePtrCaches();
1087 m_soa_tile.GetRealData(comp).push_back(v);
1088 }
1089
1094 void push_back_real (const std::array<ParticleReal, NArrayReal>& v) {
1095 for (int i = 0; i < NArrayReal; ++i) {
1096 m_soa_tile.GetRealData(i).push_back(v[i]);
1097 }
1098 }
1099
1104 void push_back_real (int comp, const ParticleReal* beg, const ParticleReal* end) {
1105 invalidateRuntimePtrCaches();
1106 auto it = m_soa_tile.GetRealData(comp).end();
1107 m_soa_tile.GetRealData(comp).insert(it, beg, end);
1108 }
1109
1117
1123 push_back_real(comp, vec.cbegin(), vec.cend());
1124 }
1125
1130 void push_back_real (int comp, std::size_t npar, ParticleReal v) {
1131 invalidateRuntimePtrCaches();
1132 auto new_size = m_soa_tile.GetRealData(comp).size() + npar;
1133 m_soa_tile.GetRealData(comp).resize(new_size, v);
1134 }
1135
1140 void push_back_int (int comp, int v) {
1141 invalidateRuntimePtrCaches();
1142 m_soa_tile.GetIntData(comp).push_back(v);
1143 }
1144
1149 void push_back_int (const std::array<int, NArrayInt>& v) {
1150 for (int i = 0; i < NArrayInt; ++i) {
1151 m_soa_tile.GetIntData(i).push_back(v[i]);
1152 }
1153 }
1154
1159 void push_back_int (int comp, const int* beg, const int* end) {
1160 invalidateRuntimePtrCaches();
1161 auto it = m_soa_tile.GetIntData(comp).end();
1162 m_soa_tile.GetIntData(comp).insert(it, beg, end);
1163 }
1164
1172
1177 void push_back_int (int comp, amrex::Vector<int> const & vec) {
1178 push_back_int(comp, vec.cbegin(), vec.cend());
1179 }
1180
1185 void push_back_int (int comp, std::size_t npar, int v) {
1186 invalidateRuntimePtrCaches();
1187 auto new_size = m_soa_tile.GetIntData(comp).size() + npar;
1188 m_soa_tile.GetIntData(comp).resize(new_size, v);
1189 }
1190
1191 int NumRealComps () const noexcept { return m_soa_tile.NumRealComps(); }
1192
1193 int NumIntComps () const noexcept { return m_soa_tile.NumIntComps(); }
1194
1195 int NumRuntimeRealComps () const noexcept { return m_runtime_r_ptrs.size(); }
1196
1197 int NumRuntimeIntComps () const noexcept { return m_runtime_i_ptrs.size(); }
1198
1200 {
1201 invalidateRuntimePtrCaches();
1202 if constexpr (ParticleType::is_soa_particle) {
1203 GetStructOfArrays().GetIdCPUData().shrink_to_fit();
1204 } else {
1205 m_aos_tile().shrink_to_fit();
1206 }
1207 for (int j = 0; j < NumRealComps(); ++j)
1208 {
1209 auto& rdata = GetStructOfArrays().GetRealData(j);
1210 rdata.shrink_to_fit();
1211 }
1212
1213 for (int j = 0; j < NumIntComps(); ++j)
1214 {
1215 auto& idata = GetStructOfArrays().GetIntData(j);
1216 idata.shrink_to_fit();
1217 }
1218 }
1219
1221 {
1222 Long nbytes = 0;
1223 if constexpr (ParticleType::is_soa_particle) {
1224 nbytes += GetStructOfArrays().GetIdCPUData().capacity() * sizeof(uint64_t);
1225 } else {
1226 nbytes += m_aos_tile().capacity() * sizeof(ParticleType);
1227 }
1228 for (int j = 0; j < NumRealComps(); ++j)
1229 {
1230 auto& rdata = GetStructOfArrays().GetRealData(j);
1231 nbytes += rdata.capacity() * sizeof(ParticleReal);
1232 }
1233
1234 for (int j = 0; j < NumIntComps(); ++j)
1235 {
1236 auto& idata = GetStructOfArrays().GetIntData(j);
1237 nbytes += idata.capacity()*sizeof(int);
1238 }
1239 return nbytes;
1240 }
1241
1243 {
1244 if constexpr (ParticleType::is_soa_particle) {
1245 GetStructOfArrays().GetIdCPUData().swap(other.GetStructOfArrays().GetIdCPUData());
1246 } else {
1247 m_aos_tile().swap(other.GetArrayOfStructs()());
1248 }
1249 for (int j = 0; j < NumRealComps(); ++j)
1250 {
1251 auto& rdata = GetStructOfArrays().GetRealData(j);
1252 rdata.swap(other.GetStructOfArrays().GetRealData(j));
1253 }
1254
1255 for (int j = 0; j < NumIntComps(); ++j)
1256 {
1257 auto& idata = GetStructOfArrays().GetIntData(j);
1258 idata.swap(other.GetStructOfArrays().GetIntData(j));
1259 }
1260 invalidateRuntimePtrCaches();
1261 other.invalidateRuntimePtrCaches();
1262 }
1263
1265 {
1266 refreshRuntimePtrCaches();
1267
1269 if constexpr (!ParticleType::is_soa_particle) {
1270 ptd.m_aos = m_aos_tile().dataPtr();
1271 } else {
1272 ptd.m_aos = nullptr;
1273 }
1274 if constexpr (ParticleType::is_soa_particle) {
1275 ptd.m_idcpu = m_soa_tile.GetIdCPUData().dataPtr();
1276 } else {
1277 ptd.m_idcpu = nullptr;
1278 }
1279 if constexpr(NArrayReal > 0) {
1280 for (int i = 0; i < NArrayReal; ++i) {
1281 ptd.m_rdata[i] = m_soa_tile.GetRealData(i).dataPtr();
1282 }
1283 }
1284 if constexpr(NArrayInt > 0) {
1285 for (int i = 0; i < NArrayInt; ++i) {
1286 ptd.m_idata[i] = m_soa_tile.GetIntData(i).dataPtr();
1287 }
1288 }
1289 ptd.m_size = size();
1290 ptd.m_num_runtime_real = m_runtime_r_ptrs.size();
1291 ptd.m_num_runtime_int = m_runtime_i_ptrs.size();
1292 ptd.m_runtime_rdata = m_runtime_r_ptrs.dataPtr();
1293 ptd.m_runtime_idata = m_runtime_i_ptrs.dataPtr();
1294
1295 return ptd;
1296 }
1297
1299 {
1300 refreshConstRuntimePtrCaches();
1301
1303 if constexpr (!ParticleType::is_soa_particle) {
1304 ptd.m_aos = m_aos_tile().dataPtr();
1305 } else {
1306 ptd.m_aos = nullptr;
1307 }
1308 if constexpr (ParticleType::is_soa_particle) {
1309 ptd.m_idcpu = m_soa_tile.GetIdCPUData().dataPtr();
1310 } else {
1311 ptd.m_idcpu = nullptr;
1312 }
1313 if constexpr(NArrayReal > 0) {
1314 for (int i = 0; i < NArrayReal; ++i) {
1315 ptd.m_rdata[i] = m_soa_tile.GetRealData(i).dataPtr();
1316 }
1317 }
1318 if constexpr(NArrayInt > 0) {
1319 for (int i = 0; i < NArrayInt; ++i) {
1320 ptd.m_idata[i] = m_soa_tile.GetIntData(i).dataPtr();
1321 }
1322 }
1323 ptd.m_size = size();
1324 ptd.m_num_runtime_real = m_runtime_r_cptrs.size();
1325 ptd.m_num_runtime_int = m_runtime_i_cptrs.size();
1326 ptd.m_runtime_rdata = m_runtime_r_cptrs.dataPtr();
1327 ptd.m_runtime_idata = m_runtime_i_cptrs.dataPtr();
1328
1329 return ptd;
1330 }
1331
1335 {
1336 invalidateRuntimePtrCaches();
1337 if constexpr (!ParticleType::is_soa_particle) {
1338 m_aos_tile.collectVectors(pv);
1339 } else {
1341 }
1342 m_soa_tile.collectVectors(idcpuv, rv, iv);
1343 }
1344
1345 static void reserve (std::map<ParticleTile<T_ParticleType,NArrayReal,NArrayInt,Allocator>*, int> const& addsizes)
1346 {
1347 if constexpr (!IsArenaAllocator<Allocator<int>>::value) {
1348 for (auto [p,s] : addsizes) {
1349 p->reserve(p->size()+s);
1350 }
1351 } else {
1352 using PV = std::conditional_t<ParticleType::is_soa_particle,
1358 for (auto [p,s] : addsizes) {
1359 if (s > 0) {
1364 p->collectVectors(pv, idcpuv, rv, iv);
1365 if constexpr (!ParticleType::is_soa_particle) {
1366 for (auto* v : pv) {
1367 pvs.emplace_back(v, s);
1368 }
1369 }
1370 for (auto* v : idcpuv) {
1371 ids.emplace_back(v, s);
1372 }
1373 for (auto* v : rv) {
1374 rvs.emplace_back(v, s);
1375 }
1376 for (auto* v : iv) {
1377 ivs.emplace_back(v, s);
1378 }
1379 }
1380 }
1381
1382 std::sort(pvs.begin(), pvs.end(), [] (auto const& a, auto const& b) {
1383 return (a.first->size() + a.second) >
1384 (b.first->size() + b.second);
1385 });
1386 std::sort(ids.begin(), ids.end(), [] (auto const& a, auto const& b) {
1387 return (a.first->size() + a.second) >
1388 (b.first->size() + b.second);
1389 });
1390 std::sort(rvs.begin(), rvs.end(), [] (auto const& a, auto const& b) {
1391 return (a.first->size() + a.second) >
1392 (b.first->size() + b.second);
1393 });
1394 std::sort(ivs.begin(), ivs.end(), [] (auto const& a, auto const& b) {
1395 return (a.first->size() + a.second) >
1396 (b.first->size() + b.second);
1397 });
1398
1399 // Handle big vectors first
1400 {
1401 int i_pvs = 0, i_ids = 0, i_rvs = 0, i_ivs = 0;
1402 auto n_pvs = int(pvs.size());
1403 auto n_ids = int(ids.size());
1404 auto n_rvs = int(rvs.size());
1405 auto n_ivs = int(ivs.size());
1406 while ((i_pvs < n_pvs) || (i_ids < n_ids) || (i_rvs < n_rvs) ||
1407 (i_ivs < n_ivs)) {
1408 std::size_t nbytes = 0;
1409 int ii = -1;
1410 if (i_pvs < n_pvs) {
1411 std::size_t my_bytes = (pvs[i_pvs].first->size()
1412 + pvs[i_pvs].second) * sizeof(typename PV::value_type);
1413 if (my_bytes > nbytes) {
1414 nbytes = my_bytes;
1415 ii = 0;
1416 }
1417 }
1418 if (i_ids < n_ids) {
1419 std::size_t my_bytes = (ids[i_ids].first->size()
1420 + ids[i_ids].second) * sizeof(typename SoA::IdCPU::value_type);
1421 if (my_bytes > nbytes) {
1422 nbytes = my_bytes;
1423 ii = 1;
1424 }
1425 }
1426 if (i_rvs < n_rvs) {
1427 std::size_t my_bytes = (rvs[i_rvs].first->size()
1428 + rvs[i_rvs].second) * sizeof(typename RealVector::value_type);
1429 if (my_bytes > nbytes) {
1430 nbytes = my_bytes;
1431 ii = 2;
1432 }
1433 }
1434 if (i_ivs < n_ivs) {
1435 std::size_t my_bytes = (ivs[i_ivs].first->size()
1436 + ivs[i_ivs].second) * sizeof(typename IntVector::value_type);
1437 if (my_bytes > nbytes) {
1438 nbytes = my_bytes;
1439 ii = 3;
1440 }
1441 }
1442 if (ii == 0) {
1443 auto [p,s] = pvs[i_pvs++];
1444 p->reserve(p->size() + s);
1445 } else if (ii == 1) {
1446 auto [p,s] = ids[i_ids++];
1447 p->reserve(p->size() + s);
1448 } else if (ii == 2) {
1449 auto [p,s] = rvs[i_rvs++];
1450 p->reserve(p->size() + s);
1451 } else {
1452 auto [p,s] = ivs[i_ivs++];
1453 p->reserve(p->size() + s);
1454 }
1455 }
1456 }
1457 }
1458 }
1459
1460private:
1461
1462 void invalidateRuntimePtrCaches () noexcept
1463 {
1464 m_runtime_ptrs_dirty.store(true, std::memory_order_release);
1465 m_runtime_cptrs_dirty.store(true, std::memory_order_release);
1466 }
1467
1468 void refreshRuntimePtrCaches ()
1469 {
1470 if (!m_runtime_ptrs_dirty.load(std::memory_order_acquire)) {
1471 return;
1472 }
1473#if defined(AMREX_USE_OMP)
1474#pragma omp critical (amrex_particle_tile_data_cache)
1475#endif
1476 {
1477 if (m_runtime_ptrs_dirty.load(std::memory_order_relaxed)) {
1478 m_runtime_r_ptrs.resize(m_soa_tile.NumRealComps() - NArrayReal);
1479 m_runtime_i_ptrs.resize(m_soa_tile.NumIntComps() - NArrayInt);
1480#ifdef AMREX_USE_GPU
1481 bool copy_real = false;
1482 m_h_runtime_r_ptrs.resize(m_soa_tile.NumRealComps() - NArrayReal, nullptr);
1483 for (std::size_t i = 0; i < m_h_runtime_r_ptrs.size(); ++i) {
1484 if (m_h_runtime_r_ptrs[i] != m_soa_tile.GetRealData(i + NArrayReal).dataPtr()) {
1485 m_h_runtime_r_ptrs[i] = m_soa_tile.GetRealData(i + NArrayReal).dataPtr();
1486 copy_real = true;
1487 }
1488 }
1489 if (copy_real) {
1490 Gpu::htod_memcpy_async(m_runtime_r_ptrs.data(), m_h_runtime_r_ptrs.data(),
1491 m_h_runtime_r_ptrs.size()*sizeof(ParticleReal*));
1492 }
1493
1494 bool copy_int = false;
1495 m_h_runtime_i_ptrs.resize(m_soa_tile.NumIntComps() - NArrayInt, nullptr);
1496 for (std::size_t i = 0; i < m_h_runtime_i_ptrs.size(); ++i) {
1497 if (m_h_runtime_i_ptrs[i] != m_soa_tile.GetIntData(i + NArrayInt).dataPtr()) {
1498 m_h_runtime_i_ptrs[i] = m_soa_tile.GetIntData(i + NArrayInt).dataPtr();
1499 copy_int = true;
1500 }
1501 }
1502 if (copy_int) {
1503 Gpu::htod_memcpy_async(m_runtime_i_ptrs.data(), m_h_runtime_i_ptrs.data(),
1504 m_h_runtime_i_ptrs.size()*sizeof(int*));
1505 }
1506
1507 if (copy_real || copy_int) {
1509 }
1510#else
1511 for (std::size_t i = 0; i < m_runtime_r_ptrs.size(); ++i) {
1512 m_runtime_r_ptrs[i] = m_soa_tile.GetRealData(i + NArrayReal).dataPtr();
1513 }
1514
1515 for (std::size_t i = 0; i < m_runtime_i_ptrs.size(); ++i) {
1516 m_runtime_i_ptrs[i] = m_soa_tile.GetIntData(i + NArrayInt).dataPtr();
1517 }
1518#endif
1519 m_runtime_ptrs_dirty.store(false, std::memory_order_release);
1520 }
1521 }
1522 }
1523
1524 void refreshConstRuntimePtrCaches () const
1525 {
1526 if (!m_runtime_cptrs_dirty.load(std::memory_order_acquire)) {
1527 return;
1528 }
1529#if defined(AMREX_USE_OMP)
1530#pragma omp critical (amrex_const_particle_tile_data_cache)
1531#endif
1532 {
1533 if (m_runtime_cptrs_dirty.load(std::memory_order_relaxed)) {
1534 m_runtime_r_cptrs.resize(m_soa_tile.NumRealComps() - NArrayReal);
1535 m_runtime_i_cptrs.resize(m_soa_tile.NumIntComps() - NArrayInt);
1536#ifdef AMREX_USE_GPU
1537 bool copy_real = false;
1538 m_h_runtime_r_cptrs.resize(m_soa_tile.NumRealComps() - NArrayReal, nullptr);
1539 for (std::size_t i = 0; i < m_h_runtime_r_cptrs.size(); ++i) {
1540 if (m_h_runtime_r_cptrs[i] != m_soa_tile.GetRealData(i + NArrayReal).dataPtr()) {
1541 m_h_runtime_r_cptrs[i] = m_soa_tile.GetRealData(i + NArrayReal).dataPtr();
1542 copy_real = true;
1543 }
1544 }
1545 if (copy_real) {
1546 Gpu::htod_memcpy_async(m_runtime_r_cptrs.data(), m_h_runtime_r_cptrs.data(),
1547 m_h_runtime_r_cptrs.size()*sizeof(ParticleReal*));
1548 }
1549
1550 bool copy_int = false;
1551 m_h_runtime_i_cptrs.resize(m_soa_tile.NumIntComps() - NArrayInt, nullptr);
1552 for (std::size_t i = 0; i < m_h_runtime_i_cptrs.size(); ++i) {
1553 if (m_h_runtime_i_cptrs[i] != m_soa_tile.GetIntData(i + NArrayInt).dataPtr()) {
1554 m_h_runtime_i_cptrs[i] = m_soa_tile.GetIntData(i + NArrayInt).dataPtr();
1555 copy_int = true;
1556 }
1557 }
1558 if (copy_int) {
1559 Gpu::htod_memcpy_async(m_runtime_i_cptrs.data(), m_h_runtime_i_cptrs.data(),
1560 m_h_runtime_i_cptrs.size()*sizeof(int*));
1561 }
1562
1563 if (copy_real || copy_int) {
1565 }
1566#else
1567 for (std::size_t i = 0; i < m_runtime_r_cptrs.size(); ++i) {
1568 m_runtime_r_cptrs[i] = m_soa_tile.GetRealData(i + NArrayReal).dataPtr();
1569 }
1570
1571 for (std::size_t i = 0; i < m_runtime_i_cptrs.size(); ++i) {
1572 m_runtime_i_cptrs[i] = m_soa_tile.GetIntData(i + NArrayInt).dataPtr();
1573 }
1574#endif
1575 m_runtime_cptrs_dirty.store(false, std::memory_order_release);
1576 }
1577 }
1578 }
1579
1580 AoS m_aos_tile;
1581 SoA m_soa_tile;
1582
1583 bool m_defined = false;
1584
1586 amrex::PODVector<int*, Allocator<int*> > m_runtime_i_ptrs;
1587
1589 mutable amrex::PODVector<const int*, Allocator<const int*> >m_runtime_i_cptrs;
1590
1591 amrex::Gpu::HostVector<ParticleReal*> m_h_runtime_r_ptrs;
1592 amrex::Gpu::HostVector<int*> m_h_runtime_i_ptrs;
1593
1594 mutable amrex::Gpu::HostVector<const ParticleReal*> m_h_runtime_r_cptrs;
1595 mutable amrex::Gpu::HostVector<const int*> m_h_runtime_i_cptrs;
1596
1597 RuntimePtrCacheDirtyFlag m_runtime_ptrs_dirty;
1598 mutable RuntimePtrCacheDirtyFlag m_runtime_cptrs_dirty;
1599};
1600
1601} // namespace amrex
1602
1603#endif // AMREX_PARTICLETILE_H_
#define AMREX_ALWAYS_ASSERT_WITH_MESSAGE(EX, MSG)
Definition AMReX_BLassert.H:49
#define AMREX_ASSERT(EX)
Definition AMReX_BLassert.H:38
#define AMREX_FORCE_INLINE
Definition AMReX_Extension.H:119
#define AMREX_RESTRICT
Definition AMReX_Extension.H:32
#define AMREX_GPU_HOST_DEVICE
Definition AMReX_GpuQualifiers.H:20
#define AMREX_D_DECL(a, b, c)
Definition AMReX_SPACE.H:171
A virtual base class for objects that manage their own dynamic memory allocation.
Definition AMReX_Arena.H:132
Definition AMReX_ArrayOfStructs.H:13
Dynamically allocated vector for trivially copyable data.
Definition AMReX_PODVector.H:308
This class is a thin wrapper around std::vector. Unlike vector, Vector::operator[] provides bound che...
Definition AMReX_Vector.H:28
Long size() const noexcept
Definition AMReX_Vector.H:53
amrex_particle_real ParticleReal
Floating Point Type for Particles.
Definition AMReX_REAL.H:90
amrex_long Long
Definition AMReX_INT.H:30
void streamSynchronize() noexcept
Definition AMReX_GpuDevice.H:310
void htod_memcpy_async(void *p_d, const void *p_h, const std::size_t sz) noexcept
Definition AMReX_GpuDevice.H:421
constexpr Long LastParticleID
Definition AMReX_Particle.H:21
Definition AMReX_Amr.cpp:50
__host__ __device__ void ignore_unused(const Ts &...)
This shuts up the compiler about unused variables.
Definition AMReX.H:139
amrex::ArenaAllocator< T > DefaultAllocator
Definition AMReX_GpuAllocators.H:205
GrowthStrategy
Definition AMReX_PODVector.H:250
RealVectND< 3 > RealVect
Definition AMReX_ParmParse.H:36
void Abort(const std::string &msg)
Print out message to cerr and exit via abort().
Definition AMReX.cpp:241
const int[]
Definition AMReX_BLProfiler.cpp:1664
__host__ __device__ Dim3 end(BoxND< dim > const &box) noexcept
Definition AMReX_Box.H:2015
Definition AMReX_Particle.H:327
Definition AMReX_Particle.H:301
static constexpr bool is_particle_tile_data
Definition AMReX_ParticleTile.H:530
static constexpr int NAI
Definition AMReX_ParticleTile.H:519
int IntType
Definition AMReX_ParticleTile.H:523
GpuArray< const int *, NArrayInt > m_idata
Definition AMReX_ParticleTile.H:540
__host__ __device__ decltype(auto) idcpu(const int index) const &
Definition AMReX_ParticleTile.H:573
__host__ __device__ const int * idata(const int attribute_index) const
Definition AMReX_ParticleTile.H:589
Long m_size
Definition AMReX_ParticleTile.H:532
T_ParticleType ParticleType
Definition AMReX_ParticleTile.H:520
static constexpr int NStructReal
Definition AMReX_ParticleTile.H:525
__host__ __device__ void packParticleData(char *buffer, int src_index, Long dst_offset, const int *comm_real, const int *comm_int) const noexcept
Definition AMReX_ParticleTile.H:610
int m_num_runtime_real
Definition AMReX_ParticleTile.H:604
static constexpr int NStructInt
Definition AMReX_ParticleTile.H:526
const int *__restrict__ *__restrict__ m_runtime_idata
Definition AMReX_ParticleTile.H:607
ParticleReal RealType
Definition AMReX_ParticleTile.H:522
__host__ __device__ decltype(auto) pos(const int dir, const int index) const &
Definition AMReX_ParticleTile.H:543
__host__ __device__ decltype(auto) cpu(const int index) const &
Definition AMReX_ParticleTile.H:563
int m_num_runtime_int
Definition AMReX_ParticleTile.H:605
std::conditional_t< T_ParticleType::is_soa_particle, void const *__restrict__, ParticleType const *__restrict__ > AOS_PTR
Definition AMReX_ParticleTile.H:535
T_ParticleType const & ParticleRefType
Definition AMReX_ParticleTile.H:521
static constexpr int NAR
Definition AMReX_ParticleTile.H:518
AOS_PTR m_aos
Definition AMReX_ParticleTile.H:536
const uint64_t * m_idcpu
Definition AMReX_ParticleTile.H:538
__host__ __device__ SuperParticleType getSuperParticle(int index) const noexcept
Definition AMReX_ParticleTile.H:669
__host__ __device__ const ParticleReal * rdata(const int attribute_index) const
Definition AMReX_ParticleTile.H:583
GpuArray< const ParticleReal *, NArrayReal > m_rdata
Definition AMReX_ParticleTile.H:539
const ParticleReal *__restrict__ *__restrict__ m_runtime_rdata
Definition AMReX_ParticleTile.H:606
Definition AMReX_ParticleTile.H:327
__host__ __device__ ConstParticleIDWrapper id() const
Definition AMReX_ParticleTile.H:353
static constexpr int NArrayReal
Definition AMReX_ParticleTile.H:328
ParticleReal RealType
Definition AMReX_ParticleTile.H:336
__host__ __device__ ConstSoAParticle(ConstPTD const &ptd, long i)
Definition AMReX_ParticleTile.H:340
static constexpr int NArrayInt
Definition AMReX_ParticleTile.H:329
static constexpr bool is_rtsoa_particle
Definition AMReX_ParticleTile.H:333
static void NextID(Long nextid)
Reset on restart.
static constexpr bool is_constsoa_particle
Definition AMReX_ParticleTile.H:334
static Long UnprotectedNextID()
This version can only be used inside omp critical.
__host__ __device__ const RealType & pos(int position_index) const &
Definition AMReX_ParticleTile.H:361
__host__ __device__ RealVect pos() const &
Definition AMReX_ParticleTile.H:358
__host__ __device__ ConstParticleCPUWrapper cpu() const
Definition AMReX_ParticleTile.H:350
int IntType
Definition AMReX_ParticleTile.H:337
Fixed-size array that can be used on GPU.
Definition AMReX_Array.H:43
Definition AMReX_GpuAllocators.H:173
Definition AMReX_GpuAllocators.H:184
uint64_t m_idcpu
Definition AMReX_Particle.H:359
Definition AMReX_Particle.H:259
Definition AMReX_Particle.H:154
Definition AMReX_ParticleTile.H:34
__host__ __device__ SuperParticleType getSuperParticle(int index) const noexcept
Definition AMReX_ParticleTile.H:242
T_ParticleType & ParticleRefType
Definition AMReX_ParticleTile.H:39
__host__ __device__ decltype(auto) cpu(const int index) const &
Definition AMReX_ParticleTile.H:87
uint64_t * m_idcpu
Definition AMReX_ParticleTile.H:57
GpuArray< ParticleReal *, NAR > m_rdata
Definition AMReX_ParticleTile.H:58
__host__ __device__ void unpackParticleData(const char *buffer, Long src_offset, int dst_index, const int *comm_real, const int *comm_int) const noexcept
Definition AMReX_ParticleTile.H:183
__host__ __device__ decltype(auto) idcpu(const int index) const &
Definition AMReX_ParticleTile.H:97
__host__ __device__ ParticleReal * rdata(const int attribute_index) const
Definition AMReX_ParticleTile.H:107
__host__ __device__ void packParticleData(char *buffer, int src_index, std::size_t dst_offset, const int *comm_real, const int *comm_int) const noexcept
Definition AMReX_ParticleTile.H:129
static constexpr int NStructInt
Definition AMReX_ParticleTile.H:45
GpuArray< int *, NAI > m_idata
Definition AMReX_ParticleTile.H:59
ParticleReal RealType
Definition AMReX_ParticleTile.H:41
__host__ __device__ decltype(auto) pos(const int dir, const int index) const &
Definition AMReX_ParticleTile.H:67
T_ParticleType ParticleType
Definition AMReX_ParticleTile.H:38
std::conditional_t< T_ParticleType::is_soa_particle, void *__restrict__, ParticleType *__restrict__ > AOS_PTR
Definition AMReX_ParticleTile.H:54
int m_num_runtime_int
Definition AMReX_ParticleTile.H:62
Long m_size
Definition AMReX_ParticleTile.H:51
static constexpr int NAR
Definition AMReX_ParticleTile.H:35
int IntType
Definition AMReX_ParticleTile.H:42
ParticleReal *__restrict__ *__restrict__ m_runtime_rdata
Definition AMReX_ParticleTile.H:63
int m_num_runtime_real
Definition AMReX_ParticleTile.H:61
static constexpr bool is_particle_tile_data
Definition AMReX_ParticleTile.H:49
__host__ __device__ int * idata(const int attribute_index) const
Definition AMReX_ParticleTile.H:113
AOS_PTR m_aos
Definition AMReX_ParticleTile.H:55
static constexpr int NAI
Definition AMReX_ParticleTile.H:36
int *__restrict__ *__restrict__ m_runtime_idata
Definition AMReX_ParticleTile.H:64
__host__ __device__ void setSuperParticle(const SuperParticleType &sp, int index) const noexcept
Definition AMReX_ParticleTile.H:289
static constexpr int NStructReal
Definition AMReX_ParticleTile.H:44
Definition AMReX_ParticleTile.H:764
typename ParticleType::StorageParticleType StorageParticleType
Definition AMReX_ParticleTile.H:790
int NumRealComps() const noexcept
Definition AMReX_ParticleTile.H:1191
void push_back_real(int comp, amrex::Vector< amrex::ParticleReal > const &vec)
Definition AMReX_ParticleTile.H:1122
int NumIntComps() const noexcept
Definition AMReX_ParticleTile.H:1193
typename ParticleType::RealType RealType
Definition AMReX_ParticleTile.H:771
ParticleTile()=default
int getNumNeighbors() const
Definition AMReX_ParticleTile.H:1004
typename AoS::ParticleVector ParticleVector
Definition AMReX_ParticleTile.H:782
void push_back(const ParticleType &p)
Definition AMReX_ParticleTile.H:1036
ParticleTile(ParticleTile const &)=delete
std::conditional_t< ParticleType::is_soa_particle, StructOfArrays< NArrayReal, NArrayInt, Allocator, true >, StructOfArrays< NArrayReal, NArrayInt, Allocator, false > > SoA
Definition AMReX_ParticleTile.H:787
const SoA & GetStructOfArrays() const
Definition AMReX_ParticleTile.H:926
static constexpr int NAI
Definition AMReX_ParticleTile.H:770
ParticleTile(ParticleTile &&) noexcept=default
void push_back_real(int comp, const ParticleReal *beg, const ParticleReal *end)
Definition AMReX_ParticleTile.H:1104
static constexpr int NStructInt
Definition AMReX_ParticleTile.H:774
void setNumNeighbors(int num_neighbors)
Definition AMReX_ParticleTile.H:995
Long capacity() const
Definition AMReX_ParticleTile.H:1220
int numTotalParticles() const
Returns the total number of particles, real and neighbor.
Definition AMReX_ParticleTile.H:986
std::size_t size() const
Returns the total number of particles (real and neighbor)
Definition AMReX_ParticleTile.H:934
static constexpr bool has_polymorphic_allocator
Definition AMReX_ParticleTile.H:795
ParticleTileDataType getParticleTileData()
Definition AMReX_ParticleTile.H:1264
void reserve(std::size_t capacity, GrowthStrategy strategy=GrowthStrategy::Poisson)
Definition AMReX_ParticleTile.H:1023
void push_back(const SuperParticleType &sp)
Definition AMReX_ParticleTile.H:1047
int numNeighborParticles() const
Returns the number of neighbor particles (excluding reals)
Definition AMReX_ParticleTile.H:973
~ParticleTile()=default
const AoS & GetArrayOfStructs() const
Definition AMReX_ParticleTile.H:923
static constexpr int NAR
Definition AMReX_ParticleTile.H:769
ConstParticleTileDataType getConstParticleTileData() const
Definition AMReX_ParticleTile.H:1298
void shrink_to_fit()
Definition AMReX_ParticleTile.H:1199
T_ParticleType ParticleType
Definition AMReX_ParticleTile.H:768
int numParticles() const
Returns the number of real particles (excluding neighbors)
Definition AMReX_ParticleTile.H:947
void push_back_int(int comp, amrex::Vector< int > const &vec)
Definition AMReX_ParticleTile.H:1177
void resize(std::size_t count, GrowthStrategy strategy=GrowthStrategy::Poisson)
Definition AMReX_ParticleTile.H:1014
void swap(ParticleTile< ParticleType, NArrayReal, NArrayInt, Allocator > &other) noexcept
Definition AMReX_ParticleTile.H:1242
void push_back_int(int comp, amrex::Vector< int >::const_iterator beg, amrex::Vector< int >::const_iterator end)
Definition AMReX_ParticleTile.H:1169
void push_back_real(const std::array< ParticleReal, NArrayReal > &v)
Definition AMReX_ParticleTile.H:1094
int NumRuntimeRealComps() const noexcept
Definition AMReX_ParticleTile.H:1195
void collectVectors(Vector< ParticleVector * > &pv, Vector< typename SoA::IdCPU * > &idcpuv, Vector< RealVector * > &rv, Vector< IntVector * > &iv)
Definition AMReX_ParticleTile.H:1332
AoS & GetArrayOfStructs()
Definition AMReX_ParticleTile.H:922
RealType & pos(int index, int position_index) &
Definition AMReX_ParticleTile.H:899
typename SoA::IntVector IntVector
Definition AMReX_ParticleTile.H:789
void push_back_int(const std::array< int, NArrayInt > &v)
Definition AMReX_ParticleTile.H:1149
void push_back_real(int comp, amrex::Vector< amrex::ParticleReal >::const_iterator beg, amrex::Vector< amrex::ParticleReal >::const_iterator end)
Definition AMReX_ParticleTile.H:1114
Allocator< T > AllocatorType
Definition AMReX_ParticleTile.H:766
int NumRuntimeIntComps() const noexcept
Definition AMReX_ParticleTile.H:1197
bool empty() const
Definition AMReX_ParticleTile.H:928
void push_back_int(int comp, int v)
Definition AMReX_ParticleTile.H:1140
RealType pos(int index, int position_index) const &
Definition AMReX_ParticleTile.H:913
decltype(auto) cpu(int index) &
Definition AMReX_ParticleTile.H:881
void define(int a_num_runtime_real, int a_num_runtime_int, std::vector< std::string > *soa_rdata_names=nullptr, std::vector< std::string > *soa_idata_names=nullptr, Arena *a_arena=nullptr)
Definition AMReX_ParticleTile.H:810
SoA & GetStructOfArrays()
Definition AMReX_ParticleTile.H:925
void push_back_int(int comp, std::size_t npar, int v)
Definition AMReX_ParticleTile.H:1185
void push_back_real(int comp, std::size_t npar, ParticleReal v)
Definition AMReX_ParticleTile.H:1130
void push_back_int(int comp, const int *beg, const int *end)
Definition AMReX_ParticleTile.H:1159
typename SoA::RealVector RealVector
Definition AMReX_ParticleTile.H:788
int numRealParticles() const
Returns the number of real particles (excluding neighbors)
Definition AMReX_ParticleTile.H:960
std::conditional_t< ParticleType::is_soa_particle, ThisParticleTileHasNoAoS, ArrayOfStructs< ParticleType, Allocator > > AoS
Definition AMReX_ParticleTile.H:781
static constexpr int NStructReal
Definition AMReX_ParticleTile.H:773
void push_back_real(int comp, ParticleReal v)
Definition AMReX_ParticleTile.H:1085
static void reserve(std::map< ParticleTile< T_ParticleType, NArrayReal, NArrayInt, Allocator > *, int > const &addsizes)
Definition AMReX_ParticleTile.H:1345
The struct used to store particles.
Definition AMReX_Particle.H:405
__host__ __device__ RealVect pos() const &
Definition AMReX_Particle.H:456
__host__ __device__ int & idata(int index) &
Definition AMReX_Particle.H:545
__host__ __device__ ParticleCPUWrapper cpu() &
Definition AMReX_Particle.H:424
__host__ __device__ ParticleIDWrapper id() &
Definition AMReX_Particle.H:427
__host__ __device__ RealType & rdata(int index) &
Definition AMReX_Particle.H:474
Definition AMReX_ParticleTile.H:722
RuntimePtrCacheDirtyFlag(RuntimePtrCacheDirtyFlag &&) noexcept
Definition AMReX_ParticleTile.H:731
RuntimePtrCacheDirtyFlag() noexcept=default
void store(bool value, std::memory_order order=std::memory_order_seq_cst) noexcept
Definition AMReX_ParticleTile.H:747
bool load(std::memory_order order=std::memory_order_seq_cst) const noexcept
Definition AMReX_ParticleTile.H:752
RuntimePtrCacheDirtyFlag & operator=(RuntimePtrCacheDirtyFlag const &) noexcept
Definition AMReX_ParticleTile.H:735
Definition AMReX_Particle.H:388
Definition AMReX_ParticleTile.H:391
static constexpr int NArrayReal
Definition AMReX_ParticleTile.H:392
ParticleTileData< SoAParticleBase, NArrayReal, NArrayInt > PTD
Definition AMReX_ParticleTile.H:395
__host__ __device__ uint64_t & idcpu() &
Definition AMReX_ParticleTile.H:421
static Long UnprotectedNextID()
This version can only be used inside omp critical.
Definition AMReX_ParticleTile.H:499
__host__ __device__ ConstParticleCPUWrapper cpu() const &
Definition AMReX_ParticleTile.H:424
static Long the_next_id
Definition AMReX_ParticleTile.H:410
static constexpr int NArrayInt
Definition AMReX_ParticleTile.H:393
__host__ __device__ const uint64_t & idcpu() const &
Definition AMReX_ParticleTile.H:430
__host__ __device__ RealVect pos() const &
Definition AMReX_ParticleTile.H:435
ParticleReal RealType
Definition AMReX_ParticleTile.H:401
__host__ __device__ ParticleCPUWrapper cpu() &
Definition AMReX_ParticleTile.H:415
__host__ __device__ ParticleIDWrapper id() &
Definition AMReX_ParticleTile.H:418
static constexpr bool is_constsoa_particle
Definition AMReX_ParticleTile.H:398
__host__ __device__ RealType & pos(int position_index) &
Definition AMReX_ParticleTile.H:438
static constexpr bool is_rtsoa_particle
Definition AMReX_ParticleTile.H:397
int IntType
Definition AMReX_ParticleTile.H:402
__host__ __device__ SoAParticle(PTD const &ptd, long i)
Definition AMReX_ParticleTile.H:405
__host__ __device__ ConstParticleIDWrapper id() const &
Definition AMReX_ParticleTile.H:427
static Long NextID()
Definition AMReX_ParticleTile.H:478
__host__ __device__ RealType pos(int position_index) const &
Definition AMReX_ParticleTile.H:445
Definition AMReX_StructOfArrays.H:20
Definition AMReX_ParticleTile.H:717
Definition AMReX_ParticleTile.H:715
Definition AMReX_MakeParticle.H:13