Realm
A distributed, event-based tasking library
Loading...
Searching...
No Matches
transfer.h
Go to the documentation of this file.
1/*
2 * Copyright 2025 Stanford University, NVIDIA Corporation
3 * SPDX-License-Identifier: Apache-2.0
4 *
5 * Licensed under the Apache License, Version 2.0 (the "License");
6 * you may not use this file except in compliance with the License.
7 * You may obtain a copy of the License at
8 *
9 * http://www.apache.org/licenses/LICENSE-2.0
10 *
11 * Unless required by applicable law or agreed to in writing, software
12 * distributed under the License is distributed on an "AS IS" BASIS,
13 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14 * See the License for the specific language governing permissions and
15 * limitations under the License.
16 */
17
18// data transfer (a.k.a. dma) engine for Realm
19
20#ifndef REALM_TRANSFER_H
21#define REALM_TRANSFER_H
22
23#include "realm/event.h"
24#include "realm/memory.h"
25#include "realm/indexspace.h"
26#include "realm/atomics.h"
27#include "realm/network.h"
28#include "realm/operation.h"
30#include "realm/profiling.h"
31
32namespace Realm {
33
34 // the data transfer engine has too much code to have it all be templated on the
35 // type of IndexSpace that is driving the transfer, so we need a widget that
36 // can hold an arbitrary IndexSpace and dispatch based on its type
37
38 class XferDes;
39 class AddressList;
40
// Abstract iterator interface used by the transfer engine.
// reset, done, step, step_custom, confirm_step, cancel_step and get_addresses
// are pure virtual; request_metadata, set_indirect_input_port,
// get_base_offset and get_address_size are declared as ordinary virtuals.
42 public:
// static factory templated on the deserializer type S
// NOTE(review): ownership of the returned pointer is not visible in this
// header - confirm against the definition
43 template <typename S>
44 static TransferIterator *deserialize_new(S &deserializer);
45
46 virtual ~TransferIterator(void);
47
48 // must be called (and waited on) before iteration is possible
49 virtual Event request_metadata(void);
50
51 // specify the xd port used for indirect address flow control, if any
52 virtual void set_indirect_input_port(XferDes *xd, int port_idx,
53 TransferIterator *inner_iter);
54
55 virtual void reset(void) = 0;
56 virtual bool done(void) = 0;
57 virtual size_t get_base_offset(void) const;
58 virtual size_t get_address_size(void) const;
59
60 // flag bits to control iterators
// SRC_* flags use bits 0-2 and DST_* flags use bits 8-10;
// DST_FLAGMASK (0xff00) selects bits 8-15
61 enum
62 {
63 SRC_PARTIAL_OK = (1 << 0),
64 SRC_LINES_OK = (1 << 1),
65 SRC_PLANES_OK = (1 << 2),
67
68 DST_PARTIAL_OK = (1 << 8),
69 DST_LINES_OK = (1 << 9),
70 DST_PLANES_OK = (1 << 10),
71 DST_FLAGMASK = 0xff00,
72
76 };
77
// output record filled in by step(); the per-field comments below relate
// each count to the flag that permits a value other than 1
78 struct AddressInfo {
80 size_t bytes_per_chunk; // multiple of sizeof(T) unless PARTIAL_OK
81 size_t num_lines; // guaranteed to be 1 unless LINES_OK (i.e. 2D)
83 size_t num_planes; // guaranteed to be 1 unless PLANES_OK (i.e. 3D)
85 };
86
87 // a custom address info interface for cases where linearized
88 // addresses are not suitable
90 protected:
// protected destructor: the interface cannot be deleted through by
// outside code
91 virtual ~AddressInfoCustom() {}
92
93 public:
94 // offers an N-D rectangle from a given piece of a given instance,
95 // along with a specified dimension order
96 // return value is how many dimensions are accepted (0 = single
97 // point), which can be less than the input if the target has
98 // strict ordering rules
// lo, hi and order are arrays of ndims entries (see the inline size hints)
99 virtual int set_rect(const RegionInstanceImpl *inst,
100 const InstanceLayoutPieceBase *piece, size_t field_size,
101 size_t field_offset, int ndims, const int64_t lo[/*ndims*/],
102 const int64_t hi[/*ndims*/], const int order[/*ndims*/]) = 0;
103 };
104
105 // if a step is tentative, it must either be confirmed or cancelled before
106 // another one is possible
// NOTE(review): the size_t result is presumably the number of bytes covered
// by the step (bounded by max_bytes) - confirm against the implementations
107 virtual size_t step(size_t max_bytes, AddressInfo &info, unsigned flags,
108 bool tentative = false) = 0;
// same contract as step(), but reports addresses through the
// AddressInfoCustom callback interface and takes no flags argument
109 virtual size_t step_custom(size_t max_bytes, AddressInfoCustom &info,
110 bool tentative = false) = 0;
111
// resolve an outstanding tentative step (see the comment above step)
112 virtual void confirm_step(void) = 0;
113 virtual void cancel_step(void) = 0;
114
// NOTE(review): meaning of the bool result and of the nonaffine out-parameter
// is not stated in this header - confirm before relying on it
115 virtual bool get_addresses(AddressList &addrlist,
116 const InstanceLayoutPieceBase *&nonaffine) = 0;
117 };
118
120 //
121 // class TransferIteratorBase<N,T>
122 //
123
// Dimension-templated iterator base (N dimensions, coordinate type T).
// It redeclares the stepping and address virtuals of TransferIterator and
// leaves get_next_rect() pure virtual, so subclasses only have to say which
// rectangle and field come next.
124 template <int N, typename T>
126 protected:
127 TransferIteratorBase(void); // used by deserializer
128 public:
// _dim_order is an array parameter and therefore adjusts to const int *;
// the [N] documents the expected length but is not enforced by the compiler
129 TransferIteratorBase(RegionInstanceImpl *_inst_impl, const int _dim_order[N]);
130
131 virtual Event request_metadata(void);
132
133 virtual void reset(void);
134 virtual bool done(void);
135 virtual size_t step(size_t max_bytes, AddressInfo &info, unsigned flags,
136 bool tentative = false);
137 virtual size_t step_custom(size_t max_bytes, AddressInfoCustom &info,
138 bool tentative = false);
139
140 virtual void confirm_step(void);
141 virtual void cancel_step(void);
142
143 virtual size_t get_base_offset(void) const;
144
145 virtual bool get_addresses(AddressList &addrlist,
146 const InstanceLayoutPieceBase *&nonaffine);
147
148 protected:
// subclass hook: reports the next rectangle together with the field id,
// field offset and field size through the reference parameters
// NOTE(review): the bool result presumably signals whether a rectangle was
// produced - confirm against the implementations
149 virtual bool get_next_rect(Rect<N, T> &r, FieldID &fid, size_t &offset,
150 size_t &fsize) = 0;
151
157 bool carry;
158
160 // InstanceLayout<N, T> *inst_layout;
// one entry per dimension; filled from the _dim_order constructor argument
// (presumably - the constructor body is not visible here)
163 int dim_order[N];
164 };
165
167 //
168 // class TransferIteratorIndexSpace<N,T>
169 //
170
// Iterator driven by an index space. It can be built either from an
// IndexSpace<N, T> or from explicit bounds plus a sparsity map
// implementation pointer, and supports serialize/deserialize_new.
171 template <int N, typename T>
173 protected:
174 TransferIteratorIndexSpace(void); // used by deserializer
175 public:
// construct from a complete index space
176 TransferIteratorIndexSpace(const int _dim_order[N],
177 const std::vector<FieldID> &_fields,
178 const std::vector<size_t> &_fld_offsets,
179 const std::vector<size_t> &_fld_sizes,
180 RegionInstanceImpl *_inst_impl,
181 const IndexSpace<N, T> &_is);
182
// construct from bounds and a sparsity map implementation
// NOTE(review): whether _sparsity_impl may be null is not visible here
183 TransferIteratorIndexSpace(const int _dim_order[N],
184 const std::vector<FieldID> &_fields,
185 const std::vector<size_t> &_fld_offsets,
186 const std::vector<size_t> &_fld_sizes,
187 RegionInstanceImpl *_inst_impl, const Rect<N, T> &_bounds,
188 SparsityMapImpl<N, T> *_sparsity_impl);
189
// static factory templated on the deserializer type S
190 template <typename S>
191 static TransferIterator *deserialize_new(S &deserializer);
192
194
195 virtual Event request_metadata(void);
196
197 virtual void reset(void);
198
202
// writes this iterator to the serializer; counterpart of deserialize_new
// NOTE(review): the bool result is presumably a success flag - confirm
203 template <typename S>
204 bool serialize(S &serializer) const;
205
206 protected:
207 void reset_internal(void);
208 virtual bool get_next_rect(Rect<N, T> &r, FieldID &fid, size_t &offset,
209 size_t &fsize);
210
// NOTE(review): fields, fld_offsets and fld_sizes look like parallel arrays
// indexed by field_idx - confirm against get_next_rect
215 std::vector<FieldID> fields;
216 std::vector<size_t> fld_offsets, fld_sizes;
217 size_t field_idx{0};
218 };
219
// Iterator for indirect (gather/scatter) transfers. It overrides
// set_indirect_input_port to receive the xd port used for indirect address
// flow control, and supports serialize/deserialize_new.
220 template <int N, typename T>
222 protected:
223 TransferIteratorIndirect(void); // used by deserializer
224 public:
226 const std::vector<FieldID> &_fields,
227 const std::vector<size_t> &_fld_offsets,
228 const std::vector<size_t> &_fld_sizes);
229
// static factory templated on the deserializer type S
230 template <typename S>
231 static TransferIterator *deserialize_new(S &deserializer);
232
234
235 virtual Event request_metadata(void);
236
237 // specify the xd port used for indirect address flow control, if any
238 virtual void set_indirect_input_port(XferDes *xd, int port_idx,
239 TransferIterator *inner_iter);
240 virtual void reset(void);
241
245
// writes this iterator to the serializer; counterpart of deserialize_new
246 template <typename S>
247 bool serialize(S &serializer) const;
248
249 protected:
250 virtual bool get_next_rect(Rect<N, T> &r, FieldID &fid, size_t &offset,
251 size_t &fsize);
252
255 intptr_t addrs_mem_base{0};
256 bool can_merge{true};
// compile-time capacity used to size the points[] member
257 static constexpr size_t MAX_POINTS = 64;
// NOTE(review): presumably point_pos is the read cursor and num_points the
// number of valid buffered points - confirm against get_next_rect
259 size_t point_pos{0}, num_points{0};
260 std::vector<FieldID> fields;
261 std::vector<size_t> fld_offsets, fld_sizes;
264 };
265
// Abstract description of the domain a transfer covers. Apart from the
// destructor and the static factories, every member function shown here is
// pure virtual.
267 protected:
269
270 public:
// static factory templated on the deserializer type S
271 template <typename S>
272 static TransferDomain *deserialize_new(S &deserializer);
273
274 template <int N, typename T>
276
// polymorphic copy
// NOTE(review): the caller presumably owns the returned object - confirm
277 virtual TransferDomain *clone(void) const = 0;
278
279 virtual ~TransferDomain(void);
280
281 virtual Event request_metadata(void) = 0;
282
283 virtual bool empty(void) const = 0;
284 virtual size_t volume(void) const = 0;
285
// dim_order is an output parameter (non-const reference); the remaining
// arguments are read-only inputs
286 virtual void choose_dim_order(std::vector<int> &dim_order,
287 const std::vector<CopySrcDstField> &srcs,
288 const std::vector<CopySrcDstField> &dsts,
289 const std::vector<IndirectionInfo *> &indirects,
290 bool force_fortran_order, size_t max_stride) const = 0;
291
// fragments is an output parameter (non-const reference)
292 virtual void count_fragments(RegionInstance inst, const std::vector<int> &dim_order,
293 const std::vector<FieldID> &fields,
294 const std::vector<size_t> &fld_sizes,
295 std::vector<size_t> &fragments) const = 0;
296
// create an iterator over inst using an explicit dimension order
297 virtual TransferIterator *
298 create_iterator(RegionInstance inst, const std::vector<int> &dim_order,
299 const std::vector<FieldID> &fields,
300 const std::vector<size_t> &fld_offsets,
301 const std::vector<size_t> &fld_sizes) const = 0;
302
// second create_iterator overload (takes a peer instance instead of a
// dimension order)
303 virtual TransferIterator *
305 const std::vector<FieldID> &fields,
306 const std::vector<size_t> &fld_offsets,
307 const std::vector<size_t> &fld_sizes) const = 0;
308
309 virtual void print(std::ostream &os) const = 0;
310 };
311
312 class TransferOperation;
313
314 // copies with generalized scatter and gather have a DAG that describes
315 // the overall transfer: nodes are transfer descriptors and edges are
316 // intermediate buffers
// one node of the transfer DAG: a template for a transfer descriptor plus
// the inputs and outputs it connects to
318 struct XDTemplate {
319 // TODO(apryakhin@): Remove target_node
321 // XferDesKind kind;
326 Channel *channel = nullptr;
327
// one input or output of a node; the union holds the payload for the
// instance, indirect-instance, edge and fill-data flavours
// NOTE(review): the active union member is presumably selected by the
// iotype tag - confirm before reading a member
335 struct IO {
337 union {
338 struct {
340 unsigned fld_start;
341 unsigned fld_count;
343 struct {
344 unsigned ind_idx;
345 unsigned port;
347 unsigned fld_start;
348 unsigned fld_count;
350 unsigned edge;
351 struct {
352 unsigned fill_start;
353 unsigned fill_size;
356 };
357 };
// factory helpers, one per IO flavour
358 static IO mk_inst(RegionInstance _inst, unsigned _fld_start, unsigned _fld_count);
359 static IO mk_indirect(unsigned _ind_idx, unsigned _port, RegionInstance _inst,
360 unsigned _fld_start, unsigned _fld_count);
361 static IO mk_edge(unsigned _edge);
362 static IO mk_fill(unsigned _fill_start, unsigned _fill_size, size_t _fill_total);
363
364 std::vector<IO> inputs; // TODO: short vectors
365 std::vector<IO> outputs;
366
367 // helper functions for initializing these things
// NOTE(review): in_edge and out_edge are signed while IO::edge is unsigned;
// negative values may carry a special meaning - confirm
368 void set_simple(Channel *channel, int in_edge, int out_edge);
369 };
// one edge of the transfer DAG, i.e. an intermediate buffer
370 struct IBInfo {
372 size_t size;
373 };
// graph storage: nodes, edges, and an ordering of edge indices
// NOTE(review): ib_alloc_order presumably lists ib_edges indices in the
// order they should be allocated - confirm
374 std::vector<XDTemplate> xd_nodes;
375 std::vector<IBInfo> ib_edges;
376 std::vector<unsigned> ib_alloc_order;
377 };
378
// Reference-counted description of a transfer: sources, destinations,
// indirections, the analysed dimension order and the operations waiting on
// the analysis.
380 public:
381 // Copy the srcs and dsts (indirects are taken by const reference)
382 template <int N, typename T>
384 IndexSpace<N, T> _is, const std::vector<CopySrcDstField> &_srcs,
385 const std::vector<CopySrcDstField> &_dsts,
386 const std::vector<const typename CopyIndirection<N, T>::Base *> &_indirects,
387 const ProfilingRequestSet &requests);
388
389 // Move the srcs and dsts (indirects are still taken by const reference)
390 template <int N, typename T>
392 IndexSpace<N, T> _is, std::vector<CopySrcDstField> &&_srcs,
393 std::vector<CopySrcDstField> &&_dsts,
394 const std::vector<const typename CopyIndirection<N, T>::Base *> &_indirects,
395 const ProfilingRequestSet &requests);
396
397 private:
// forwarding constructor: SrcVec and DstVec are deduced so the vectors can
// be either copied or moved
// NOTE(review): presumably the shared implementation behind both public
// constructors - confirm in the .inl file
// NOTE(review): std::true_type needs <type_traits>, which is not among the
// includes visible at the top of this header
398 template <int N, typename T, typename SrcVec, typename DstVec>
400 IndexSpace<N, T> _is, SrcVec &&_srcs, DstVec &&_dsts,
401 const std::vector<const typename CopyIndirection<N, T>::Base *> &_indirects,
402 const ProfilingRequestSet &requests,
403 std::true_type); // the true_type is used to disambiguate the constructor
404
405 protected:
406 // reference-counted - do not delete directly
408
409 public:
412
413 // returns true if the analysis is complete, and ib allocation can proceed
414 // if the analysis isn't, returns false and op->allocate_ibs() will be
415 // called once it is
417
423
424 protected:
426
429 void cancel_analysis(Event failed_precondition);
430
432 public:
// event-waiter style callbacks of the nested deferred-analysis helper
434 virtual void event_triggered(bool poisoned, TimeLimit work_until);
435 virtual void print(std::ostream &os) const;
436 virtual Event get_finish_event(void) const;
437
440 };
442
// TransferOperation is granted access to the non-public members
443 friend class TransferOperation;
444
446 std::vector<CopySrcDstField> srcs, dsts;
// NOTE(review): raw pointers; who deletes the IndirectionInfo objects is
// not visible in this header
447 std::vector<IndirectionInfo *> indirects;
449
// NOTE(review): presumably the operations that asked for analysis before it
// completed (see the comment above about op->allocate_ibs()) - confirm
453 std::vector<TransferOperation *> pending_ops;
455 std::vector<int> dim_order;
456 std::vector<FieldInfo> src_fields, dst_fields;
458 size_t fill_size;
461 };
462
// Abstract interface describing one indirection (gather or scatter) of a
// copy. Every member function other than the destructor is pure virtual.
464 public:
465 virtual ~IndirectionInfo(void) {}
466 virtual Event request_metadata(void) = 0;
467
// appends the nodes and edges needed for a gather to xd_nodes and ib_edges
// (both are non-const references); src_fields is also an in/out parameter
468 virtual void
469 generate_gather_paths(const Node *node_info, Memory dst_mem,
470 TransferGraph::XDTemplate::IO dst_edge, unsigned indirect_idx,
471 unsigned src_fld_start, unsigned src_fld_count,
472 size_t bytes_per_element, CustomSerdezID serdez_id,
473 std::vector<TransferGraph::XDTemplate> &xd_nodes,
474 std::vector<TransferGraph::IBInfo> &ib_edges,
475 std::vector<TransferDesc::FieldInfo> &src_fields) = 0;
476
// scatter counterpart of generate_gather_paths
// NOTE(review): the last parameter is named src_fields although the other
// arguments are dst_fld_start and dst_fld_count - confirm whether
// dst_fields was intended
478 Memory src_mem, TransferGraph::XDTemplate::IO src_edge, unsigned indirect_idx,
479 unsigned dst_fld_start, unsigned dst_fld_count, size_t bytes_per_element,
480 CustomSerdezID serdez_id, std::vector<TransferGraph::XDTemplate> &xd_nodes,
481 std::vector<TransferGraph::IBInfo> &ib_edges,
482 std::vector<TransferDesc::FieldInfo> &src_fields) = 0;
483
484 virtual RegionInstance get_pointer_instance(void) const = 0;
485
// returns a pointer rather than a reference
// NOTE(review): whether null is a valid result is not visible here
486 virtual const std::vector<RegionInstance> *get_instances(void) const = 0;
487
488 virtual FieldID get_field(void) const = 0;
489
491
// channel defaults to nullptr; default arguments on virtual functions are
// taken from the static type of the call, so overrides should repeat the
// same default
493 Memory addrs_mem, RegionInstance inst, const std::vector<FieldID> &fields,
494 const std::vector<size_t> &fld_offsets, const std::vector<size_t> &fld_sizes,
495 Channel *channel = nullptr) const = 0;
496
497 virtual void print(std::ostream &os) const = 0;
498 };
499
// stream-insertion overload for IndirectionInfo
// NOTE(review): presumably forwards to the virtual print() - confirm
500 std::ostream &operator<<(std::ostream &os, const IndirectionInfo &ii);
501
// Dimension-agnostic part of an indirection: declares the gather/scatter
// path generation and defers the dimension-specific pieces to pure-virtual
// helpers.
503 public:
// NOTE(review): _insts is passed by const value, so the vector is copied at
// the call site; a const reference would avoid that copy
504 IndirectionInfoBase(bool _structured, FieldID _field_id, RegionInstance _inst,
505 bool _is_ranges, bool _oor_possible, bool _aliasing_possible,
506 size_t _subfield_offset, const std::vector<RegionInstance> _insts,
507 Channel *_addrsplit_channel);
508
509 protected:
510 // most of the logic to generate unstructured gather/scatter paths is
511 // dimension-agnostic and we can define it in a base class to save
512 // compile time/code size ...
// these two are declared under protected in this class
// NOTE(review): the first parameter is spelled nodes_info here and node_info
// in the IndirectionInfo declaration - harmless, but worth aligning
513 virtual void generate_gather_paths(const Node *nodes_info, Memory dst_mem,
515 unsigned indirect_idx, unsigned src_fld_start,
516 unsigned src_fld_count, size_t bytes_per_element,
517 CustomSerdezID serdez_id,
518 std::vector<TransferGraph::XDTemplate> &xd_nodes,
519 std::vector<TransferGraph::IBInfo> &ib_edges,
520 std::vector<TransferDesc::FieldInfo> &src_fields);
521
522 virtual void generate_scatter_paths(Memory src_mem,
524 unsigned indirect_idx, unsigned dst_fld_start,
525 unsigned dst_fld_count, size_t bytes_per_element,
526 CustomSerdezID serdez_id,
527 std::vector<TransferGraph::XDTemplate> &xd_nodes,
528 std::vector<TransferGraph::IBInfo> &ib_edges,
529 std::vector<TransferDesc::FieldInfo> &src_fields);
530
531 // ... but we need the pure-virtual helpers below, which are defined in the typed versions
532 virtual size_t num_spaces() const = 0;
533 virtual void populate_copy_info(ChannelCopyInfo &info) const = 0;
534 virtual size_t domain_size() const = 0;
535 virtual size_t address_size() const = 0;
536
537 virtual XferDesFactory *create_addrsplit_factory(size_t bytes_per_element) const = 0;
538
// NOTE(review): presumably a stored copy of the _insts constructor argument
// - confirm in the constructor definition
546 std::vector<RegionInstance> insts;
548 };
549
551 //
552 // class IndirectionInfoTyped<N,T,N2,T2>
553 //
554
// Typed indirection: N and T describe the copy domain, N2 and T2 the index
// spaces stored in spaces. Declares the helpers that IndirectionInfoBase
// leaves pure virtual.
555 template <int N, typename T, int N2, typename T2>
557 public:
559 const IndexSpace<N, T> &is,
560 const typename CopyIndirection<N, T>::template Unstructured<N2, T2> &ind,
561 Channel *_addr_split_channel);
562
563 virtual Event request_metadata(void);
564
566
567 virtual const std::vector<RegionInstance> *get_instances(void) const;
568
569 virtual FieldID get_field(void) const;
570
572
// the nullptr default repeats the one on the IndirectionInfo declaration;
// keep the two in sync because defaults on virtual functions are resolved
// from the static type of the call
574 Memory addrs_mem, RegionInstance inst, const std::vector<FieldID> &fields,
575 const std::vector<size_t> &fld_offsets, const std::vector<size_t> &fld_sizes,
576 Channel *channel = nullptr) const;
577
578 virtual void print(std::ostream &os) const;
579
580 protected:
// dimension-specific helpers required by IndirectionInfoBase
581 virtual size_t num_spaces() const;
582 virtual void populate_copy_info(ChannelCopyInfo &info) const;
583 virtual size_t domain_size() const;
584 virtual size_t address_size() const;
585
586 virtual XferDesFactory *create_addrsplit_factory(size_t bytes_per_element) const;
587
// NOTE(review): num_spaces() presumably reports spaces.size() - confirm
// NOTE(review): this class also has an addr_split_channel member while the
// base class has addrsplit_channel - confirm that both are needed
589 std::vector<IndexSpace<N2, T2>> spaces;
591 };
592
593 // a TransferOperation is an application-requested copy/fill/reduce
// One application-requested transfer built on a TransferDesc. Holds the
// transfer-descriptor ids, their lifetime trackers and the intermediate
// buffer offsets for that transfer.
595 public:
// _desc is taken by reference
// NOTE(review): given the reference-counting comment on TransferDesc, a
// reference is presumably taken here - confirm in the definition
596 TransferOperation(TransferDesc &_desc, Event _precondition,
597 GenEventImpl *_finish_event, EventImpl::gen_t _finish_gen,
598 int priority);
599
601
602 virtual void print(std::ostream &os) const;
603
// NOTE(review): presumably starts immediately or waits on the precondition
// via DeferredStart - confirm in the definition
604 void start_or_defer(void);
605
606 virtual bool mark_ready(void);
607 virtual bool mark_started(void);
608
611
// record the offset assigned to a single intermediate buffer
612 void notify_ib_allocation(unsigned ib_index, off_t ib_offset);
// batched form of notify_ib_allocation
// NOTE(review): offsets presumably points at count entries that apply to
// buffer indices starting at first_index - confirm
613 void notify_ib_allocations(unsigned count, unsigned first_index,
614 const off_t *offsets);
616
618 public:
620 virtual void request_cancellation(void);
621 virtual void print(std::ostream &os) const;
622
623 protected:
625 };
626
627 protected:
628 virtual void mark_completed(void);
629
// event waiter used to hold the operation until an event triggers
630 class DeferredStart : public EventWaiter {
631 public:
633 virtual void event_triggered(bool poisoned, TimeLimit work_until);
634 virtual void print(std::ostream &os) const;
635 virtual Event get_finish_event(void) const;
636
639 };
641
644 std::vector<XferDesID> xd_ids;
// NOTE(review): raw pointers; ownership of the trackers is not visible in
// this header
645 std::vector<XDLifetimeTracker *> xd_trackers;
// offsets recorded by the notify_ib_allocation calls (presumably one entry
// per intermediate buffer - confirm)
646 std::vector<off_t> ib_offsets;
649 };
650
// Function-pointer type for a copy implementation: takes an index space,
// the source and destination field lists, the indirections and the
// profiling requests, followed by an Event and an int, and returns an Event.
// NOTE(review): the trailing Event and int are presumably the precondition
// and the priority - confirm at the call sites
651 template <int N, typename T>
653 Event (*)(const IndexSpace<N, T> &, const std::vector<CopySrcDstField> &,
654 const std::vector<CopySrcDstField> &,
655 const std::vector<const typename CopyIndirection<N, T>::Base *> &,
656 const Realm::ProfilingRequestSet &, Event, int);
657
// per-(N, T) holder for a static CopyImplFn<N, T> pointer named impl
658 template <int N, typename T>
661 };
662
663}; // namespace Realm
664
665#include "realm/transfer/transfer.inl"
666
667#endif // ifndef REALM_TRANSFER_H
Definition address_list.h:55
Definition channel.h:713
Definition indexspace.h:252
Definition indexspace.h:250
unsigned gen_t
Definition event_impl.h:87
Definition event_impl.h:49
Definition event.h:50
Definition event_impl.h:198
Definition transfer.h:502
bool structured
Definition transfer.h:539
virtual XferDesFactory * create_addrsplit_factory(size_t bytes_per_element) const =0
virtual void generate_scatter_paths(Memory src_mem, TransferGraph::XDTemplate::IO src_edge, unsigned indirect_idx, unsigned dst_fld_start, unsigned dst_fld_count, size_t bytes_per_element, CustomSerdezID serdez_id, std::vector< TransferGraph::XDTemplate > &xd_nodes, std::vector< TransferGraph::IBInfo > &ib_edges, std::vector< TransferDesc::FieldInfo > &src_fields)
virtual void generate_gather_paths(const Node *nodes_info, Memory dst_mem, TransferGraph::XDTemplate::IO dst_edge, unsigned indirect_idx, unsigned src_fld_start, unsigned src_fld_count, size_t bytes_per_element, CustomSerdezID serdez_id, std::vector< TransferGraph::XDTemplate > &xd_nodes, std::vector< TransferGraph::IBInfo > &ib_edges, std::vector< TransferDesc::FieldInfo > &src_fields)
std::vector< RegionInstance > insts
Definition transfer.h:546
size_t subfield_offset
Definition transfer.h:545
FieldID field_id
Definition transfer.h:540
IndirectionInfoBase(bool _structured, FieldID _field_id, RegionInstance _inst, bool _is_ranges, bool _oor_possible, bool _aliasing_possible, size_t _subfield_offset, const std::vector< RegionInstance > _insts, Channel *_addrsplit_channel)
RegionInstance inst
Definition transfer.h:541
bool oor_possible
Definition transfer.h:543
bool aliasing_possible
Definition transfer.h:544
Channel * addrsplit_channel
Definition transfer.h:547
virtual size_t num_spaces() const =0
bool is_ranges
Definition transfer.h:542
virtual size_t address_size() const =0
virtual void populate_copy_info(ChannelCopyInfo &info) const =0
virtual size_t domain_size() const =0
Definition transfer.h:556
virtual RegionInstance get_pointer_instance(void) const
virtual void populate_copy_info(ChannelCopyInfo &info) const
IndexSpace< N, T > domain
Definition transfer.h:588
virtual void print(std::ostream &os) const
IndirectionInfoTyped(const IndexSpace< N, T > &is, const typename CopyIndirection< N, T >::template Unstructured< N2, T2 > &ind, Channel *_addr_split_channel)
virtual const std::vector< RegionInstance > * get_instances(void) const
virtual size_t domain_size() const
virtual Event request_metadata(void)
virtual TransferIterator * create_indirect_iterator(Memory addrs_mem, RegionInstance inst, const std::vector< FieldID > &fields, const std::vector< size_t > &fld_offsets, const std::vector< size_t > &fld_sizes, Channel *channel=nullptr) const
Channel * addr_split_channel
Definition transfer.h:590
virtual TransferIterator * create_address_iterator(RegionInstance peer) const
virtual size_t address_size() const
virtual XferDesFactory * create_addrsplit_factory(size_t bytes_per_element) const
std::vector< IndexSpace< N2, T2 > > spaces
Definition transfer.h:589
virtual size_t num_spaces() const
virtual FieldID get_field(void) const
Definition transfer.h:463
virtual FieldID get_field(void) const =0
virtual void generate_gather_paths(const Node *node_info, Memory dst_mem, TransferGraph::XDTemplate::IO dst_edge, unsigned indirect_idx, unsigned src_fld_start, unsigned src_fld_count, size_t bytes_per_element, CustomSerdezID serdez_id, std::vector< TransferGraph::XDTemplate > &xd_nodes, std::vector< TransferGraph::IBInfo > &ib_edges, std::vector< TransferDesc::FieldInfo > &src_fields)=0
virtual void generate_scatter_paths(Memory src_mem, TransferGraph::XDTemplate::IO src_edge, unsigned indirect_idx, unsigned dst_fld_start, unsigned dst_fld_count, size_t bytes_per_element, CustomSerdezID serdez_id, std::vector< TransferGraph::XDTemplate > &xd_nodes, std::vector< TransferGraph::IBInfo > &ib_edges, std::vector< TransferDesc::FieldInfo > &src_fields)=0
virtual Event request_metadata(void)=0
virtual const std::vector< RegionInstance > * get_instances(void) const =0
virtual RegionInstance get_pointer_instance(void) const =0
virtual TransferIterator * create_indirect_iterator(Memory addrs_mem, RegionInstance inst, const std::vector< FieldID > &fields, const std::vector< size_t > &fld_offsets, const std::vector< size_t > &fld_sizes, Channel *channel=nullptr) const =0
virtual TransferIterator * create_address_iterator(RegionInstance peer) const =0
virtual void print(std::ostream &os) const =0
virtual ~IndirectionInfo(void)
Definition transfer.h:465
Definition inst_layout.h:266
Definition memory.h:33
static const Memory NO_MEMORY
Definition memory.h:49
Definition operation.h:75
Definition operation.h:32
Definition profiling.h:363
Definition inst_impl.h:54
Definition instance.h:66
Definition sparsity_impl.h:105
Definition timers.h:129
Definition transfer.h:431
virtual void print(std::ostream &os) const
TransferDesc * desc
Definition transfer.h:438
virtual void event_triggered(bool poisoned, TimeLimit work_until)
Event precondition
Definition transfer.h:439
virtual Event get_finish_event(void) const
DeferredAnalysis(TransferDesc *_desc)
Definition transfer.h:379
TransferDomain * domain
Definition transfer.h:445
atomic< bool > analysis_complete
Definition transfer.h:451
void cancel_analysis(Event failed_precondition)
ProfilingMeasurements::OperationMemoryUsage prof_usage
Definition transfer.h:459
size_t fill_size
Definition transfer.h:458
std::vector< FieldInfo > src_fields
Definition transfer.h:456
TransferGraph graph
Definition transfer.h:454
std::vector< IndirectionInfo * > indirects
Definition transfer.h:447
Mutex mutex
Definition transfer.h:450
bool request_analysis(TransferOperation *op)
std::vector< CopySrcDstField > dsts
Definition transfer.h:446
std::vector< CopySrcDstField > srcs
Definition transfer.h:446
DeferredAnalysis deferred_analysis
Definition transfer.h:441
ProfilingMeasurements::OperationCopyInfo prof_cpinfo
Definition transfer.h:460
std::vector< int > dim_order
Definition transfer.h:455
void check_analysis_preconditions()
std::vector< FieldInfo > dst_fields
Definition transfer.h:456
bool analysis_successful
Definition transfer.h:452
atomic< int > refcount
Definition transfer.h:425
void * fill_data
Definition transfer.h:457
TransferDesc(IndexSpace< N, T > _is, std::vector< CopySrcDstField > &&_srcs, std::vector< CopySrcDstField > &&_dsts, const std::vector< const typename CopyIndirection< N, T >::Base * > &_indirects, const ProfilingRequestSet &requests)
ProfilingRequestSet prs
Definition transfer.h:448
TransferDesc(IndexSpace< N, T > _is, const std::vector< CopySrcDstField > &_srcs, const std::vector< CopySrcDstField > &_dsts, const std::vector< const typename CopyIndirection< N, T >::Base * > &_indirects, const ProfilingRequestSet &requests)
std::vector< TransferOperation * > pending_ops
Definition transfer.h:453
Definition transfer.h:266
virtual TransferIterator * create_iterator(RegionInstance inst, RegionInstance peer, const std::vector< FieldID > &fields, const std::vector< size_t > &fld_offsets, const std::vector< size_t > &fld_sizes) const =0
virtual ~TransferDomain(void)
virtual size_t volume(void) const =0
virtual TransferDomain * clone(void) const =0
virtual Event request_metadata(void)=0
virtual void choose_dim_order(std::vector< int > &dim_order, const std::vector< CopySrcDstField > &srcs, const std::vector< CopySrcDstField > &dsts, const std::vector< IndirectionInfo * > &indirects, bool force_fortran_order, size_t max_stride) const =0
virtual TransferIterator * create_iterator(RegionInstance inst, const std::vector< int > &dim_order, const std::vector< FieldID > &fields, const std::vector< size_t > &fld_offsets, const std::vector< size_t > &fld_sizes) const =0
virtual void count_fragments(RegionInstance inst, const std::vector< int > &dim_order, const std::vector< FieldID > &fields, const std::vector< size_t > &fld_sizes, std::vector< size_t > &fragments) const =0
virtual bool empty(void) const =0
static TransferDomain * deserialize_new(S &deserializer)
static TransferDomain * construct(const IndexSpace< N, T > &is)
virtual void print(std::ostream &os) const =0
Definition transfer.h:125
Rect< N, T > cur_rect
Definition transfer.h:153
virtual Event request_metadata(void)
size_t cur_field_offset
Definition transfer.h:155
bool have_rect
Definition transfer.h:152
virtual void cancel_step(void)
Point< N, T > cur_point
Definition transfer.h:156
virtual void confirm_step(void)
virtual bool done(void)
bool carry
Definition transfer.h:157
virtual size_t step(size_t max_bytes, AddressInfo &info, unsigned flags, bool tentative=false)
bool tentative_valid
Definition transfer.h:162
Point< N, T > next_point
Definition transfer.h:156
TransferIteratorBase(RegionInstanceImpl *_inst_impl, const int _dim_order[N])
FieldID cur_field_id
Definition transfer.h:154
virtual bool get_addresses(AddressList &addrlist, const InstanceLayoutPieceBase *&nonaffine)
bool is_done
Definition transfer.h:152
virtual size_t get_base_offset(void) const
size_t inst_offset
Definition transfer.h:161
size_t cur_field_size
Definition transfer.h:155
virtual size_t step_custom(size_t max_bytes, AddressInfoCustom &info, bool tentative=false)
int dim_order[N]
Definition transfer.h:163
virtual bool get_next_rect(Rect< N, T > &r, FieldID &fid, size_t &offset, size_t &fsize)=0
RegionInstanceImpl * inst_impl
Definition transfer.h:159
virtual void reset(void)
Definition transfer.h:172
virtual bool get_next_rect(Rect< N, T > &r, FieldID &fid, size_t &offset, size_t &fsize)
size_t field_idx
Definition transfer.h:217
IndexSpace< N, T > is
Definition transfer.h:211
TransferIteratorIndexSpace(const int _dim_order[N], const std::vector< FieldID > &_fields, const std::vector< size_t > &_fld_offsets, const std::vector< size_t > &_fld_sizes, RegionInstanceImpl *_inst_impl, const IndexSpace< N, T > &_is)
std::vector< FieldID > fields
Definition transfer.h:215
static Serialization::PolymorphicSerdezSubclass< TransferIterator, TransferIteratorIndexSpace< N, T > > serdez_subclass
Definition transfer.h:201
std::vector< size_t > fld_sizes
Definition transfer.h:216
static TransferIterator * deserialize_new(S &deserializer)
TransferIteratorIndexSpace(const int _dim_order[N], const std::vector< FieldID > &_fields, const std::vector< size_t > &_fld_offsets, const std::vector< size_t > &_fld_sizes, RegionInstanceImpl *_inst_impl, const Rect< N, T > &_bounds, SparsityMapImpl< N, T > *_sparsity_impl)
SparsityMapImpl< N, T > * sparsity_impl
Definition transfer.h:212
bool iter_init_deferred
Definition transfer.h:214
std::vector< size_t > fld_offsets
Definition transfer.h:216
IndexSpaceIterator< N, T > iter
Definition transfer.h:213
bool serialize(S &serializer) const
virtual Event request_metadata(void)
Definition transfer.h:221
Memory addrs_mem
Definition transfer.h:254
int indirect_port_idx
Definition transfer.h:263
virtual bool get_next_rect(Rect< N, T > &r, FieldID &fid, size_t &offset, size_t &fsize)
bool can_merge
Definition transfer.h:256
std::vector< size_t > fld_offsets
Definition transfer.h:261
intptr_t addrs_mem_base
Definition transfer.h:255
TransferIteratorIndirect(Memory _addrs_mem, RegionInstanceImpl *_inst_impl, const std::vector< FieldID > &_fields, const std::vector< size_t > &_fld_offsets, const std::vector< size_t > &_fld_sizes)
virtual void set_indirect_input_port(XferDes *xd, int port_idx, TransferIterator *inner_iter)
bool serialize(S &serializer) const
XferDes * indirect_xd
Definition transfer.h:262
static constexpr size_t MAX_POINTS
Definition transfer.h:257
std::vector< size_t > fld_sizes
Definition transfer.h:261
virtual Event request_metadata(void)
size_t num_points
Definition transfer.h:259
Point< N, T > points[MAX_POINTS]
Definition transfer.h:258
size_t point_pos
Definition transfer.h:259
virtual ~TransferIteratorIndirect(void)
TransferIterator * addrs_in
Definition transfer.h:253
static TransferIterator * deserialize_new(S &deserializer)
static Serialization::PolymorphicSerdezSubclass< TransferIterator, TransferIteratorIndirect< N, T > > serdez_subclass
Definition transfer.h:244
std::vector< FieldID > fields
Definition transfer.h:260
virtual ~AddressInfoCustom()
Definition transfer.h:91
virtual int set_rect(const RegionInstanceImpl *inst, const InstanceLayoutPieceBase *piece, size_t field_size, size_t field_offset, int ndims, const int64_t lo[], const int64_t hi[], const int order[])=0
Definition transfer.h:41
virtual size_t get_address_size(void) const
virtual void reset(void)=0
virtual ~TransferIterator(void)
virtual bool done(void)=0
virtual size_t step_custom(size_t max_bytes, AddressInfoCustom &info, bool tentative=false)=0
virtual size_t get_base_offset(void) const
virtual size_t step(size_t max_bytes, AddressInfo &info, unsigned flags, bool tentative=false)=0
@ SRC_LINES_OK
Definition transfer.h:64
@ SRC_PARTIAL_OK
Definition transfer.h:63
@ SRC_PLANES_OK
Definition transfer.h:65
@ SRC_FLAGMASK
Definition transfer.h:66
@ PARTIAL_OK
Definition transfer.h:73
@ LINES_OK
Definition transfer.h:74
@ PLANES_OK
Definition transfer.h:75
@ DST_FLAGMASK
Definition transfer.h:71
@ DST_LINES_OK
Definition transfer.h:69
@ DST_PARTIAL_OK
Definition transfer.h:68
@ DST_PLANES_OK
Definition transfer.h:70
virtual Event request_metadata(void)
virtual bool get_addresses(AddressList &addrlist, const InstanceLayoutPieceBase *&nonaffine)=0
static TransferIterator * deserialize_new(S &deserializer)
virtual void cancel_step(void)=0
virtual void confirm_step(void)=0
virtual void set_indirect_input_port(XferDes *xd, int port_idx, TransferIterator *inner_iter)
TransferOperation * op
Definition transfer.h:637
Event precondition
Definition transfer.h:638
virtual Event get_finish_event(void) const
virtual void event_triggered(bool poisoned, TimeLimit work_until)
virtual void print(std::ostream &os) const
DeferredStart(TransferOperation *_op)
XDLifetimeTracker(TransferOperation *_op, XferDesID _xd_id)
XferDesID xd_id
Definition transfer.h:624
virtual void print(std::ostream &os) const
Definition transfer.h:594
std::vector< off_t > ib_offsets
Definition transfer.h:646
Event precondition
Definition transfer.h:643
TransferOperation(TransferDesc &_desc, Event _precondition, GenEventImpl *_finish_event, EventImpl::gen_t _finish_gen, int priority)
atomic< unsigned > ib_responses_needed
Definition transfer.h:647
DeferredStart deferred_start
Definition transfer.h:640
TransferDesc & desc
Definition transfer.h:642
std::vector< XDLifetimeTracker * > xd_trackers
Definition transfer.h:645
void notify_ib_allocations(unsigned count, unsigned first_index, const off_t *offsets)
virtual bool mark_ready(void)
void notify_xd_completion(XferDesID xd_id)
virtual void mark_completed(void)
virtual void print(std::ostream &os) const
virtual bool mark_started(void)
std::vector< XferDesID > xd_ids
Definition transfer.h:644
void notify_ib_allocation(unsigned ib_index, off_t ib_offset)
int priority
Definition transfer.h:648
Definition mutex.h:223
Definition channel.h:633
Definition channel.h:286
Definition atomics.h:31
Definition activemsg.h:38
Event(*)(const IndexSpace< N, T > &, const std::vector< CopySrcDstField > &, const std::vector< CopySrcDstField > &, const std::vector< const typename CopyIndirection< N, T >::Base * > &, const Realm::ProfilingRequestSet &, Event, int) CopyImplFn
Definition transfer.h:656
realm_field_id_t FieldID
Definition instance.h:45
int NodeID
Definition nodeset.h:40
int CustomSerdezID
Definition custom_serdez.h:148
unsigned long long XferDesID
Definition channel.h:57
std::ostream & operator<<(std::ostream &os, const DenseRectangleList< N, T > &drl)
Definition channel.h:684
Definition transfer.h:659
static CopyImplFn< N, T > impl
Definition transfer.h:660
Definition indexspace.h:1249
Definition indexspace.h:323
Definition runtime_impl.h:88
Definition point.h:55
Definition point.h:143
Definition transfer.h:418
size_t size
Definition transfer.h:420
size_t offset
Definition transfer.h:420
CustomSerdezID serdez_id
Definition transfer.h:421
FieldID id
Definition transfer.h:419
Definition transfer.h:370
size_t size
Definition transfer.h:372
Memory memory
Definition transfer.h:371
Definition transfer.h:335
unsigned fill_size
Definition transfer.h:353
RegionInstance inst
Definition transfer.h:339
unsigned fld_start
Definition transfer.h:340
unsigned port
Definition transfer.h:345
unsigned ind_idx
Definition transfer.h:344
unsigned fill_start
Definition transfer.h:352
struct Realm::TransferGraph::XDTemplate::IO::@36::@40 fill
IOType iotype
Definition transfer.h:336
unsigned fld_count
Definition transfer.h:341
struct Realm::TransferGraph::XDTemplate::IO::@36::@39 indirect
unsigned edge
Definition transfer.h:350
size_t fill_total
Definition transfer.h:354
Definition transfer.h:318
Channel * channel
Definition transfer.h:326
static IO mk_fill(unsigned _fill_start, unsigned _fill_size, size_t _fill_total)
void set_simple(Channel *channel, int in_edge, int out_edge)
int scatter_control_input
Definition transfer.h:324
static IO mk_edge(unsigned _edge)
int gather_control_input
Definition transfer.h:323
XferDesRedopInfo redop
Definition transfer.h:325
XferDesFactory * factory
Definition transfer.h:322
static IO mk_inst(RegionInstance _inst, unsigned _fld_start, unsigned _fld_count)
std::vector< IO > inputs
Definition transfer.h:364
std::vector< IO > outputs
Definition transfer.h:365
static IO mk_indirect(unsigned _ind_idx, unsigned _port, RegionInstance _inst, unsigned _fld_start, unsigned _fld_count)
NodeID target_node
Definition transfer.h:320
IOType
Definition transfer.h:329
@ IO_INDIRECT_INST
Definition transfer.h:331
@ IO_FILL_DATA
Definition transfer.h:333
@ IO_EDGE
Definition transfer.h:332
@ IO_INST
Definition transfer.h:330
Definition transfer.h:317
std::vector< IBInfo > ib_edges
Definition transfer.h:375
std::vector< XDTemplate > xd_nodes
Definition transfer.h:374
std::vector< unsigned > ib_alloc_order
Definition transfer.h:376
Definition transfer.h:78
size_t num_planes
Definition transfer.h:83
size_t line_stride
Definition transfer.h:82
size_t bytes_per_chunk
Definition transfer.h:80
size_t base_offset
Definition transfer.h:79
size_t num_lines
Definition transfer.h:81
size_t plane_stride
Definition transfer.h:84
Definition channel.h:210