|
| | GPUreduceXferDes (uintptr_t _dma_op, Channel *_channel, NodeID _launch_node, XferDesID _guid, const std::vector< XferDesPortInfo > &inputs_info, const std::vector< XferDesPortInfo > &outputs_info, int _priority, XferDesRedopInfo _redop_info) |
| |
| long | get_requests (Request **requests, long nr) |
| |
| bool | progress_xd (GPUreduceChannel *channel, TimeLimit work_until) |
| |
| bool | fast_reduction_kernel_mode (GPUreduceChannel *channel, const size_t max_bytes, XferPort *in_port, XferPort *out_port, const size_t in_span_start, const size_t out_span_start) |
| |
| void | setup_redop_kernel (GPUreduceChannel *channel, void *params, const size_t in_span_start, const size_t out_span_start, const size_t in_elem_size, const size_t out_elem_size, const size_t elems, const bool has_transpose) |
| |
| void | record_redop_advanced_kernel (GPU *gpu) |
| |
| KernelVariantDesc | describe_kernel_variant (GPU *gpu, bool is_advanced) |
| |
| bool | resolve_kernel_slot (GPU *gpu, void *host_proxy, CUfunction &kernel_out, CUfunction GPU::GPUReductionOpEntry::*cache_field) |
| |
| | REALM_ALIGNED_TYPE_CONST (AlignedStorage, UnalignedStorage, 16) |
| |
| | REALM_PMTA_DEFN (XferDes, IntrusivePriorityListLink< XferDes >, xd_link) |
| |
| | REALM_PMTA_DEFN (XferDes, int, priority) |
| |
| | XferDes (uintptr_t _dma_op, Channel *_channel, NodeID _launch_node, XferDesID _guid, const std::vector< XferDesPortInfo > &inputs_info, const std::vector< XferDesPortInfo > &outputs_info, int _priority, const void *_fill_data, size_t fill_size) |
| |
| void | add_reference (void) |
| |
| void | remove_reference (void) |
| |
| void | add_update_pre_bytes_total_received (void) |
| |
| virtual Event | request_metadata () |
| |
| virtual void | notify_request_read_done (Request *req) |
| |
| virtual void | notify_request_write_done (Request *req) |
| |
| virtual void | flush () |
| |
| long | default_get_requests (Request **requests, long nr, unsigned flags=0) |
| |
| void | default_notify_request_read_done (Request *req) |
| |
| void | default_notify_request_write_done (Request *req) |
| |
| virtual void | update_bytes_read (int port_idx, size_t offset, size_t size) |
| |
| virtual void | update_bytes_write (int port_idx, size_t offset, size_t size) |
| |
| void | update_pre_bytes_write (int port_idx, size_t offset, size_t size) |
| |
| void | update_pre_bytes_total (int port_idx, size_t pre_bytes_total) |
| |
| void | update_next_bytes_read (int port_idx, size_t offset, size_t size) |
| |
| void | begin_completion () |
| |
| void | mark_completed () |
| |
| unsigned | current_progress (void) |
| |
| bool | check_for_progress (unsigned last_counter) |
| |
| void | update_progress (void) |
| |
| virtual bool | request_available () |
| |
| virtual Request * | dequeue_request () |
| |
| virtual void | enqueue_request (Request *req) |
| |
| size_t | update_control_info (ReadSequenceCache *rseqcache) |
| |
| size_t | get_addresses (size_t min_xfer_size, ReadSequenceCache *rseqcache) |
| |
| size_t | get_addresses (size_t min_xfer_size, ReadSequenceCache *rseqcache, const InstanceLayoutPieceBase *&in_nonaffine, const InstanceLayoutPieceBase *&out_nonaffine) |
| |
| bool | record_address_consumption (size_t total_read_bytes, size_t total_write_bytes) |
| |
| void | replicate_fill_data (size_t new_size) |
| |