doc/main/processor_8h_source.html

/*

 * Copyright 2025 Stanford University, NVIDIA Corporation

 * SPDX-License-Identifier: Apache-2.0

 *

 * Licensed under the Apache License, Version 2.0 (the "License");

 * you may not use this file except in compliance with the License.

 * You may obtain a copy of the License at

 *

 *     http://www.apache.org/licenses/LICENSE-2.0

 *

 * Unless required by applicable law or agreed to in writing, software

 * distributed under the License is distributed on an "AS IS" BASIS,

 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

 * See the License for the specific language governing permissions and

 * limitations under the License.

 */


// processors for Realm


#ifndef REALM_PROCESSOR_H

#define REALM_PROCESSOR_H


#include "realm/realm_c.h"


#include "realm/event.h"


#include <vector>

#include <map>


namespace Realm {


  // C++-side name for the address space identifier type of the C API
  using AddressSpace = ::realm_address_space_t;

  // Declared here and defined in other headers: this file only mentions
  //  these two classes as const-reference parameters
  class CodeDescriptor;
  class ProfilingRequestSet;


  class REALM_PUBLIC_API Processor {

  public:

    typedef ::realm_id_t id_t;


    id_t id{REALM_NO_PROC};


    Processor() = default;


    constexpr explicit Processor(id_t id)

      : id(id)

    {}


    constexpr operator id_t() const { return id; }


    bool operator<(const Processor &rhs) const { return id < rhs.id; }

    bool operator==(const Processor &rhs) const { return id == rhs.id; }

    bool operator!=(const Processor &rhs) const { return id != rhs.id; }


    static const Processor NO_PROC;


    bool exists(void) const { return id != 0; }


    typedef ::realm_task_func_id_t TaskFuncID;

    typedef void (*TaskFuncPtr)(const void *args, size_t arglen, const void *user_data,

                                size_t user_data_len, Processor proc);


    // Different Processor types (defined in realm_c.h)

    // can't just typedef the kind because of C/C++ enum scope rules


    enum Kind

    {

#define C_ENUMS(name, desc) name,

      REALM_PROCESSOR_KINDS(C_ENUMS)

#undef C_ENUMS

    };


    // Return what kind of processor this is

    Kind kind(void) const;

    // Return the address space for this processor

    AddressSpace address_space(void) const;


    REALM_ATTR_DEPRECATED(

        "use ProcessorGroup::create_group instead",

        static Processor create_group(const span<const Processor> &members));


    void get_group_members(Processor *member_list, size_t &num_members) const;

    void get_group_members(std::vector<Processor> &member_list) const;


    int get_num_cores(void) const;


    // special task IDs

    enum

    {

      // Save ID 0 for the force shutdown function

      TASK_ID_PROCESSOR_NOP = REALM_TASK_ID_PROCESSOR_NOP,

      TASK_ID_PROCESSOR_INIT = REALM_TASK_ID_PROCESSOR_INIT,

      TASK_ID_PROCESSOR_SHUTDOWN = REALM_TASK_ID_PROCESSOR_SHUTDOWN,

      TASK_ID_FIRST_AVAILABLE = REALM_TASK_ID_FIRST_AVAILABLE,

    };


    Event spawn(TaskFuncID func_id, const void *args, size_t arglen,

                Event wait_on = Event::NO_EVENT, int priority = 0) const;


    // Same as the above but with requests for profiling

    Event spawn(TaskFuncID func_id, const void *args, size_t arglen,

                const ProfilingRequestSet &requests, Event wait_on = Event::NO_EVENT,

                int priority = 0) const;


    static Processor get_executing_processor(void);


    // changes the priority of the currently running task

    static void set_current_task_priority(int new_priority);


    // returns the finish event for the currently running task

    static Event get_current_finish_event(void);


    // Add an event that must be a precondition for triggering

    // the finish event for the currently running task. This allows

    // for other asynchronous effects from the task to be accumulated

    // into finish event dynamically and for the task to exit without

    // needing to block and wait for these events to trigger.

    static realm_status_t add_finish_event_precondition(Event precondition);


    // a scheduler lock prevents the current thread from releasing its

    //  execution resources even when waiting on an Event - multiple

    //  nested calls to 'enable_scheduler_lock' are permitted, but a

    //  matching number of calls to 'disable_scheduler_lock' are required

    static void enable_scheduler_lock(void);

    static void disable_scheduler_lock(void);


    // dynamic task registration - this may be done for:

    //  1) a specific processor/group (anywhere in the system)

    //  2) for all processors of a given type, either in the local address space/process,

    //       or globally

    //

    // in both cases, an Event is returned, and any tasks launched that expect to use the

    //  newly-registered task IDs must include that event as a precondition


    Event register_task(TaskFuncID func_id, const CodeDescriptor &codedesc,

                        const ProfilingRequestSet &prs, const void *user_data = 0,

                        size_t user_data_len = 0) const;


    static Event register_task_by_kind(Kind target_kind, bool global, TaskFuncID func_id,

                                       const CodeDescriptor &codedesc,

                                       const ProfilingRequestSet &prs,

                                       const void *user_data = 0,

                                       size_t user_data_len = 0);


    // reports an execution fault in the currently running task

    static void report_execution_fault(int reason, const void *reason_data,

                                       size_t reason_size);


    // reports a problem with a processor in general (this is primarily for fault

    // injection)

    void report_processor_fault(int reason, const void *reason_data,

                                size_t reason_size) const;


    static const char *get_kind_name(Kind kind);


#ifdef REALM_USE_KOKKOS

    // Kokkos execution policies will accept an "execution instance" to

    //  capture task parallelism - provide those here

    class KokkosExecInstance;


    KokkosExecInstance kokkos_work_space(void) const;

#endif

  };


#if defined(REALM_USE_KOKKOS)

  // Kokkos defines this but we can't use it :(

  // Detection trait: `value` is true when T has a nested type named
  //  `execution_space` and false for every other T.
  template <typename T>
  class is_kokkos_execution_space {
    // the two probe overloads return types of different sizes, so the
    //  overload chosen for T can be read off inside an unevaluated sizeof
    using found_t = char;
    using missing_t = long;

    // catch-all: always viable, but an ellipsis loses overload resolution
    //  to the pointer overload whenever that one is viable too
    template <typename U>
    static missing_t probe(...);

    // drops out of the overload set (SFINAE) unless U::execution_space
    //  names a type
    template <typename U>
    static found_t probe(typename U::execution_space *);

  public:
    static constexpr bool value = (sizeof(found_t) == sizeof(probe<T>(nullptr)));
  };


  // Definition of the class that Processor forward-declares when
  //  REALM_USE_KOKKOS is set.  It holds a Processor (member 'p') and offers a
  //  templated conversion operator to any type accepted by
  //  is_kokkos_execution_space.
  class REALM_PUBLIC_API Processor::KokkosExecInstance {

  public:

    // not marked explicit, so a Processor converts to a KokkosExecInstance
    //  implicitly
    //  NOTE(review): presumably stores '_p' in 'p' - the definition is not
    //  visible in this header
    KokkosExecInstance(Processor _p);


    // template-fu will type-check a coercion to any Kokkos execution

    //  space type - runtime will verify a valid type was requested

    // the defaulted non-type template parameter removes this operator from
    //  consideration for any exec_space whose trait value is false
    template <typename exec_space,

              typename std::enable_if<is_kokkos_execution_space<exec_space>::value,

                                      int>::type = 0>

    operator exec_space() const;


  protected:

    // the processor this execution instance was created for
    Processor p;

  };

#endif


  // a processor group is a set of processors that share a ready task queue

  //  (in addition to their own processor-specific task queues)

  // NOTE: processor groups are currently limited to include processors from

  //  only a single node/rank in a distributed setting


  // Handle type for a processor group.  It derives publicly from Processor
  //  and declares no data members of its own, so a group handle can be used
  //  wherever a Processor is accepted.
  class REALM_PUBLIC_API ProcessorGroup : public Processor {
  public:
    // sentinel group handle (defined out of line)
    static const ProcessorGroup NO_PROC_GROUP;

    // creates a group from an array of 'num_members' processors
    static ProcessorGroup create_group(const Processor *members, size_t num_members);

    // convenience overload: unpacks the span into pointer + length and
    //  forwards to the array overload
    static ProcessorGroup create_group(const span<const Processor> &members)
    {
      const auto first = members.data();
      const auto count = members.size();
      return create_group(first, count);
    }

    // NOTE(review): presumably tears the group down once 'wait_on' has
    //  triggered; 'wait_on' defaults to Event::NO_EVENT
    void destroy(Event wait_on = Event::NO_EVENT) const;
  };


}; // namespace Realm


#include "realm/processor.inl"


#endif // ifndef REALM_PROCESSOR_H

Realm::CodeDescriptor
Definition codedesc.h:249

Realm::Event
Definition event.h:50

Realm::ProcessorGroup
Definition processor.h:199

Realm::ProcessorGroup::destroy
void destroy(Event wait_on=Event::NO_EVENT) const

Realm::ProcessorGroup::NO_PROC_GROUP
static const ProcessorGroup NO_PROC_GROUP
Definition processor.h:210

Realm::ProcessorGroup::create_group
static ProcessorGroup create_group(const span< const Processor > &members)
Definition processor.h:204

Realm::ProcessorGroup::create_group
static ProcessorGroup create_group(const Processor *members, size_t num_members)

Realm::Processor
Definition processor.h:37

Realm::Processor::operator==
bool operator==(const Processor &rhs) const
Definition processor.h:51

Realm::Processor::get_group_members
void get_group_members(std::vector< Processor > &member_list) const

Realm::Processor::id
id_t id
Definition processor.h:41

Realm::Processor::Processor
constexpr Processor(id_t id)
Definition processor.h:44

Realm::Processor::exists
bool exists(void) const
Definition processor.h:56

Realm::Processor::get_group_members
void get_group_members(Processor *member_list, size_t &num_members) const

Realm::Processor::REALM_ATTR_DEPRECATED
REALM_ATTR_DEPRECATED("use ProcessorGroup::create_group instead", static Processor create_group(const span< const Processor > &members))

Realm::Processor::get_executing_processor
static Processor get_executing_processor(void)

Realm::Processor::get_kind_name
static const char * get_kind_name(Kind kind)

Realm::Processor::id_t
::realm_id_t id_t
Definition processor.h:39

Realm::Processor::spawn
Event spawn(TaskFuncID func_id, const void *args, size_t arglen, const ProfilingRequestSet &requests, Event wait_on=Event::NO_EVENT, int priority=0) const

Realm::Processor::register_task
Event register_task(TaskFuncID func_id, const CodeDescriptor &codedesc, const ProfilingRequestSet &prs, const void *user_data=0, size_t user_data_len=0) const

Realm::Processor::report_execution_fault
static void report_execution_fault(int reason, const void *reason_data, size_t reason_size)

Realm::Processor::Kind
Kind
Definition processor.h:65

Realm::Processor::get_num_cores
int get_num_cores(void) const

Realm::Processor::report_processor_fault
void report_processor_fault(int reason, const void *reason_data, size_t reason_size) const

Realm::Processor::register_task_by_kind
static Event register_task_by_kind(Kind target_kind, bool global, TaskFuncID func_id, const CodeDescriptor &codedesc, const ProfilingRequestSet &prs, const void *user_data=0, size_t user_data_len=0)

Realm::Processor::disable_scheduler_lock
static void disable_scheduler_lock(void)

Realm::Processor::enable_scheduler_lock
static void enable_scheduler_lock(void)

Realm::Processor::spawn
Event spawn(TaskFuncID func_id, const void *args, size_t arglen, Event wait_on=Event::NO_EVENT, int priority=0) const

Realm::Processor::add_finish_event_precondition
static realm_status_t add_finish_event_precondition(Event precondition)

Realm::Processor::operator<
bool operator<(const Processor &rhs) const
Definition processor.h:50

Realm::Processor::TaskFuncID
::realm_task_func_id_t TaskFuncID
Definition processor.h:58

Realm::Processor::get_current_finish_event
static Event get_current_finish_event(void)

Realm::Processor::NO_PROC
static const Processor NO_PROC
Definition processor.h:54

Realm::Processor::address_space
AddressSpace address_space(void) const

Realm::Processor::Processor
Processor()=default

Realm::Processor::set_current_task_priority
static void set_current_task_priority(int new_priority)

Realm::Processor::operator!=
bool operator!=(const Processor &rhs) const
Definition processor.h:52

Realm::Processor::kind
Kind kind(void) const

Realm::ProfilingRequestSet
Definition profiling.h:363

Realm::span
Definition utils.h:84

REALM_PUBLIC_API
#define REALM_PUBLIC_API
Definition compiler_support.h:217

event.h

C_ENUMS
#define C_ENUMS(name, desc)
Definition memory.h:60

Realm
Definition activemsg.h:38

Realm::AddressSpace
::realm_address_space_t AddressSpace
Definition memory.h:31

realm_c.h

REALM_TASK_ID_FIRST_AVAILABLE
#define REALM_TASK_ID_FIRST_AVAILABLE
Definition realm_c.h:174

realm_status_t
enum realm_status_enum realm_status_t

realm_id_t
unsigned long long realm_id_t
Definition realm_c.h:64

REALM_TASK_ID_PROCESSOR_NOP
#define REALM_TASK_ID_PROCESSOR_NOP
Definition realm_c.h:171

REALM_TASK_ID_PROCESSOR_INIT
#define REALM_TASK_ID_PROCESSOR_INIT
Definition realm_c.h:172

REALM_PROCESSOR_KINDS
#define REALM_PROCESSOR_KINDS(__op__)
Definition realm_c.h:227

REALM_TASK_ID_PROCESSOR_SHUTDOWN
#define REALM_TASK_ID_PROCESSOR_SHUTDOWN
Definition realm_c.h:173

realm_address_space_t
unsigned int realm_address_space_t
Definition realm_c.h:72

realm_task_func_id_t
unsigned realm_task_func_id_t
Definition realm_c.h:73

REALM_NO_PROC
#define REALM_NO_PROC
Definition realm_c.h:165