Schedulers.Multicoremodule Backend : Ir.Backend_impl.For_add_schedulerinclude Ir.Backend_intf.Backend_device_common
with type optimize_ctx = Ir.Low_level.optimize_ctxinclude Ir.Backend_intf.Device
with type optimize_ctx = Ir.Low_level.optimize_ctxinclude Ir.Backend_intf.Device_types
with type optimize_ctx = Ir.Low_level.optimize_ctxinclude Ir.Backend_intf.Device_config
with type optimize_ctx = Ir.Low_level.optimize_ctxinclude Ir.Backend_intf.Device_config_commonval sexp_of_dev : dev -> Sexplib0.Sexp.tval sexp_of_runner : runner -> Sexplib0.Sexp.tAn event tracks if a device's runner finished computing past a particular point in its schedule. These values are used internally for scheduling across devices/queues of the backend, and can be used for explicit scheduling.
val sexp_of_event : event -> Sexplib0.Sexp.ttype optimize_ctx = Ir.Low_level.optimize_ctxThe optimization context for compiling code, in particular Low_level.optimize_ctx for low-level backends.
val sexp_of_optimize_ctx : optimize_ctx -> Sexplib0.Sexp.tval empty_optimize_ctx : Base.unit -> optimize_ctxtype nonrec device = (dev, runner, event) Ir.Backend_intf.deviceval sexp_of_device : device -> Sexplib0.Sexp.ttype nonrec context =
(dev, runner, event, optimize_ctx) Ir.Backend_intf.contextval sexp_of_context : context -> Sexplib0.Sexp.tinclude Ir.Backend_intf.Slab_alloc with type device := deviceval alloc_pool :
?mode:Ir.Tnode.memory_mode ->
device ->
pool_id:Base.int ->
size_in_bytes:Base.int ->
alignment:Base.int ->
Base.unitAllocates the slab for pool_id on device. The optional ?mode carries the tnode's memory mode so backends can pick a storage mode (Metal private vs. shared); backends that do not care ignore it.
val free_pool : (device -> pool_id:Base.int -> Base.unit) Base.optionFrees the slab for pool_id and drops its table entry. None for backends that rely on GC.
val memset_zero :
device ->
pool_id:Base.int ->
offset:Base.int ->
size_in_bytes:Base.int ->
Base.unitZero-initializes size_in_bytes at base_of pool_id + offset.
val make_context :
?ctx_buffers:Ir.Backend_intf.ctx_buffers ->
?optimize_ctx:optimize_ctx ->
device ->
contextReturns a context without a parent.
val make_child :
?ctx_buffers:Ir.Backend_intf.ctx_buffers ->
?optimize_ctx:optimize_ctx ->
?merge_buffer_node:Ir.Tnode.t Base.option ->
context ->
contextReturns a context with the same Backend_intf.context.device, Backend_intf.context.ctx_buffers, Backend_intf.context.optimize_ctx, Backend_intf.context.merge_buffer_node if omitted, as the given context's, which is also the Backend_intf.context.parent.
val get_name : device -> Base.stringval sync : event -> Base.unitBlocks till the event completes, if it's not done already.
It is rarely needed to call sync explicitly, because it should always be called internally when necessary, in particular before extracting values from host.
val is_done : event -> Base.boolWhether the event completed.
Schedules waiting for the given event on the context's device.
NOTE: it should rarely be needed to call will_wait_for explicitly, because it should always be called internally when necessary.
val get_used_memory : device -> Base.intReturns (an upper bound of) the memory used for arrays, in bytes.
Global debug information; backend-specific and might evolve independently on the backends.
val get_debug_info : device -> Base.Sexp.tPer-device debug information; backend-specific and might evolve independently on the backends
val await : device -> Base.unitBlocks till the device becomes idle, i.e. synchronizes the device's runner.
Returns the event indicating if any currently running or scheduled computations on the device have completed.
val is_idle : device -> Base.boolWhether the device's runner is currently waiting for work.
val get_device : ordinal:Base.int -> deviceAfter the stream-into-device fold there is one compute stream per device, so the device is its own single stream; new_stream returns the device unchanged. Retained for call-site compatibility (callers create a fresh context per logical stream via make_context).
include Ir.Backend_impl.Buffer with type buffer_ptr = Backend.buffer_ptrtype buffer_ptr = Backend.buffer_ptrval sexp_of_buffer_ptr : buffer_ptr -> Sexplib0.Sexp.tinclude sig ... endtype nonrec buffer = buffer_ptr Ir.Backend_impl.bufferval sexp_of_buffer : buffer -> Sexplib0.Sexp.tval resolve_pool : device -> Ir.Backend_intf.buffer_loc -> buffer_ptrBackend-private buffer_loc -> base resolution, used by the backend's own transfer/link implementations. Not part of Backend_intf.