Backend_intf.Backend
include Backend_common
include Backend_any_common
val sexp_of_code : code -> Sexplib0.Sexp.t
val sexp_of_code_batch : code_batch -> Sexplib0.Sexp.t
val compile :
?name:Base.string ->
Indexing.unit_bindings ->
Assignments.comp ->
code
name
is used to derive names for compilation artifacts. If omitted, it's derived via Assignments.get_name_exn
.
val compile_batch :
?names:Base.string Base.array ->
?occupancy:(name:Base.string -> src_n:Base.int -> Base.bool) ->
Indexing.unit_bindings ->
Assignments.comp Base.array ->
code_batch
compile_batch
vs. compile
is mostly about improving the compile time and debugging convenience by generating fewer files -- ideally does not affect execution, but there can be backend-specific differences. Only array entries for which occupancy
returns true are included. names
are used to derive names for compilation artifacts. If omitted, they're derived via Assignments.get_name_exn
.
include Backend_device_common with type buffer_ptr := buffer_ptr
include Device with type buffer_ptr := buffer_ptr
include Device_types with type buffer_ptr := buffer_ptr
include Device_config with type buffer_ptr := buffer_ptr
include Buffer with type buffer_ptr := buffer_ptr
include sig ... end
val sexp_of_dev : dev -> Sexplib0.Sexp.t
val sexp_of_runner : runner -> Sexplib0.Sexp.t
An event tracks if a stream finished computing past a particular point in its schedue. These values are used internally for scheduling across streams of the backend, and can be used for explicit scheduling.
val sexp_of_event : event -> Sexplib0.Sexp.t
type nonrec device = (buffer_ptr, dev, runner, event) device
val sexp_of_device : device -> Sexplib0.Sexp.t
type nonrec stream = (buffer_ptr, dev, runner, event) stream
val sexp_of_stream : stream -> Sexplib0.Sexp.t
type nonrec context = (buffer_ptr, stream) context
val sexp_of_context : context -> Sexplib0.Sexp.t
include Alloc_buffer
with type buffer_ptr := buffer_ptr
and type stream := stream
include Buffer with type buffer_ptr := buffer_ptr
include sig ... end
val alloc_buffer :
?old_buffer:buffer_ptr buffer ->
size_in_bytes:Base.int ->
stream ->
buffer_ptr buffer
val alloc_zero_init_array :
Ops.prec ->
dims:Base.int Base.array ->
stream ->
buffer_ptr
val free_buffer : (stream -> buffer_ptr -> Base.unit) Base.option
val make_context : ?ctx_arrays:buffer_ptr ctx_arrays -> stream -> context
Returns a context without a parent.
val make_child : ?ctx_arrays:buffer_ptr ctx_arrays -> context -> context
Returns a context with the same Backend_intf.context.stream
, and Backend_intf.context.ctx_arrays
if omitted, as the given context's, which is also the Backend_intf.context.parent
.
val get_name : stream -> Base.string
include Backend_any_common with type buffer_ptr := buffer_ptr
include Buffer with type buffer_ptr := buffer_ptr
val sexp_of_buffer_ptr : buffer_ptr -> Sexplib0.Sexp.t
include sig ... end
type nonrec buffer = buffer_ptr buffer
val sexp_of_buffer : buffer -> Sexplib0.Sexp.t
type nonrec ctx_arrays = buffer_ptr ctx_arrays
val sexp_of_ctx_arrays : ctx_arrays -> Sexplib0.Sexp.t
val initialize : config -> Base.unit
Initializes a backend before first use. Typically does nothing if the backend is already initialized, but some backends can do some safe cleanups.
Returns false if there was no previous initialize
call. If it returns false, one must call initialize
before using the backend.
val sync : event -> Base.unit
Blocks till the event completes, if it's not done already.
It is rarely needed to call sync
explicitly, because it should always be called internally when necessary, in particular before extracting values from host.
val is_done : event -> Base.bool
Whether the event completed.
Schedules waiting for the given event on the context's stream.
NOTE: it should rarely be needed to call will_wait_for
explicitly, because it should always be called internally when necessary.
val get_used_memory : device -> Base.int
Returns (an upper bound of) the memory used for arrays, in bytes.
Global debug information; backend-specific and might evolve independently on the backends.
val get_debug_info : stream -> Base.Sexp.t
Per-stream debug information; backend-specific and might evolve independently on the backends
val await : stream -> Base.unit
Blocks till the stream becomes idle, i.e. synchronizes the stream.
Returns the event indicating if any currently running or scheduled computations on the stream have completed.
val is_idle : stream -> Base.bool
Whether the stream is currently waiting for work.
val get_device : ordinal:Base.int -> device
val suggested_num_streams : device -> Base.int
The optimal number of streams for the given device to follow the Backend_intf.config
strategy.
Returns the routine for the code's procedure, in a new context derived from the given context.
val link_batch :
context ->
code_batch ->
context * context routine Base.option Base.array
Returns the routines for the procedures included in the code batch. The returned context is downstream of all the returned routines.
include With_buffer_retrieval_and_syncing
with type device := device
and type context := context
and type event := event
If the tensor node is both hosted and in-context, schedules a copy from host to context and returns true, otherwise returns false.
If the tensor node is both hosted and in-context, schedules a copy from context to host and returns true, otherwise returns false.
val device_to_device :
Tnode.t ->
into_merge_buffer:merge_buffer_use ->
dst:context ->
src:context ->
Base.bool
device_to_device tn ~into_merge_buffer ~dst ~src
proceeds as follows:
src
context and either it is present in the dst
context or into_merge_buffer
is different from No
: raises an error.dst
and into_merge_buffer=No
: returns false.src
to finish, if any.into_merge_buffer=No
: schedules a copy of the tensor node from src
to dst
and updates the writer event for the node.into_merge_buffer
is different from No
: sets on dst
the merge buffer source to the given node.into_merge_buffer=Streaming_for task
, remembers the buffer pointer of the source node to use for streaming, runs task
-- intended to be the routine making use of the merge buffer, and initializes the merge buffer's streaming event.into_merge_buffer=Copy
, schedules copying from src
to the merge buffer of dst
's stream, and updates the writer event for the merge buffer.val sync_device : device -> Base.unit
Synchronizes all the streams on a device, and cleans up (removes) all associated events.