Arrayjit.Ops
Operation types shared by all backends; and precision types.
module Lazy = Utils.Lazy
type ('ocaml, 'impl) precision =
| Byte : (Base.char, uint8_elt) precision
| Half : (Base.float, float16_elt) precision
| Single : (Base.float, float32_elt) precision
| Double : (Base.float, float64_elt) precision
val sexp_of_precision :
'ocaml 'impl. ('ocaml -> Sexplib0.Sexp.t) ->
('impl -> Sexplib0.Sexp.t) ->
('ocaml, 'impl) precision ->
Sexplib0.Sexp.t
type prec =
| Void_prec
| Byte_prec of (Base.char, uint8_elt) precision
| Half_prec of (Base.float, float16_elt) precision
| Single_prec of (Base.float, float32_elt) precision
| Double_prec of (Base.float, float64_elt) precision
val byte : prec
val half : prec
val single : prec
val double : prec
val is_up_to_fp16 : prec -> bool
val sexp_of_prec : prec -> Base.Sexp.t
val prec_of_sexp : Base.Sexp.t -> prec
val precision_to_string : ('ocaml, 'elt_t) precision -> string
val prec_string : prec -> string
val prec_in_bytes : prec -> int
val c_typ_of_prec : prec -> string
val hum_typ_of_prec : prec -> string
See: tinygrad ops, CUDA Math API (intrinsics).
This is a redundant set of operations, aiming to expose hardware-supported "intrinsics", to reduce the need for backends to pattern-match and optimize. Also for convenience.
type init_op =
| Constant_fill of {
}
Fills in the numbers where the rightmost axis is contiguous. If strict=true
, loops over the provided values.
| Range_over_offsets
Fills in the offset number of each cell (i.e. how many cells away it is from the beginning).
*)| Standard_uniform
Draws the values from U(0,1).
*)| File_mapped of Base.string * prec
Reads the data using Unix.openfile
and Unix.map_file
.
Initializes or resets a array by filling in the corresponding numbers, at the appropriate precision.
val init_op_of_sexp : Sexplib0.Sexp.t -> init_op
val sexp_of_init_op : init_op -> Sexplib0.Sexp.t
val binop_of_sexp : Sexplib0.Sexp.t -> binop
val sexp_of_binop : binop -> Sexplib0.Sexp.t
val unop_of_sexp : Sexplib0.Sexp.t -> unop
val sexp_of_unop : unop -> Sexplib0.Sexp.t
val ternop_of_sexp : Sexplib0.Sexp.t -> ternop
val sexp_of_ternop : ternop -> Sexplib0.Sexp.t
val op_of_sexp : Sexplib0.Sexp.t -> op
val sexp_of_op : op -> Sexplib0.Sexp.t
val neutral_elem : binop -> Base.Float.t
Either the left-neutral or right-neutral element of the operation. Unspecified if the operation does not have a neutral element.
val interpret_binop : binop -> Base.Float.t -> Base.Float.t -> Base.Float.t
val interpret_unop : unop -> Base.Float.t -> Base.Float.t
val interpret_ternop :
ternop ->
Base.Float.t ->
Base.Float.t ->
Base.Float.t ->
Base.Float.t
Note: currently the %cd syntax only supports infix binops as assignment ops.
val is_binop_nice_infix : binop -> bool
val binop_cd_syntax : binop -> string
val binop_cd_fallback_syntax : binop -> string
In the %cd syntax, we support uncurried notation for binary ops in addition to the infix notation.
val is_assign_op : binop -> bool
val assign_op_cd_syntax : initialize_neutral:bool -> binop -> string
val unop_cd_syntax : unop -> string
Note: currently we do not support unary prefix symbols.
val ternop_cd_syntax : ternop -> string
In the %cd syntax, we use uncurried notation for ternary ops.
val c_rawptr_to_string : Base.nativeint -> prec -> Base.String.t
val rawptr_to_string_hum : Base.nativeint -> prec -> Base.String.t
val c_ptr_to_string : 'elem Ctypes.ptr -> prec -> Base.String.t
val ptr_to_string_hum : 'elem Ctypes.ptr -> prec -> Base.String.t
type global_identifier =
| C_function of Base.string
Calls a no-argument or indices-arguments C function.
*)| External_unsafe of {
}
| Merge_buffer of {
}
Each device has at most one merge buffer, which is re-used, and re-allocated as needed, by merge operations. The merge buffer is associated with the source node of the device's most recent device_to_device ~into_merge_buffer:true
operation.
val sexp_of_global_identifier : global_identifier -> Sexplib0.Sexp.t
val equal_global_identifier :
global_identifier ->
global_identifier ->
Base.bool
val compare_global_identifier :
global_identifier ->
global_identifier ->
Base.int