Skip to content

Commit

Permalink
Add documentation of the Codecs.Chain module.
Browse files Browse the repository at this point in the history
  • Loading branch information
zoj613 committed Jul 11, 2024
1 parent bae4aaa commit 02cc5d7
Showing 1 changed file with 43 additions and 0 deletions.
43 changes: 43 additions & 0 deletions lib/codecs/codecs.mli
Original file line number Diff line number Diff line change
@@ -1,69 +1,112 @@
(** An array has an associated list of codecs. Each codec specifies a
bidirectional transform (an encode transform and a decode transform).
This module contains building blocks for creating and working with
a chain of codecs. *)

module Ndarray = Owl.Dense.Ndarray.Generic

(** The type of [array -> array] codecs. *)
type arraytoarray =
[ `Transpose of int array ]

(** A type representing valid Gzip codec compression levels. *)
type compression_level =
| L0 | L1 | L2 | L3 | L4 | L5 | L6 | L7 | L8 | L9

(** A type representing [bytes -> bytes] codecs that produce
fixed sized encoded strings. *)
type fixed_bytestobytes =
[ `Crc32c ]

(** A type representing [bytes -> bytes] codecs that produce
variable sized encoded strings. *)
type variable_bytestobytes =
[ `Gzip of compression_level ]

(** The type of [bytes -> bytes] codecs. *)
type bytestobytes =
[ fixed_bytestobytes | variable_bytestobytes ]

(** A type representing the configured endianness of an array. *)
type endianness = Little | Big

(** A type representing the location of a shard's index array in
an encoded byte string. *)
type loc = Start | End

(** The type of [array -> bytes] codecs. *)
type arraytobytes =
[ `Bytes of endianness
| `ShardingIndexed of sharding_config ]

(** A type representing the Sharding indexed codec's configuration parameters. *)
and sharding_config =
{chunk_shape : int array
;codecs : bytestobytes shard_chain
;index_codecs : fixed_bytestobytes shard_chain
;index_location : loc}

(** A type representing the chain of codecs used to encode/decode
a shard's bytes and its index array. *)
and 'a shard_chain = {
a2a: arraytoarray list;
a2b: arraytobytes;
b2b: 'a list;
}

(** A type used to build a user-defined chain of codecs when creating a Zarr array. *)
type codec_chain = {
a2a: arraytoarray list;
a2b: arraytobytes;
b2b: bytestobytes list;
}

(** The type of errors returned upon failure when an calling a function
on a {!Chain} type. *)
type error =
[ `Extension of string
| `Gzip of Ezgzip.error
| `Transpose_order of int array * string
| `Sharding of int array * int array * string ]

(** A module containing functions to encode/decode an array chunk using a
predefined set of codecs. *)
module Chain : sig
(** A type representing a valid chain of codecs for
decoding/encoding a Zarr array chunk. *)
type t

(** [create r c] returns a type representing a chain of codecs defined by
chain [c] and decoded array representation type [r]. *)
val create :
('a, 'b) Util.array_repr -> codec_chain -> (t, [> error ]) result

(** [default] returns the default codec chain that contains only
the required codecs as defined in the Zarr Version 3 specification. *)
val default : t

(** [compute_encoded_size init t] returns the size (in bytes) of the
encoded byte string given the size [init] of its decoded representation. *)
val compute_encoded_size : int -> t -> int

(** [encode t x] computes the encoded byte string representation of
array chunk [x]. Returns an error upon failure. *)
val encode :
t -> ('a, 'b) Ndarray.t -> (string, [> error ]) result

(** [decode t repr x] decodes the byte string [x] using codec chain [t]
and decoded representation type [repr]. Returns an error upon failure.*)
val decode :
t -> ('a, 'b) Util.array_repr -> string -> (('a, 'b) Ndarray.t, [> error]) result

(** [x = y] returns true if chain [x] is equal to chain [y],
and false otherwise. *)
val ( = ) : t -> t -> bool

(** [of_yojson x] returns a code chain of type {!t} from its json object
representation. *)
val of_yojson : Yojson.Safe.t -> (t, string) result

(** [to_yojson x] returns a json object representation of codec chain [x]. *)
val to_yojson : t -> Yojson.Safe.t
end

0 comments on commit 02cc5d7

Please sign in to comment.