Skip to content

Commit

Permalink
Support optional chunk_key_encoding configuration.
Browse files Browse the repository at this point in the history
Ensures that optional chunk_key_encoding configuration is honored.
If not specified a default value is used, and this default configuration
is not written to the jSON when serializing a metadata type.
  • Loading branch information
zoj613 committed Jul 11, 2024
1 parent 6589fb5 commit e2bf47c
Show file tree
Hide file tree
Showing 2 changed files with 56 additions and 25 deletions.
44 changes: 25 additions & 19 deletions lib/extensions.ml
Original file line number Diff line number Diff line change
Expand Up @@ -71,14 +71,14 @@ end

module ChunkKeyEncoding = struct
type kind = Default | V2
type t = {name : kind; sep : string}
type t = {name : kind; sep : string; is_default : bool}

let create = function
| `Dot -> {name = Default; sep = "."}
| `Slash -> {name = Default; sep = "/"}
| `Dot -> {name = Default; sep = "."; is_default = false}
| `Slash -> {name = Default; sep = "/"; is_default = false}

(* map a chunk coordinate index to a key. E.g, (2,3,1) maps to c/2/3/1 *)
let encode {name; sep} index =
let encode {name; sep; _} index =
let f i acc =
string_of_int i :: acc
in
Expand All @@ -95,31 +95,37 @@ module ChunkKeyEncoding = struct
Array.fold_right f index []

let ( = ) x y =
x.name = y.name && x.sep = y.sep
x.name = y.name && x.sep = y.sep && x.is_default = y.is_default

let to_yojson {name; sep} =
let to_yojson {name; sep; is_default} =
let str =
match name with
| Default -> "default"
| V2 -> "v2"
in
`Assoc
[("name", `String str)
;("configuration", `Assoc [("separator", `String sep)])]
if is_default then
`Assoc [("name", `String str)]
else
`Assoc
[("name", `String str)
;("configuration", `Assoc [("separator", `String sep)])]

let of_yojson x =
match
Util.get_name x,
Yojson.Safe.Util.(member "configuration" x |> to_assoc)
Util.get_name x, Yojson.Safe.Util.member "configuration" x
with
| "default", [("separator", `String "/")] ->
Ok {name = Default; sep = "/"}
| "default", [("separator", `String ".")] ->
Ok {name = Default; sep = "."}
| "v2", [("separator", `String "/")] ->
Ok {name = V2; sep = "/"}
| "v2", [("separator", `String ".")] ->
Ok {name = V2; sep = "."}
| "default", `Null ->
Ok {name = Default; sep = "/"; is_default = true}
| "default", `Assoc [("separator", `String "/")] ->
Ok {name = Default; sep = "/"; is_default = false}
| "default", `Assoc [("separator", `String ".")] ->
Ok {name = Default; sep = "."; is_default = false}
| "v2", `Null ->
Ok {name = V2; sep = "."; is_default = true}
| "v2", `Assoc [("separator", `String "/")] ->
Ok {name = V2; sep = "/"; is_default = false}
| "v2", `Assoc [("separator", `String ".")] ->
Ok {name = V2; sep = "."; is_default = false}
| _ -> Error "Invalid chunk key encoding configuration."
end

Expand Down
37 changes: 31 additions & 6 deletions test/test_metadata.ml
Original file line number Diff line number Diff line change
Expand Up @@ -183,8 +183,7 @@ let test_encode_decode_fill_value fv =
"fill_value": %s,
"chunk_grid":
{"name": "regular", "configuration": {"chunk_shape": [100, 10]}},
"chunk_key_encoding":
{"name": "default", "configuration": {"separator": "."}},
"chunk_key_encoding": {"name": "default"},
"attributes": {"question": 7}}|} fv
in
let expected = Yojson.Safe.from_string str in
Expand Down Expand Up @@ -267,8 +266,7 @@ let array = [
"zarr_format": 3,
"shape": [10000, 1000],
"data_type": "float64",
"chunk_key_encoding":
{"name": "v2", "configuration": {"separator": "."}},
"chunk_key_encoding": {"name": "v2"},
"codecs": [
{"name": "bytes", "configuration": {"endian": "big"}}],
"fill_value": "0x7fc00000",
Expand Down Expand Up @@ -340,8 +338,7 @@ let array = [
"node_type": "array",
"shape": [10000, 1000],
"data_type": "float64",
"chunk_key_encoding":
{"name": "v2", "configuration": {"separator": "."}},
"chunk_key_encoding": {"name": "v2"},
"codecs":
{"name": "bytes", "configuration": {"endian": "big"}},
"fill_value": "0x7fc00000",
Expand Down Expand Up @@ -469,6 +466,34 @@ let array = [
~str:(template {|"UNKNOWN"|} {|[2, 4]|})
~msg:"Invalid Chunk grid name or configuration.";

(* test if decoding a chunk key encoding field without a configuration
leads to a default value being used. *)
let str = {|{
"zarr_format": 3,
"shape": [10000, 1000],
"node_type": "array",
"data_type": "float64",
"codecs": [
{"name": "bytes", "configuration": {"endian": "big"}}],
"fill_value": "0x7fc00000",
"chunk_grid":
{"name": "regular", "configuration": {"chunk_shape": [10, 10]}},
"chunk_key_encoding": {"name": "v2"}}|} in
(match ArrayMetadata.of_yojson @@ Yojson.Safe.from_string str with
| Ok meta ->
(* we except it to use the default "." separator. *)
assert_equal
~printer:Fun.id "2.0.1" @@ ArrayMetadata.chunk_key meta [|2; 0; 1|];
(* we expect the default (unspecified) config seperator to be
dropped when serializing the metadata to JSON format. *)
assert_equal
~printer:Fun.id
Yojson.Safe.(from_string str |> to_string) @@
ArrayMetadata.encode meta;
| Error _ ->
assert_failure
"Decoding a well formed array JSON metadata should not fail.");

(* test if the decoding fails if chunk key encoding contains unknown
* separator or name. *)
let str = {|{
Expand Down

0 comments on commit e2bf47c

Please sign in to comment.