Utils: OcamlDoc for Data_encoding module.
This patch is coathored with @milodavis, @abate, and @klakplok.
This commit is contained in:
parent
e21672c4ac
commit
14597b8f7e
@ -7,7 +7,50 @@
|
||||
(* *)
|
||||
(**************************************************************************)
|
||||
|
||||
(** In memory JSON data *)
|
||||
(** Type-safe serialization and deserialization of data structures. *)
|
||||
|
||||
(** {1 Data Encoding} *)
|
||||
|
||||
(** This module provides type-safe serialization and deserialization of
|
||||
data structures. Backends are provided to both binary and JSON.
|
||||
|
||||
This works by writing type descriptors by hand, using the provided
|
||||
combinators. These combinators can fine-tune the binary
|
||||
representation to be compact and efficient, but also provide
|
||||
proper field names and meta information, so the API of Tezos can
|
||||
be automatically introspected and documented.
|
||||
|
||||
Here is an example encoding for type [(int * string)].
|
||||
|
||||
[let enc = obj2 (req "code" uint16) (req "message" string)]
|
||||
|
||||
In JSON, this encoding maps values of type [int * string] to JSON
|
||||
objects with a field [code] whose value is a number and a field
|
||||
[message] whose value is a string.
|
||||
|
||||
In binary, this encoding maps to two raw bytes for the [int]
|
||||
followed by the size of the string in bytes, and finally the raw
|
||||
contents of the string. This binary format is mostly tagless,
|
||||
meaning that serialized data cannot be interpreted without the
|
||||
encoding that was used for serialization.
|
||||
|
||||
Regarding binary serialization, encodings are classified as either:
|
||||
- fixed size (booleans, integers, numbers)
|
||||
data is always the same size for that type ;
|
||||
- dynamically sized (arbitrary strings and bytes)
|
||||
data is of unknown size and requires an explicit length field ;
|
||||
- variable size (special case of strings, bytes, and arrays)
|
||||
data makes up the remainder of an object of known size,
|
||||
thus its size is given by the context, and does not
|
||||
have to be serialized.
|
||||
|
||||
JSON operations are delegated to [ocplib-json-typed]. *)
|
||||
|
||||
(** The type for serializing or deserializing a value of type ['a]. *)
|
||||
type 'a encoding = 'a t
|
||||
and 'a t
|
||||
|
||||
(** In memory JSON data, compatible with [Ezjsonm]. *)
|
||||
type json =
|
||||
[ `O of (string * json) list
|
||||
| `Bool of bool
|
||||
@ -24,65 +67,163 @@ exception Duplicated_tag of int
|
||||
exception Invalid_tag of int * [ `Uint8 | `Uint16 ]
|
||||
exception Unexpected_enum of string * string list
|
||||
|
||||
type 'a t
|
||||
type 'a encoding = 'a t
|
||||
|
||||
val classify : 'a encoding -> [ `Fixed of int | `Dynamic | `Variable ]
|
||||
|
||||
val splitted : json:'a encoding -> binary:'a encoding -> 'a encoding
|
||||
|
||||
(** Special value [null] in JSON, nothing in binary. *)
|
||||
val null : unit encoding
|
||||
|
||||
(** Empty object (not included in binary, encoded as empty object in JSON). *)
|
||||
val empty : unit encoding
|
||||
|
||||
(** Unit value, ommitted in binary.
|
||||
Serialized as an empty object in JSON, accepts any object when deserializing. *)
|
||||
val unit : unit encoding
|
||||
|
||||
(** Constant string (data is not included in the binary data). *)
|
||||
val constant : string -> unit encoding
|
||||
|
||||
(** Signed 8 bit integer
|
||||
(data is encoded as a byte in binary and an integer in JSON). *)
|
||||
val int8 : int encoding
|
||||
|
||||
(** Unsigned 8 bit integer
|
||||
(data is encoded as a byte in binary and an integer in JSON). *)
|
||||
val uint8 : int encoding
|
||||
|
||||
(** Signed 16 bit integer
|
||||
(data is encoded as a short in binary and an integer in JSON). *)
|
||||
val int16 : int encoding
|
||||
|
||||
(** Unsigned 16 bit integer
|
||||
(data is encoded as a short in binary and an integer in JSON). *)
|
||||
val uint16 : int encoding
|
||||
|
||||
(** Signed 31 bit integer, which corresponds to type int on 32-bit OCaml systems
|
||||
(data is encoded as a 32 bit int in binary and an integer in JSON). *)
|
||||
val int31 : int encoding
|
||||
|
||||
(** Signed 32 bit integer
|
||||
(data is encoded as a 32-bit int in binary and an integer in JSON). *)
|
||||
val int32 : int32 encoding
|
||||
|
||||
(** Signed 64 bit integer
|
||||
(data is encodedas a 64-bit int in binary and a decimal string in JSON). *)
|
||||
val int64 : int64 encoding
|
||||
|
||||
(** Encoding of a boolean
|
||||
(data is encoded as a byte in binary and a boolean in JSON). *)
|
||||
val bool : bool encoding
|
||||
|
||||
(** Encoding of a string
|
||||
- default variable in width
|
||||
- encoded as a byte sequence in binary
|
||||
- encoded as a string in JSON. *)
|
||||
val string : string encoding
|
||||
|
||||
(** Encoding of arbitrary bytes
|
||||
(encoded via hex in JSON and directly as a sequence byte in binary). *)
|
||||
val bytes : MBytes.t encoding
|
||||
|
||||
(** Encoding of floating point number
|
||||
(encoded as a floating point number in JSON and a double in binary). *)
|
||||
val float : float encoding
|
||||
|
||||
(** Combinator to make an optional value
|
||||
(represented as a 1-byte tag followed by the data (or nothing) in binary
|
||||
and either the raw value or an empty object in JSON). *)
|
||||
val option : 'a encoding -> 'a option encoding
|
||||
|
||||
(** Combinator to make a {!result} value
|
||||
(represented as a 1-byte tag followed by the data of either type in binary,
|
||||
and either unwrapped value in JSON (the caller must ensure that both
|
||||
encodings do not collide)). *)
|
||||
val result : 'a encoding -> 'b encoding -> ('a, 'b) result encoding
|
||||
|
||||
(** Encode enumeration via association list
|
||||
(represented as a string in JSON and binary). *)
|
||||
val string_enum : (string * 'a) list -> 'a encoding
|
||||
|
||||
|
||||
(** Create encodings that produce data of a fixed length when binary encoded.
|
||||
See the preamble for an explanation. *)
|
||||
module Fixed : sig
|
||||
|
||||
(** Encode a fixed length string *)
|
||||
val string : int -> string encoding
|
||||
|
||||
(** Encode a fixed length byte sequence *)
|
||||
val bytes : int -> MBytes.t encoding
|
||||
end
|
||||
|
||||
(** Create encodings that produce data of a variable length when binary encoded.
|
||||
See the preamble for an explanation. *)
|
||||
module Variable : sig
|
||||
(** Encode a string *)
|
||||
val string : string encoding
|
||||
|
||||
(** Encode a byte sequence *)
|
||||
val bytes : MBytes.t encoding
|
||||
|
||||
(** Array encoding combinator *)
|
||||
val array : 'a encoding -> 'a array encoding
|
||||
|
||||
(** List encoding combinator *)
|
||||
val list : 'a encoding -> 'a list encoding
|
||||
end
|
||||
|
||||
(** Mark an encoding as being of dynamic size.
|
||||
Forces the size to be stored alongside content when needed.
|
||||
Usually used to fix errors from combining two encodings. *)
|
||||
val dynamic_size : 'a encoding -> 'a encoding
|
||||
|
||||
(** Recompute the encoding definition each time it is used.
|
||||
Useful for dynamically updating the encoding of values of an extensible
|
||||
type via a global reference (e.g. exceptions). *)
|
||||
val delayed : (unit -> 'a encoding) -> 'a encoding
|
||||
|
||||
(** Encodes raw JSON data (BSON is used for binary). *)
|
||||
val json : json encoding
|
||||
|
||||
(** Encodes a JSON schema (BSON encoded for binary). *)
|
||||
val json_schema : json_schema encoding
|
||||
|
||||
(** An enriched encoding to represent a component in a structured
|
||||
type, augmenting the encoding with a name and whether it is a
|
||||
required or optional. Fields are used to encode OCaml tuples as
|
||||
objects in JSON, and as sequences in binary, using combinator
|
||||
{!obj1} and the like. *)
|
||||
type 'a field
|
||||
|
||||
(** Required field. *)
|
||||
val req :
|
||||
?title:string -> ?description:string ->
|
||||
string -> 't encoding -> 't field
|
||||
|
||||
(** Optional field. Omitted entirely in JSON encoding if None.
|
||||
Omitted in binary if the only optional field in a [`Variable]
|
||||
encoding, otherwise a 1-byte prefix (`0` or `1`) tells if the
|
||||
field is present or not. *)
|
||||
val opt :
|
||||
?title:string -> ?description:string ->
|
||||
string -> 't encoding -> 't option field
|
||||
|
||||
(** Optional field of variable length.
|
||||
Only one can be present in a given object. *)
|
||||
val varopt :
|
||||
?title:string -> ?description:string ->
|
||||
string -> 't encoding -> 't option field
|
||||
|
||||
(** Required field with a default value.
|
||||
If the default value is passed, the field is omitted in JSON.
|
||||
The value is always serialized in binary. *)
|
||||
val dft :
|
||||
?title:string -> ?description:string ->
|
||||
string -> 't encoding -> 't -> 't field
|
||||
|
||||
(** {2 Constructors for objects with N fields} *)
|
||||
|
||||
(** These are serialized to binary by converting each internal object to binary
|
||||
and placing them in the order of the original object.
|
||||
These are serialized to JSON as a JSON object with the field names. *)
|
||||
|
||||
val obj1 :
|
||||
'f1 field -> 'f1 encoding
|
||||
val obj2 :
|
||||
@ -116,6 +257,12 @@ val obj10 :
|
||||
'f6 field -> 'f7 field -> 'f8 field -> 'f9 field -> 'f10 field ->
|
||||
('f1 * 'f2 * 'f3 * 'f4 * 'f5 * 'f6 * 'f7 * 'f8 * 'f9 * 'f10) encoding
|
||||
|
||||
(** {2 Constructors for tuples with N fields} *)
|
||||
|
||||
(** These are serialized to binary by converting each internal object to binary
|
||||
and placing them in the order of the original object.
|
||||
These are serialized to JSON as JSON arrays/lists. *)
|
||||
|
||||
val tup1 :
|
||||
'f1 encoding ->
|
||||
'f1 encoding
|
||||
@ -155,45 +302,103 @@ val tup10 :
|
||||
'f9 encoding -> 'f10 encoding ->
|
||||
('f1 * 'f2 * 'f3 * 'f4 * 'f5 * 'f6 * 'f7 * 'f8 * 'f9 * 'f10) encoding
|
||||
|
||||
(** {2 Combinators} *)
|
||||
|
||||
(** Create a larger object from the encodings of two smaller ones.
|
||||
@raise invalid_arg if both arguments are not objects. *)
|
||||
val merge_objs : 'o1 encoding -> 'o2 encoding -> ('o1 * 'o2) encoding
|
||||
|
||||
(** Create a large tuple encoding from two smaller ones.
|
||||
@raise invalid_arg if both values are not tuples. *)
|
||||
val merge_tups : 'a1 encoding -> 'a2 encoding -> ('a1 * 'a2) encoding
|
||||
|
||||
(** Array combinator. *)
|
||||
val array : 'a encoding -> 'a array encoding
|
||||
|
||||
(** List combinator. *)
|
||||
val list : 'a encoding -> 'a list encoding
|
||||
|
||||
(** Association list.
|
||||
An object in JSON, a list of pairs in binary. *)
|
||||
val assoc : 'a encoding -> (string * 'a) list encoding
|
||||
|
||||
(** A partial encoding to represent a case in a variant type. Hides
|
||||
the (existentially bound) type of the parameter to the specific
|
||||
case, providing its encoder, and converter functions to and from
|
||||
the union type. *)
|
||||
type 't case
|
||||
|
||||
(** Encodes a variant constructor. Takes the encoding for the specific
|
||||
parameters, a recognizer function that will extract the parameters
|
||||
in case the expected case of the variant is being serialized, and
|
||||
a constructor function for deserialization.
|
||||
|
||||
The tag must be less than the tag size of the union in which you use the case.
|
||||
An optional tag gives a name to a case and should be used to maintain
|
||||
compatibility.
|
||||
|
||||
If no tag is specified, tags are assigned by the union combinator. *)
|
||||
val case :
|
||||
?tag:int ->
|
||||
'a encoding -> ('t -> 'a option) -> ('a -> 't) -> 't case
|
||||
|
||||
(** Create a single encoding from a series of cases.
|
||||
|
||||
In JSON, all cases are tried one after the other. The caller must
|
||||
check for collisions.
|
||||
|
||||
In binary, a prefix tag is added to discriminate quickly between
|
||||
cases. The default is `Uint8 and you must use a `Uint16 if you are
|
||||
going to have more than 256 cases.
|
||||
|
||||
This function will raise an exception if it is given the empty list
|
||||
or if there are more cases than can fit in the tag size. *)
|
||||
val union :
|
||||
?tag_size:[ `Uint8 | `Uint16 ] -> 't case list -> 't encoding
|
||||
|
||||
(** Add documentation to an encoding. *)
|
||||
val describe :
|
||||
?title:string -> ?description:string ->
|
||||
't encoding ->'t encoding
|
||||
|
||||
(** Give a name to an encoding. *)
|
||||
val def : string -> 'a encoding -> 'a encoding
|
||||
|
||||
(** Provide a transformer from one encoding to a different one.
|
||||
|
||||
Used to simplify nested encodings or to change the generic tuples
|
||||
built by {obj1}, {tup1} and the like into proper records.
|
||||
|
||||
A schema may optionally be provided as documentation of the new encoding. *)
|
||||
val conv :
|
||||
('a -> 'b) -> ('b -> 'a) ->
|
||||
?schema:Json_schema.schema ->
|
||||
'b encoding -> 'a encoding
|
||||
|
||||
(** Combinator for recursive encodings. *)
|
||||
val mu : string -> ('a encoding -> 'a encoding) -> 'a encoding
|
||||
|
||||
module Json : sig
|
||||
|
||||
(** Create a {!Json_encoding.encoding} from an {encoding}. *)
|
||||
val convert : 'a encoding -> 'a Json_encoding.encoding
|
||||
|
||||
(** Generate a schema from an {!encoding}. *)
|
||||
val schema : 'a encoding -> json_schema
|
||||
|
||||
|
||||
(** Construct a JSON object from an encoding. *)
|
||||
val construct : 't encoding -> 't -> json
|
||||
|
||||
(** Destruct a JSON object into a value.
|
||||
Fail with an exception if the JSON object and encoding do not match.. *)
|
||||
val destruct : 't encoding -> json -> 't
|
||||
|
||||
(** JSON Error *)
|
||||
(** JSON Error. *)
|
||||
|
||||
type path = path_item list
|
||||
|
||||
(** A set of accessors that point to a location in a JSON object. *)
|
||||
and path_item =
|
||||
[ `Field of string
|
||||
(** A field in an object. *)
|
||||
@ -233,6 +438,12 @@ module Json : sig
|
||||
|
||||
end
|
||||
|
||||
(** Classify an encoding wrt. its binary serialization as explained in the preamble. *)
|
||||
val classify : 'a encoding -> [ `Fixed of int | `Dynamic | `Variable ]
|
||||
|
||||
(** Define different encodings for JSON and binary serialization. *)
|
||||
val splitted : json:'a encoding -> binary:'a encoding -> 'a encoding
|
||||
|
||||
module Binary : sig
|
||||
|
||||
val length : 'a encoding -> 'a -> int
|
||||
@ -250,7 +461,7 @@ module Binary : sig
|
||||
can be garbage-collected only when all the blocks are
|
||||
unreachable (because of the 'optimized' implementation of
|
||||
MBytes.sub used internally *)
|
||||
val to_bytes_list : ?copy_blocks:bool -> int -> 'a t -> 'a -> MBytes.t list
|
||||
val to_bytes_list : ?copy_blocks:bool -> int -> 'a encoding -> 'a -> MBytes.t list
|
||||
|
||||
(** This type is used when decoding binary data incrementally.
|
||||
- In case of 'Success', the decoded data, the size of used data
|
||||
@ -268,13 +479,13 @@ module Binary : sig
|
||||
'Fixed' or a 'Dynamic' size, otherwise an exception
|
||||
'Invalid_argument "streaming data with variable size"' is
|
||||
raised *)
|
||||
val read_stream_of_bytes : ?init:MBytes.t list -> 'a t -> 'a status
|
||||
val read_stream_of_bytes : ?init:MBytes.t list -> 'a encoding -> 'a status
|
||||
|
||||
(** Like read_stream_of_bytes, but only checks that the stream can
|
||||
be read. Note that this is an approximation because failures
|
||||
that may come from conversion functions present in encodings are
|
||||
not checked *)
|
||||
val check_stream_of_bytes : ?init:MBytes.t list -> 'a t -> unit status
|
||||
val check_stream_of_bytes : ?init:MBytes.t list -> 'a encoding -> unit status
|
||||
|
||||
val fixed_length : 'a encoding -> int option
|
||||
val fixed_length_exn : 'a encoding -> int
|
||||
|
Loading…
Reference in New Issue
Block a user