-
Notifications
You must be signed in to change notification settings - Fork 31
/
Copy pathstream.ml
359 lines (321 loc) · 12 KB
/
stream.ml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
(* Copyright (c) 2017 Anil Madhavapeddy <anil@recoil.org>
*
* Permission to use, copy, modify, and distribute this software for any
* purpose with or without fee is hereby granted, provided that the above
* copyright notice and this permission notice appear in all copies.
*
* THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
* WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
* MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
* ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
* WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
* ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
* OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. *)
open Types
module B = Yaml_ffi.M
module T = Yaml_types.M
type tag_directive = { handle : string; prefix : string } [@@deriving sexp]
let error_to_msg e =
match e with
| `None -> "No error"
| `Memory -> "Reader error"
| `Scanner -> "Scanner error"
| `Parser -> "Parser error"
| `Composer -> "Compose error"
| `Writer -> "Writer error"
| `Emitter -> "Emitter error"
| `E i -> "Unknown error code " ^ Int64.to_string i
let scalar_style_of_ffi s : scalar_style =
match s with
| `Any -> `Any
| `Plain -> `Plain
| `Single_quoted -> `Single_quoted
| `Double_quoted -> `Double_quoted
| `Literal -> `Literal
| `Folded -> `Folded
| `E err ->
raise (Invalid_argument ("invalid scalar style" ^ Int64.to_string err))
let layout_style_of_ffi s : layout_style =
match s with
| `Any -> `Any
| `Block -> `Block
| `Flow -> `Flow
| `E err ->
raise (Invalid_argument ("invalid mapping style" ^ Int64.to_string err))
let layout_style_of_ffi s : layout_style =
match s with
| `Any -> `Any
| `Block -> `Block
| `Flow -> `Flow
| `E err ->
raise (Invalid_argument ("invalid sequence style" ^ Int64.to_string err))
let encoding_of_ffi e : encoding =
match e with
| `Any -> `Any
| `Utf16be -> `Utf16be
| `Utf16le -> `Utf16le
| `Utf8 -> `Utf8
| `E err ->
raise (Invalid_argument ("invalid encoding " ^ Int64.to_string err))
let tag_directive_of_ffi e =
let open Ctypes in
let handle = !@(e |-> T.Tag_directive.handle) in
let prefix = !@(e |-> T.Tag_directive.prefix) in
{ handle; prefix }
let list_of_tag_directives tds =
let open Ctypes in
let module TEDT = T.Event.Document_start.Tag_directives in
let hd = !@(tds |-> TEDT.start) in
(* TODO not clear how to parse this as not a linked list *)
let acc = [ hd ] in
List.map tag_directive_of_ffi acc
let version_of_directive ~major ~minor =
match (major, minor) with
| 1, 1 -> `V1_1
| 1, 2 -> `V1_2
| _ ->
raise
(Invalid_argument
(Printf.sprintf "Unsupported Yaml version %d.%d" major minor))
let directive_of_version = function `V1_1 -> (1, 1) | `V1_2 -> (1, 2)
module Mark = struct
type t = { index : int; line : int; column : int } [@@deriving sexp]
let of_ffi m =
let open Ctypes in
let int_field f = getf m f |> Unsigned.Size_t.to_int in
let index = int_field T.Mark.index in
let line = int_field T.Mark.line in
let column = int_field T.Mark.column in
{ index; line; column }
end
module Event = struct
type pos = { start_mark : Mark.t; end_mark : Mark.t }
type t =
| Stream_start of { encoding : encoding }
| Document_start of { version : version option; implicit : bool }
| Document_end of { implicit : bool }
| Mapping_start of {
anchor : string option;
tag : string option;
implicit : bool;
style : layout_style;
}
| Mapping_end
| Stream_end
| Scalar of scalar
| Sequence_start of {
anchor : string option;
tag : string option;
implicit : bool;
style : layout_style;
}
| Sequence_end
| Alias of { anchor : string }
| Nothing
let of_ffi e : t * pos =
let open T.Event in
let open Ctypes in
let ty = getf e _type in
let data = getf e data in
let start_mark = getf e start_mark |> Mark.of_ffi in
let end_mark = getf e end_mark |> Mark.of_ffi in
let pos = { start_mark; end_mark } in
let r =
match ty with
| `Stream_start ->
let start = getf data Data.stream_start in
let encoding = getf start Stream_start.encoding |> encoding_of_ffi in
Stream_start { encoding }
| `Document_start ->
let ds = getf data Data.document_start in
let version =
let vd = getf ds Document_start.version_directive in
match vd with
| None -> None
| Some vd ->
let vd = !@vd in
let major = getf vd T.Version_directive.major in
let minor = getf vd T.Version_directive.minor in
Some (version_of_directive ~major ~minor)
in
let implicit = getf ds Document_start.implicit <> 0 in
Document_start { version; implicit }
| `Mapping_start ->
let ms = getf data Data.mapping_start in
let anchor = getf ms Mapping_start.anchor in
let tag = getf ms Mapping_start.tag in
let implicit = getf ms Mapping_start.implicit <> 0 in
let style = getf ms Mapping_start.style |> layout_style_of_ffi in
Mapping_start { anchor; tag; implicit; style }
| `Scalar ->
let s = getf data Data.scalar in
let anchor = getf s Scalar.anchor in
let tag = getf s Scalar.tag in
let value = getf s Scalar.value in
let plain_implicit = getf s Scalar.plain_implicit <> 0 in
let quoted_implicit = getf s Scalar.quoted_implicit <> 0 in
let style = getf s Scalar.style |> scalar_style_of_ffi in
Scalar { anchor; tag; value; plain_implicit; quoted_implicit; style }
| `Document_end ->
let de = getf data Data.document_end in
let implicit = getf de Document_end.implicit <> 0 in
Document_end { implicit }
| `Sequence_start ->
let ss = getf data Data.sequence_start in
let anchor = getf ss Sequence_start.anchor in
let tag = getf ss Sequence_start.tag in
let implicit = getf ss Sequence_start.implicit <> 0 in
let style = getf ss Sequence_start.style |> layout_style_of_ffi in
Sequence_start { anchor; tag; implicit; style }
| `Sequence_end -> Sequence_end
| `Mapping_end -> Mapping_end
| `Stream_end -> Stream_end
| `Alias ->
let a = getf data Data.alias in
let anchor =
match getf a Alias.anchor with
| None -> raise (Invalid_argument "empty anchor alias")
| Some a -> a
in
Alias { anchor }
| `None -> Nothing
| `E i ->
raise
(Invalid_argument
("Unexpected event, internal library error " ^ Int64.to_string i))
in
(r, pos)
end
let version = B.version
let get_version () =
let major = Ctypes.(allocate int 0) in
let minor = Ctypes.(allocate int 0) in
let patch = Ctypes.(allocate int 0) in
B.get_version major minor patch;
let major = Ctypes.(!@major) in
let minor = Ctypes.(!@minor) in
let patch = Ctypes.(!@patch) in
(major, minor, patch)
type parser = {
p : T.Parser.t Ctypes.structure Ctypes.ptr;
event : T.Event.t Ctypes.structure Ctypes.ptr;
buf : char Ctypes_static.carray;
}
let parser str =
let p = Ctypes.(allocate_n T.Parser.t ~count:1) in
let event = Ctypes.(allocate_n T.Event.t ~count:1) in
let r = B.parser_init p in
let buf = Ctypes.CArray.of_string str in
let buf_ptr = Ctypes.CArray.start buf in
let len = String.length str |> Unsigned.Size_t.of_int in
B.parser_set_input_string p buf_ptr len;
match r with
| 1 -> Ok { buf; p; event }
| n -> Error (`Msg ("error initialising parser: " ^ string_of_int n))
let do_parse { p; event } =
let open Ctypes in
let r = B.parser_parse p event in
let describe_problem () =
match Ctypes.(getf !@p T.Parser.problem) with
| None -> "(no problem description)"
| Some s ->
let pv = Ctypes.(getf !@p T.Parser.problem_value) in
let po = Ctypes.(getf !@p T.Parser.problem_offset) in
s
^ " character "
^ string_of_int pv
^ " position "
^ Unsigned.Size_t.to_string po
in
match r with
| 1 -> Event.of_ffi !@event |> Result.ok
| n ->
Error
(`Msg
("error calling parser: "
^ describe_problem ()
^ " returned: "
^ string_of_int n))
type emitter = {
e : T.Emitter.t Ctypes.structure Ctypes.ptr;
event : T.Event.t Ctypes.structure Ctypes.ptr;
buf : char Ctypes.ptr;
written : Unsigned.size_t Ctypes.ptr;
}
let emitter_written { written; _ } =
Ctypes.(!@written) |> Unsigned.Size_t.to_int
let emitter ?(len = 65535 * 4) () =
let e = Ctypes.(allocate_n T.Emitter.t ~count:1) in
let event = Ctypes.(allocate_n T.Event.t ~count:1) in
let written = Ctypes.allocate_n Ctypes.size_t ~count:1 in
let r = B.emitter_init e in
let buf = Ctypes.(allocate_n Ctypes.char ~count:len) in
let len = Unsigned.Size_t.of_int len in
B.emitter_set_output_string e buf len written;
match r with
| 1 -> Ok { e; event; written; buf }
| n -> Error (`Msg ("error initialising emitter: " ^ string_of_int n))
let emitter_buf { buf; written } =
let length = Ctypes.(!@written) |> Unsigned.Size_t.to_int in
Ctypes.string_from_ptr buf ~length
let check l a =
match a with
| 0 -> Error (`Msg (l ^ " failed"))
| 1 -> Ok ()
| n -> Error (`Msg ("unexpected return value: " ^ string_of_int n))
let check_emit l { e; event } a =
Result.bind (check l a) @@ fun () -> check l @@ B.emitter_emit e event
let stream_start t encoding =
check_emit "stream_start" t
@@ B.stream_start_event_init t.event (encoding :> T.Encoding.t)
let stream_end t = check_emit "stream_end" t @@ B.stream_end_event_init t.event
let document_start ?version ?(implicit = true) t =
let open Ctypes in
let ver =
match version with
| None -> from_voidp T.Version_directive.t null
| Some v ->
let major, minor = directive_of_version v in
let v = make T.Version_directive.t in
setf v T.Version_directive.major major;
setf v T.Version_directive.minor minor;
allocate T.Version_directive.t @@ v
in
let tag = from_voidp T.Tag_directive.t null in
check_emit "doc_start" t
@@ B.document_start_event_init t.event ver tag tag implicit
let document_end ?(implicit = true) t =
check_emit "doc_end" t @@ B.document_end_event_init t.event implicit
let scalar { plain_implicit; quoted_implicit; anchor; tag; style; value } t =
check_emit "scalar" t
@@ B.scalar_event_init t.event anchor tag value (String.length value)
plain_implicit quoted_implicit
(style :> T.Scalar_style.t)
let sequence_start ?anchor ?tag ?(implicit = true) ?(style = `Block) t =
check_emit "seq_start" t
@@ B.sequence_start_event_init t.event anchor tag implicit
(style :> T.Sequence_style.t)
let sequence_end t = check_emit "seq_end" t @@ B.sequence_end_event_init t.event
let mapping_start ?anchor ?tag ?(implicit = true) ?(style = `Block) t =
check_emit "mapping_start" t
@@ B.mapping_start_event_init t.event anchor tag implicit
(style :> T.Mapping_style.t)
let mapping_end t =
check_emit "mapping_end" t @@ B.mapping_end_event_init t.event
let alias t value = check_emit "alias" t @@ B.alias_event_init t.event value
let emit t =
let open Event in
function
| Stream_start { encoding } -> stream_start t encoding
| Document_start { version; implicit } -> document_start ?version ~implicit t
| Document_end { implicit } -> document_end ~implicit t
| Mapping_start { anchor; tag; implicit; style } ->
mapping_start ?anchor ?tag ~implicit ~style t
| Mapping_end -> mapping_end t
| Stream_end -> stream_end t
| Scalar s -> scalar s t
| Sequence_start { anchor; tag; implicit; style } ->
sequence_start ?anchor ?tag ~implicit ~style t
| Sequence_end -> sequence_end t
| Alias { anchor } -> alias t anchor
| Nothing -> Ok ()