Source file CCCanonical_sexp.ml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
(** {1 Simple S-expression parsing/printing} *)

(** Result of a fallible operation; failures carry a human-readable
    message as a plain [string]. *)
type 'a or_error = ('a, string) result

(** Pull-based generator: each call yields the next item, if any.
    NOTE(review): presumably [None] signals exhaustion — confirm against
    the users of this type. *)
type 'a gen = unit -> 'a option

(** Minimal S-expression representation accepted by {!Make}; within this
    file the functor uses its [atom], [list] and [match_] operations. *)
module type SEXP = CCSexp_intf.BASIC_SEXP

(** Signature the default instantiation at the end of this file is
    constrained to. *)
module type S = CCSexp_intf.S0
(** Equality specialised to strings (avoids polymorphic comparison). *)
let equal_string (a : string) b = String.equal a b

(** Total order on strings; negative, zero or positive like
    [Stdlib.compare]. *)
let compare_string (a : string) b = String.compare a b
(** [_with_in filename f] opens [filename] for reading, applies [f] to the
    channel and closes the channel afterwards.

    [f] must itself return a [result] with a [string] error: any exception
    escaping [f] (or the subsequent close) is converted into
    [Error (Printexc.to_string exn)] after closing the channel again.
    Failure to open the file is {e not} caught: [open_in] runs outside the
    handler, so its exception propagates to the caller. *)
let _with_in filename f =
  let ic = open_in filename in
  let run () =
    let res = f ic in
    close_in ic;
    res
  in
  try run ()
  with exn ->
    close_in ic;
    Error (Printexc.to_string exn)
(** [_with_out filename f] opens [filename] for writing, applies [f] to the
    channel, closes the channel and returns the result of [f].

    If [f] (or the close that follows it) raises, the channel is closed and
    the same exception is re-raised. Failure to open the file propagates
    directly, since [open_out] runs outside the handler. *)
let _with_out filename f =
  let oc = open_out filename in
  let run () =
    let res = f oc in
    close_out oc;
    res
  in
  try run ()
  with exn ->
    close_out oc;
    raise exn
module Make (Sexp : SEXP) = struct
type t = Sexp.t
type sexp = t

(** Constructors re-exported from the underlying representation. *)
let atom = Sexp.atom
let list = Sexp.list

(** Scalars are encoded as atoms holding their standard textual form. *)
let of_int x = x |> string_of_int |> atom
let of_float x = x |> string_of_float |> atom
let of_bool x = x |> string_of_bool |> atom

(** Unit is the empty list. *)
let of_unit = list []

let of_list l = list l

(** [of_rev_list l] builds a list node from [l] in reverse order. *)
let of_rev_list l = List.rev l |> list

(** Tuples become fixed-length list nodes. *)
let of_pair (a, b) = list [ a; b ]
let of_triple (a, b, c) = list [ a; b; c ]
let of_quad (a, b, c, d) = list [ a; b; c; d ]

(** [of_variant name args] is the list whose head is the atom [name]
    followed by [args]. *)
let of_variant name args = list (atom name :: args)

(** [of_field name t] is the two-element list [(name t)]. *)
let of_field name t = list [ atom name; t ]

(** [of_record l] is a list with one {!of_field} entry per [(name, value)]
    pair of [l], in order. *)
let of_record l =
  list (List.map (fun (name, value) -> of_field name value) l)
(** {3 Printing} *)

(** [to_buf b t] appends the canonical encoding of [t] to [b]: an atom is
    written as its byte length in decimal, a colon, then its raw bytes; a
    list is written as its elements' encodings between parentheses, with
    no separator. *)
let rec to_buf b t =
  let emit_atom s =
    Buffer.add_string b (string_of_int (String.length s));
    Buffer.add_char b ':';
    Buffer.add_string b s
  and emit_list items =
    Buffer.add_char b '(';
    List.iter (to_buf b) items;
    Buffer.add_char b ')'
  in
  Sexp.match_ t ~atom:emit_atom ~list:emit_list

(** [to_string t] is the canonical encoding of [t] as a fresh string. *)
let to_string t =
  let buf = Buffer.create 128 in
  let () = to_buf buf t in
  Buffer.contents buf
(** [pp_noindent fmt t] prints the canonical encoding of [t] on [fmt].
    No break hints or boxes are emitted: atoms are printed as
    [<length>:<bytes>] and lists as parenthesised concatenations. *)
let rec pp_noindent fmt t =
  let pp_atom s =
    Format.pp_print_int fmt (String.length s);
    Format.pp_print_char fmt ':';
    Format.pp_print_string fmt s
  and pp_items items =
    Format.pp_print_char fmt '(';
    List.iter (pp_noindent fmt) items;
    Format.pp_print_char fmt ')'
  in
  Sexp.match_ t ~atom:pp_atom ~list:pp_items

(** The canonical form has a single layout, so [pp] is {!pp_noindent}. *)
let pp = pp_noindent
(** [to_chan oc t] writes the canonical encoding of [t] on the output
    channel [oc] (length-prefixed atoms, parenthesised lists). The channel
    is neither flushed nor closed here. *)
let rec to_chan oc t =
  let write_atom s =
    output_string oc (string_of_int (String.length s));
    output_char oc ':';
    output_string oc s
  and write_list items =
    output_char oc '(';
    List.iter (to_chan oc) items;
    output_char oc ')'
  in
  Sexp.match_ t ~atom:write_atom ~list:write_list
(** [to_file_iter filename iter] opens [filename] for writing and calls
    [iter] with a callback that writes each S-expression it receives to
    that file, one after the other with no separator. The file is closed
    when [iter] returns or raises. *)
let to_file_iter filename iter =
  let write_all oc = iter (to_chan oc) in
  _with_out filename write_all

(** [to_file filename t] writes the single S-expression [t] to
    [filename]. *)
let to_file filename t = to_file_iter filename (fun yield -> yield t)
(** {3 Parsing} *)

(** Character source consumed by the decoder functor defined just below.
    Implementations are stateful: each read consumes input. *)
module type INPUT = sig
(** Raised by the read functions when the input is exhausted. *)
exception EOF
(** [read_char ()] consumes and returns the next character.
    The decoder expects {!EOF} to be raised when no character is left. *)
val read_char : unit -> char
(** [read_string n] consumes the next [n] characters and returns them as
    a string. The decoder calls it with the length prefix it just parsed,
    to fetch the payload of an atom. *)
val read_string : int -> string
end
(** [Decoder (I)] parses canonical S-expressions from the character
    source [I]. Atoms are encoded as [<decimal length>:<bytes>] and lists
    as parenthesised sequences of expressions with no separators. *)
module Decoder (I : INPUT) = struct
  let[@inline] is_num_ c =
    Char.code c >= Char.code '0' && Char.code c <= Char.code '9'

  let[@inline] as_num_ c = Char.code c - Char.code '0'

  (** [next_ ()] reads one toplevel S-expression from [I].

      The boolean component is [true] only when the input was already
      exhausted before the first character could be read (clean end of
      input); in that case the result is [Error "unexpected EOF"].
      Malformed input, and input that ends in the middle of an
      expression, yield [Error _] with the boolean set to [false]. *)
  let next_ () : sexp or_error * bool =
    let rec read_string_len n =
      match I.read_char () with
      | c when is_num_ c ->
        let d = as_num_ c in
        (* Reject lengths no string can have; this also prevents the
           accumulator from silently overflowing into a negative or
           wrapped-around length. *)
        if n > (Sys.max_string_length - d) / 10 then
          failwith "string length too large";
        read_string_len ((n * 10) + d)
      | ':' ->
        let s = I.read_string n in
        atom s
      | _ -> failwith "expected string length"
    and eat_colon () =
      match I.read_char () with
      | ':' -> ()
      | _ -> failwith "expected ':'"
    and read_in_paren acc =
      match I.read_char () with
      | ')' -> list (List.rev acc)
      | c when is_num_ c ->
        let sexp = read_string_len (as_num_ c) in
        read_in_paren (sexp :: acc)
      | '(' ->
        let sexp = read_in_paren [] in
        read_in_paren (sexp :: acc)
      | _ -> failwith "expected list of sexprs"
    in
    try
      match I.read_char () with
      | exception I.EOF -> (Error "unexpected EOF", true)
      | '(' -> (Ok (read_in_paren []), false)
      | '0' ->
        (* at toplevel a leading zero can only be the empty atom "0:" *)
        eat_colon ();
        (Ok (atom ""), false)
      | c when is_num_ c -> (Ok (read_string_len (as_num_ c)), false)
      | _ -> (Error "unexpected char, expected toplevel sexpr", false)
    with
    | Failure e -> (Error e, false)
    (* The input ended after at least one character was consumed: the
       expression is truncated. Report it as an error instead of letting
       the input's EOF exception escape. *)
    | I.EOF -> (Error "unexpected EOF", false)

  (** [to_list ()] reads S-expressions until the input is cleanly
      exhausted and returns them in order. The first parse error aborts
      the whole read and is returned; any other exception is converted to
      [Error] using [Printexc.to_string]. *)
  let to_list () : _ or_error =
    let rec iter acc =
      match next_ () with
      | Error _, true -> Ok (List.rev acc)
      | Ok x, _ -> iter (x :: acc)
      | Error msg, false -> Error msg
    in
    try iter [] with e -> Error (Printexc.to_string e)

  (** [next_or_error ()] is {!next_} without the end-of-input flag. *)
  let[@inline] next_or_error () : _ or_error = fst (next_ ())
end
[@@inline]
(** Decoder reading from the in-memory string [X.s]. Each application of
    the functor gets its own cursor, starting at offset 0. *)
module Decoder_str (X : sig
  val s : string
end) =
Decoder (struct
  exception EOF

  (* cursor: offset of the next unread byte of [X.s] *)
  let i = ref 0
  let n = String.length X.s

  let read_char () =
    if !i >= n then raise_notrace EOF;
    (* in bounds thanks to the check above *)
    let c = String.unsafe_get X.s !i in
    incr i;
    c

  let read_string len =
    (* Compare against the number of bytes left rather than computing
       [!i + len], which can overflow for a huge declared length and
       let the check pass wrongly. [n - !i] is always >= 0. *)
    if len > n - !i then raise_notrace EOF;
    let res = String.sub X.s !i len in
    i := !i + len;
    res
end)
[@@inline]
(** [parse_string s] decodes the first S-expression found at the start of
    [s]. Whatever follows it in [s] is not examined. *)
let parse_string s : t or_error =
  let module Input = struct
    let s = s
  end in
  let module D = Decoder_str (Input) in
  D.next_or_error ()

(** [parse_string_list s] decodes all the S-expressions of [s], in
    order. *)
let parse_string_list s : t list or_error =
  let module Input = struct
    let s = s
  end in
  let module D = Decoder_str (Input) in
  D.to_list ()
(** Decoder reading from the input channel [X.ic]. End of input is
    signalled with the standard [End_of_file] exception. *)
module Decoder_ic (X : sig
  val ic : in_channel
end) =
Decoder (struct
  exception EOF = End_of_file

  let[@inline] read_char () = input_char X.ic

  (* [really_input_string] reads exactly [n] bytes and raises
     [End_of_file] (i.e. [EOF]) if the channel ends first. A hand-written
     loop around [input] must not be used without checking for a 0
     return value: [input] returns 0 at end of file, so such a loop never
     terminates on truncated data. *)
  let read_string n = really_input_string X.ic n
end)
[@@inline]
(** [parse_chan_ ?file ic] decodes one S-expression from [ic]. When
    [file] is given, error messages are suffixed with [ in '<file>']. *)
let parse_chan_ ?file ic : sexp or_error =
  let module D = Decoder_ic (struct
    let ic = ic
  end) in
  let res = D.next_or_error () in
  match res, file with
  | Ok _, _ | Error _, None -> res
  | Error msg, Some path -> Error (Printf.sprintf "%s in '%s'" msg path)

(** [parse_chan_list_ ?file ic] decodes every S-expression of [ic]. When
    [file] is given, error messages are suffixed with [ in '<file>']. *)
let parse_chan_list_ ?file ic =
  let module D = Decoder_ic (struct
    let ic = ic
  end) in
  let res = D.to_list () in
  match res, file with
  | Ok _, _ | Error _, None -> res
  | Error msg, Some path -> Error (Printf.sprintf "%s in '%s'" msg path)

(** Public entry points: same as above, without a file name to report. *)
let parse_chan ic = parse_chan_ ?file:None ic
let parse_chan_list ic = parse_chan_list_ ?file:None ic
(** [parse_chan_gen ic] is a generator over the S-expressions of [ic]:
    each call decodes the next expression and returns it (or the parse
    error) wrapped in [Some]; it returns [None] once the decoder reports
    that the input was exhausted before the next expression started. *)
let parse_chan_gen ic =
  let module D = Decoder_ic (struct
    let ic = ic
  end) in
  fun () ->
    let res, at_eof = D.next_ () in
    if at_eof then None else Some res
(** [parse_file filename] decodes one S-expression from the file
    [filename]; errors mention the file name. *)
let parse_file filename =
  _with_in filename (fun ic -> parse_chan_ ~file:filename ic)

(** [parse_file_list filename] decodes every S-expression of the file
    [filename]; errors mention the file name. *)
let parse_file_list filename =
  _with_in filename (fun ic -> parse_chan_list_ ~file:filename ic)
end
(** Default S-expression representation: either an atom holding a string,
    or a list of sub-expressions. *)
type t =
[ `Atom of string
| `List of t list
]
(** [equal a b] is structural equality: atoms are equal when their
    strings are equal, lists when they have the same length and are
    element-wise equal; an atom never equals a list. *)
let rec equal a b =
  match a with
  | `Atom s1 ->
    (match b with
     | `Atom s2 -> equal_string s1 s2
     | _ -> false)
  | `List l1 ->
    (match b with
     | `List l2 ->
       (* [List.for_all2] raises on a length mismatch: not equal *)
       (match List.for_all2 equal l1 l2 with
        | same -> same
        | exception Invalid_argument _ -> false)
     | _ -> false)
(** [compare_list a b] compares two lists of S-expressions
    lexicographically with {!compare}; a strict prefix is smaller than
    the longer list. *)
let rec compare_list a b =
  match a, b with
  | [], [] -> 0
  | [], _ :: _ -> -1
  | _ :: _, [] -> 1
  | x :: xs, y :: ys ->
    let c = compare x y in
    if c = 0 then compare_list xs ys else c

(** [compare a b] is a total order on S-expressions: atoms are ordered by
    their string, lists lexicographically, and every atom is smaller than
    every list. *)
and compare a b =
  match a with
  | `Atom s1 ->
    (match b with
     | `Atom s2 -> compare_string s1 s2
     | _ -> -1)
  | `List l1 ->
    (match b with
     | `List l2 -> compare_list l1 l2
     | _ -> 1)
(** Representation module handed to {!Make}: constructors and a
    case-analysis function over the polymorphic-variant type [t]. *)
module Basic_ = struct
  type nonrec t = t

  let atom s = `Atom s
  let list items = `List items

  (** [match_ x ~atom ~list] applies [atom] to the string of an atom, or
      [list] to the elements of a list. *)
  let match_ x ~atom ~list =
    match x with
    | `List items -> list items
    | `Atom s -> atom s
end
(* Expose the functor's operations at top level, instantiated on the
   polymorphic-variant representation [t] declared earlier in this file;
   [with type t := t] substitutes that existing type instead of
   redeclaring it. *)
include (Make (Basic_) : S with type t := t)