package email_message

  1. Overview
  2. Docs
Legend:
Page
Library
Module
Module type
Parameter
Class
Class type
Source

Source file bigstring_shared.ml

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
module Stable = struct
  open! Core.Core_stable

  module V1 = struct
    type t = Core.Bigstring.Stable.V1.t_frozen [@@deriving sexp, bin_io, compare, hash]

    let equal = [%compare.equal: t]
  end
end

type t = Stable.V1.t [@@deriving sexp_of, compare, hash, equal]

open Core
open Poly
open Bigstring

let to_bigstring t = t
let of_bigstring t = t
let to_string_monoid t = String_monoid.of_bigstring t
let of_string_monoid t = String_monoid.to_bigstring t
let to_string t = to_string t
let of_string s = of_string s
let empty = Bigstring.create 0
let length t = Bigstring.length t

let sub ?pos ?len t =
  let pos, len =
    match pos, len with
    | None, None -> 0, length t
    | None, Some len -> 0, len
    | Some pos, None -> pos, length t - pos
    | Some pos, Some len -> pos, len
  in
  Bigstring.sub_shared ~pos ~len t
;;

let to_lexbuf t =
  let offset = ref 0 in
  let len = length t in
  Lexing.from_function (fun dst n ->
    let read = min n (len - !offset) in
    Bigstring.To_bytes.blit ~src:t ~src_pos:!offset ~len:read ~dst ~dst_pos:0;
    offset := !offset + read;
    read)
;;

let foldi t ~init ~f =
  let len = length t in
  let rec loop init pos =
    if pos >= len then init else loop (f pos init t.{pos}) (pos + 1)
  in
  loop init 0
;;

(* Copied from String.split_lines. *)
let iter_lines_rev t ~f =
  let back_up_at_newline ~t ~pos ~eol =
    pos := !pos - if !pos > 0 && get t (!pos - 1) = '\r' then 2 else 1;
    eol := !pos + 1
  in
  let n = length t in
  if n = 0
  then ()
  else (
    (* Invariant: [-1 <= pos < eol]. *)
    let pos = ref (n - 1) in
    let eol = ref n in
    (* We treat the end of the string specially, because if the string ends with a
       newline, we don't want an extra empty string at the end of the output. *)
    if get t !pos = '\n' then back_up_at_newline ~t ~pos ~eol;
    while !pos >= 0 do
      if get t !pos <> '\n'
      then decr pos
      else (
        (* Becuase [pos < eol], we know that [start <= eol]. *)
        let start = !pos + 1 in
        f (sub t ~pos:start ~len:(!eol - start));
        back_up_at_newline ~t ~pos ~eol)
    done;
    f (sub t ~pos:0 ~len:!eol))
;;

let split_lines t =
  let acc = ref [] in
  iter_lines_rev t ~f:(fun line -> acc := line :: !acc);
  !acc
;;

let lines_seq ?include_empty_last_line t =
  let open Sequence.Generator in
  let open Sequence.Generator.Let_syntax in
  let rec traverse ~sol ~pos =
    let prev_char_is_cr = pos <> 0 && get t (pos - 1) = '\r' in
    if pos = length t
    then
      if (* Safe because [length t > 0] *)
         Option.is_some include_empty_last_line || not (get t (pos - 1) = '\n')
      then (
        let len = pos - sol in
        let%bind () = yield (sub t ~pos:sol ~len) in
        return ())
      else return ()
    else if get t pos <> '\n'
    then traverse ~sol ~pos:(pos + 1)
    else (
      let len = pos - sol - if prev_char_is_cr then 1 else 0 in
      let%bind () = yield (sub t ~pos:sol ~len) in
      let pos' = pos + 1 in
      traverse ~sol:pos' ~pos:pos')
  in
  if length t = 0 then Sequence.empty else Sequence.Generator.run (traverse ~sol:0 ~pos:0)
;;

let iter_lines t ~f = Sequence.iter (lines_seq t) ~f

let%expect_test "split_lines and iter_lines" =
  let split_lines t = split_lines (of_string t) |> List.map ~f:to_string in
  let split_lines_via_iter_lines t =
    let acc = ref [] in
    iter_lines (of_string t) ~f:(fun line -> acc := line :: !acc);
    List.rev_map !acc ~f:to_string
  in
  let impls =
    [ "Bigstring.iter_lines_rev", split_lines
    ; "Bigstring.iter_lines", split_lines_via_iter_lines
    ; "String.split_lines", String.split_lines
    ]
  in
  List.iter
    ~f:(fun s ->
      let results = List.map impls ~f:(fun (desc, f) -> desc, f s) in
      let all_equal =
        List.dedup_and_sort results ~compare:(fun (_, r1) (_, r2) ->
          [%compare: string list] r1 r2)
        |> List.length
        |> Int.equal 1
      in
      if not all_equal
      then
        raise_s
          [%message
            "Mismatching implementations"
              ~input:(s : string)
              ~_:(results : (string * string list) list)])
    [ ""
    ; "\n"
    ; "a"
    ; "a\n"
    ; "a\nb"
    ; "a\nb\n"
    ; "a\n\n"
    ; "a\n\nb"
    ; "a\r\n\nb"
    ; "\ra\r\n\nb"
    ; "\ra\r\n\nb\r"
    ; "\ra\r\n\nb\r\n"
    ]
;;

let of_bigbuffer_volatile buffer =
  (* If this isn't done, the buffer might contain extra uninitialized characters *)
  Bigstring.sub_shared
    ~pos:0
    ~len:(Bigbuffer.length buffer)
    (Bigbuffer.volatile_contents buffer)
;;

let substr_index ?(pos = 0) t ~pattern =
  if length pattern = 0
  then Some pos
  else (
    let c = Bigstring.get pattern 0 in
    let last_index = Bigstring.length t - Bigstring.length pattern in
    let rec loop pos =
      if pos > last_index
      then None
      else (
        match Bigstring.find c t ~pos ~len:(last_index - pos + 1) with
        | None -> None
        | Some pos ->
          assert (pos <= last_index);
          let found_ = Bigstring.sub_shared t ~pos ~len:(Bigstring.length pattern) in
          if Bigstring.equal pattern found_ then Some pos else loop (pos + 1))
    in
    loop pos)
;;
OCaml

Innovation. Community. Security.