package dream

  1. Overview
  2. Docs

Source file log.ml

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
(* This file is part of Dream, released under the MIT license. See LICENSE.md
   for details, or visit https://github.com/aantron/dream.

   Copyright 2021 Anton Bachin *)



(* Among other things, this module wraps the Logs library so as to prepend
   request ids to log messages.

   However, instead of prepending the id at the front end of Logs, in the
   wrappers, we prepend the id at the back end instead - in the reporter. The
   rationale for this is that we want to (try to) prepend the id even to strings
   that don't come from Dream or the user's Dream app, and thus *definitely* do
   not call this module's wrappers.

   The wrappers try to get the request id from their argument ~request, and pass
   it down to the reporter in a Logs tag.

   The reporter reads the tag and uses that request id if it is available. If
   the request id is not available, it is because the log message comes from a
   point in the Dream app where an id has not been assigned to the request, or
   because the log message comes from another dependency (or a sloppy call
   site!). In that case, the reporter tries to retrieve the id from the
   promise-chain-local storage of Lwt.

   This is sufficient for attaching a request id to most log messages, in
   practice. *)

module Message = Dream_pure.Message
module Method = Dream_pure.Method
module Status = Dream_pure.Status



type log_level = [
  | `Error
  | `Warning
  | `Info
  | `Debug
]



(* The logging middleware assigns request ids to requests, and tries to show
   them in the logs. The scheme works as follows:

   - Request ids are strings stored in request-local variables.
   - The automatically assigned request ids are taken from a simple global
     sequence.
   - The user can override the automatic request id by assigning a request id
     in a middleware that runs before the logger. User-provided request ids can
     be per-thread, can come from a proxy header, etc.
   - The logger makes a best effort to forward the request id to all logging
     statements that are being formatted. If the ~request argument is provided
     during a logging call, that request's id is shown. To handle all other
     cases, the logger puts the request's id into an Lwt sequence-associated
     storage key, and the log message formatter tries to get it from there. *)
(* TODO Necessary helpers for the user setting the request id are not yet
   exposed in the API, pending some other refactoring (request mutability). *)

let request_id_label = "dream.request_id"

(* Logs library tag uesd to pass an id from a request provided through
   ~request. *)
let logs_lib_tag : string Logs.Tag.def =
  Logs.Tag.def
    request_id_label
    Format.pp_print_string

(* Lwt sequence-associated storage key used to pass request ids for use when
   ~request is not provided. *)
let id_lwt_key : string Lwt.key =
  Lwt.new_key ()

(* The actual request id "field" associated with each request by the logger. If
   this field is missing, the logger assigns the request a fresh id. *)
let id_field =
  Message.new_field
    ~name:request_id_label
    ~show_value:(fun id -> id)
    ()

(* Makes a best-effort attempt to retrieve the request id. *)
let get_request_id ?request () =
  let request_id =
    match request with
    | None -> None
    | Some request -> Message.field request id_field
  in
  match request_id with
  | Some _ -> request_id
  | None -> Lwt.get id_lwt_key

(* The current state of the request id sequence. *)
let last_id =
  ref 0



(* TODO Nice logging for multiline strings? *)
(* The "back end." I inlined several examples from the Logs, Logs_lwt, and Fmt
   docs into each other, and modified the result, to arrive at this function.
   See those docs for the meanings of the various helpers and values.

   The reporter needs to be suspended in a function because Dream sets up the
   logger lazily; it doesn't query the output streams for whether they are TTYs
   until needed. Setting up the reporter before TTY checking will cause it to
   not output color. *)
let reporter ~now () =

  (* Format into an internal buffer. *)
  let buffer = Buffer.create 512 in
  let formatter = Fmt.with_buffer ~like:Fmt.stderr buffer in
  let flush () =
    let message = Buffer.contents buffer in
    Buffer.reset buffer;
    message
  in

  (* Gets called by Logs for each log call that passes its level threshold.
     ~over is to be called when the I/O underlying the log operation is fully
     complete. In practice, since most call sites are not using Lwt, they will
     continue executing anyway. This means that the message must be formatted
     and the buffer flushed before doing anything asynchronous, so that
     subsequent logging operations don't get into the same generation of the
     buffer.

     The user's_callback argument is not exactly the user's callback - it's the
     callback that got wrapped in function source (the "front end") below. That
     wrapper is the actual user's callback, and it calls user's_callback. *)
  let report src level ~over k user's_callback =

    let level_style, level =
      match level with
      | Logs.App ->     `White,   "     "
      | Logs.Error ->   `Red,     "ERROR"
      | Logs.Warning -> `Yellow,  " WARN"
      | Logs.Info ->    `Green,   " INFO"
      | Logs.Debug ->   `Blue,    "DEBUG"
    in

    let write _ =
      (* Get the formatted message out of the buffer right away, because we are
         doing Lwt operations next, and the caller might not wait. *)
      let message = flush () in

      (* Write the message. *)
      prerr_string message;
      Stdlib.flush stderr;
      over ();
      k ()
    in

    (* Call the user's callback to get the actual message and trigger
       formatting, and, eventually, writing. The wrappers don't use the ?header
       argument, so we ignore it. *)
    user's_callback @@ fun ?header ?tags format_and_arguments ->
      ignore header;

      (* Format the current local time. For the millisecond fraction, be careful
         of rounding 999.5+ to 1000 on output. *)
      let time =
        let unix_time = now () in
        let time = Option.get (Ptime.of_float_s unix_time) in
        let fraction =
          fst (modf unix_time) *. 1000. in
        let clamped_fraction =
          if fraction > 999. then 999.
          else fraction
        in
        let ((y, m, d), ((hh, mm, ss), _tz_offset_s)) =
          Ptime.to_date_time time in
        Printf.sprintf "%02i.%02i.%02i %02i:%02i:%02i.%03.0f"
          d m (y mod 100)
          hh mm ss clamped_fraction
      in

      (* Format the source name column. It is the right-aligned log source name,
         clipped to the column width. If the source is the default application
         source, leave the column empty. *)
      let source =
        let width = 15 in
        if Logs.Src.name src = Logs.Src.name Logs.default then
          String.make width ' '
        else
          let name = Logs.Src.name src in
          if String.length name > width then
            String.sub name (String.length name - width) width
          else
            (String.make (width - String.length name) ' ') ^ name
      in
      let source_prefix, source =
        try
          let dot_index = String.rindex source '.' + 1 in
          String.sub source 0 dot_index,
          String.sub source dot_index (String.length source - dot_index)
        with Not_found ->
          "", source
      in

      (* Check if a request id is available in the tags passed from the front
         end. If not, try to get it from the promise-chain-local storage. If
         we end up with a request id, format it. *)
      let request_id_from_tags =
        match tags with
        | None -> None
        | Some tags ->
          Logs.Tag.find logs_lib_tag tags
      in

      let request_id =
        match request_id_from_tags with
        | Some _ -> request_id_from_tags
        | None -> get_request_id ()
      in

      let request_id, request_style =
        match request_id with
        | Some "" | None -> "", `White
        | Some request_id ->
          (* The last byte of the request id is basically always going to be a
             digit, growing incrementally, so we can use the parity of its
             ASCII code to stripe the requests in the log. *)
          let last_byte = request_id.[String.length request_id - 1] in
          let color =
            if (Char.code last_byte) land 1 = 0 then
              `Cyan
            else
              `Magenta
          in
          " REQ " ^ request_id, color
      in

      (* The formatting proper. *)
      Format.kfprintf write formatter
        ("%a %a%s %a%a @[" ^^ format_and_arguments ^^ "@]@.")
        Fmt.(styled `Faint string) time
        Fmt.(styled `White string) source_prefix source
        Fmt.(styled level_style string) level
        Fmt.(styled request_style (styled `Italic string)) request_id
  in

  {Logs.report}



(* Lazy initialization upon first use or call to initialize. *)
let enable =
  ref true

let level =
  ref Logs.Info

let custom_log_levels : (string * Logs.level) list ref =
  ref []

let sources : (string * Logs.src) list ref =
  ref []

let set_printexc =
  ref true

let set_async_exception_hook =
  ref true

let _initialized = ref None

let to_logs_level l =
  match l with
  | `Error -> Logs.Error
  | `Warning -> Logs.Warning
  | `Info -> Logs.Info
  | `Debug -> Logs.Debug

exception Logs_are_not_initialized

let setup_logs =
  "\nTo initialize logs with a default reporter, and set up Dream, \
   do the following:\
   \n  If you are using MirageOS, use the Dream device in config.ml
   \n  If you are using Lwt/Unix, execute `Dream.log_initialize ()`
   \n"

let () = Printexc.register_printer @@ function
  | Logs_are_not_initialized ->
    Some ("The default logger is not yet initialized. " ^ setup_logs)
  | _ -> None

let initialized () : [ `Initialized ] =
  match !_initialized with
  | None -> raise Logs_are_not_initialized
  | Some v -> Lazy.force v

(* The "front end." *)
type ('a, 'b) conditional_log =
  ((?request:Message.request ->
   ('a, Stdlib.Format.formatter, unit, 'b) Stdlib.format4 -> 'a) -> 'b) ->
    unit

type sub_log = {
  error : 'a. ('a, unit) conditional_log;
  warning : 'a. ('a, unit) conditional_log;
  info : 'a. ('a, unit) conditional_log;
  debug : 'a. ('a, unit) conditional_log;
}

let sub_log ?level:level_ name =
  (* This creates a wrapper, as described above. The wrapper forwards to a
     logger of the Logs library, but instead of passing the formatter m to the
     user's callback, it passes a formatter m', which is like m, but lacks a
     ?tags argument. It has a ?request argument instead. If ~request is given,
     m' immediately tries to retrieve the request id, put it into a Logs tag,
     and call Logs' m with the user's formatting arguments and the tag. *)
  let forward ~(destination_log : _ Logs.log) user's_k =
    let `Initialized = initialized () in

    destination_log (fun log ->
      user's_k (fun ?request format_and_arguments ->
        let tags =
          match request with
          | None -> Logs.Tag.empty
          | Some request ->
            match get_request_id ~request () with
            | None -> Logs.Tag.empty
            | Some request_id ->
              Logs.Tag.add logs_lib_tag request_id Logs.Tag.empty
        in
        log ~tags format_and_arguments))
  in

  let level =
    List.find Option.is_some [
      Option.map to_logs_level level_;
      List.assoc_opt name !custom_log_levels;
      Some !level
    ] in

  (* Create the actual Logs source, and then wrap all the interesting
     functions. *)
  let src = Logs.Src.create name in
  let (module Log) = Logs.src_log src in
  Logs.Src.set_level src level;
  custom_log_levels :=
    (name, Option.get level)::(List.remove_assoc name !custom_log_levels);
  sources := (name, src) :: (List.remove_assoc name !sources);

  {
    error =   (fun k -> forward ~destination_log:Log.err   k);
    warning = (fun k -> forward ~destination_log:Log.warn  k);
    info =    (fun k -> forward ~destination_log:Log.info  k);
    debug =   (fun k -> forward ~destination_log:Log.debug k);
  }



let convenience_log format_and_arguments =
  Fmt.kstr
    (fun message ->
      let `Initialized = initialized () in
      Logs.app (fun log -> log "%s" message))
    format_and_arguments
  (* Logs.app (fun log -> log format_and_arguments) *)
  (* let report = Logs.((reporter ()).report) in
  report Logs.default Logs.App ~over:ignore ignore format_and_arguments *)



(* A helper used in several places. *)
let iter_backtrace f backtrace =
  backtrace
  |> String.split_on_char '\n'
  |> List.filter (fun line -> line <> "")
  |> List.iter f



(* Use the above function to create a log source for Log's own middleware, the
   same way any other middleware would. *)
let log =
  sub_log "dream.logger"



let set_up_exception_hook () =
  if !set_async_exception_hook then begin
    set_async_exception_hook := false;
    Lwt.async_exception_hook := fun exn ->
      let backtrace = Printexc.get_backtrace () in
      log.error (fun log -> log "Async exception: %s" (Printexc.to_string exn));
      backtrace
      |> iter_backtrace (fun line -> log.error (fun log -> log "%s" line))
  end

let initialize_log
    ?(backtraces = true)
    ?(async_exception_hook = true)
    ?level:level_
    ?enable:(enable_ = true)
    () =

  if backtraces then
    Printexc.record_backtrace true;
  set_printexc := false;

  if async_exception_hook then
    set_up_exception_hook ();
  set_async_exception_hook := false;

  let level_ =
    Option.map to_logs_level level_
    |> Option.value ~default:Logs.Info in

  enable := enable_;
  level := level_;
  let `Initialized = initialized () in
  ()

let set_log_level name level =
  (* If logging hasn't been initialized, trigger this so that
     configuration of log levels can proceed. *)
  let `Initialized = initialized () in
  let level = to_logs_level level in
  custom_log_levels :=
    (name, level)::(List.remove_assoc name !custom_log_levels);
  let src = List.assoc_opt name !sources in
  Option.iter (fun s -> Logs.Src.set_level s (Some level)) src

let fd_field : int Message.field =
  Message.new_field ~name:"dream.fd" ~show_value:string_of_int ()

module Make (Pclock : Mirage_clock.PCLOCK) =
struct
  let now () =
    Ptime.to_float_s (Ptime.v (Pclock.now_d_ps ()))

  let initializer_ ~setup_outputs = lazy begin
    if !enable then begin
      setup_outputs () ;
      Logs.set_level ~all:true (Some !level);
      !custom_log_levels |> List.iter (fun (name, level) ->
        List.assoc_opt name !sources
        |> Option.iter (fun source -> Logs.Src.set_level source (Some level)));
      Logs.set_reporter (reporter ~now ())
    end ;
    `Initialized
  end

  let set = ref false

  let initialize ~setup_outputs =
    if !set then Logs.debug (fun log -> log
      "Dream__log.initialize has already been called, ignoring this call.")
    else begin
      (try
        let `Initialized = initialized () in
        Format.eprintf
          "Dream__log.initialized has already been set, check that this call \
          is intentional";
        with
          Logs_are_not_initialized -> ());
      set := true;
      _initialized := Some (initializer_ ~setup_outputs)
    end

  (* The request logging middleware. *)
  let logger next_handler request =

    let start = now () in

    (* Turn on backtrace recording. *)
    if !set_printexc then begin
      Printexc.record_backtrace true;
      set_printexc := false
    end;

    (* Get the request's id or assign a new one. *)
    let id =
      match Message.field request id_field with
      | Some id -> id
      | None ->
        last_id := !last_id + 1;
        let id = string_of_int !last_id in
        Message.set_field request id_field id;
        id
    in

    let fd_string =
      match Message.field request fd_field with
      | None -> ""
      | Some fd -> " fd " ^ (string_of_int fd)
    in

    (* Identify the request in the log. *)
    let user_agent =
      Message.headers request "User-Agent"
      |> String.concat " "
    in

    log.info (fun log ->
      log ~request "%s %s %s%s %s"
        (Method.method_to_string (Message.method_ request))
        (Message.target request)
        (Helpers.client request)
        fd_string
        user_agent);

    (* Call the rest of the app. *)
    Lwt.try_bind
      (fun () ->
        Lwt.with_value id_lwt_key (Some id) (fun () ->
          next_handler request))
      (fun response ->
        (* Log the elapsed time. If the response is a redirection, log the
           target. *)
        let location =
          if Status.is_redirection (Message.status response) then
            match Message.header response "Location" with
            | Some location -> " " ^ location
            | None -> ""
          else ""
        in

        let status = Message.status response in

        let report :
          (?request:Message.request ->
            ('a, Format.formatter, unit, 'b) format4 -> 'a) -> 'b =
            fun log ->
          let elapsed = now () -. start in
          log ~request "%i%s in %.0f μs"
            (Status.status_to_int status)
            location
            (elapsed *. 1e6)
        in

        begin
          if Status.is_server_error status then
            log.error report
          else
            if Status.is_client_error status then
              log.warning report
            else
              log.info report
        end;

        Lwt.return response)

      (fun exn ->
        let backtrace = Printexc.get_backtrace () in
        (* In case of exception, log the exception. We alsp log the backtrace
           here, even though it is likely to be redundant, because some OCaml
           libraries install exception printers that will clobber the backtrace
           right during Printexc.to_string! *)
        log.warning (fun log ->
          log ~request "Aborted by: %s" (Printexc.to_string exn));

        backtrace
        |> iter_backtrace (fun line -> log.warning (fun log -> log "%s" line));

        Lwt.fail exn)
end



(* TODO DOC Include logging itself in the timing. Or? Isn't that pointless?
   End-to -end timing should include the HTTP parser as well. The logger
   provides much more useful information if it helps the user optimize the app.
   Sp, should probably craete some helpers for the user to do end-to-end timing
   of the HTTP server and document how to use them. *)
(* TODO DOC Add docs on how to avoid OCamlbuild dep. *)
(* TODO DOC why it's good to use the initializer early. *)

(* TODO LATER implement fire. *)
(* TODO LATER In case of streamed bodies, it is useful for the logger to be told
   by the HTTP layer when streaming was actually completed. *)
OCaml

Innovation. Community. Security.