package albatross

  1. Overview
  2. Docs

Source file vmm_vmmd.ml

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
(* (c) 2017, 2018 Hannes Mehnert, all rights reserved *)

open Vmm_core

let ( let* ) = Result.bind

type 'a t = {
  console_counter : int64 ;
  stats_counter : int64 ;
  resources : Vmm_resources.t ;
  waiters : 'a String_map.t ;
  restarting : String_set.t ;
}
(* the life of a unikernel
   - once started, if restart-on-fail is enabled, a waiter will be add to t.waiters
   - if the waitpid () returns (i.e. unikernel has finished execution),
     a lookup in the t.waiters map will potentially result in a Lwt.task to be notified
   - if there is such a task, for this brief moment the t.restarting set will
     be populated with the unikernel name. this allows to destroy boot-looping
     unikernels (see #39)
   - once the restart-on-fail task is triggered (executing), it will first look
     whether the t.restarting set still contains the unikernel name, and then
     remove that name from t.restarting and create the unikernel again

   - the killall command (on albatross_daemon restart) uses the waiters map to
     wait for all unikernels to have exited and resources are cleaned up (see
     #37, since otherwise tap devices are kept around)
*)

let in_shutdown = ref false

let remove_resources t name =
  let resources = match Vmm_resources.remove_vm t.resources name with
    | Error (`Msg e) ->
      Logs.warn (fun m -> m "%s while removing vm %a from resources" e Name.pp name) ;
      t.resources
    | Ok resources -> resources
  in
  { t with resources }

let dump_unikernels t =
  let unikernels = Vmm_trie.all t.resources.Vmm_resources.unikernels in
  let trie = List.fold_left (fun t (name, unik) ->
      fst @@ Vmm_trie.insert name unik.Unikernel.config t)
      Vmm_trie.empty unikernels
  in
  let data = Vmm_asn.unikernels_to_cstruct trie in
  match Vmm_unix.dump data with
  | Error (`Msg msg) -> Logs.err (fun m -> m "failed to dump unikernels: %s" msg)
  | Ok () -> Logs.info (fun m -> m "dumped current state")

let waiter t id =
  let t = remove_resources t id in
  let name = Name.to_string id in
  if not !in_shutdown then dump_unikernels t ;
  match String_map.find_opt name t.waiters with
  | None -> t, None
  | Some waiter ->
    let waiters = String_map.remove name t.waiters in
    let restarting = String_set.add name t.restarting in
    { t with waiters ; restarting }, Some waiter

let register t id create =
  let name = Name.to_string id in
  let task, waiter = create () in
  { t with waiters = String_map.add name waiter t.waiters }, task

let register_restart t id create =
  let name = Name.to_string id in
  match String_map.find_opt name t.waiters with
  | Some _ -> Logs.err (fun m -> m "restart attempted to overwrite waiter"); None
  | _ -> Some (register t id create)

let may_restart t id =
  let n = Name.to_string id in
  if String_set.mem n t.restarting then
    let restarting = String_set.remove n t.restarting in
    { t with restarting }, true
  else
    t, false

let stop_create t id =
  let name = Name.to_string id in
  match String_map.find_opt name t.waiters with
  | None ->
    let t, may = may_restart t id in
    if may then
      Ok (t, `End (`Success (`String "destroyed: removed from restarting")))
    else
      Error (`Msg "destroy: not found")
  | Some _ ->
    let waiters = String_map.remove name t.waiters in
    let t = { t with waiters } in
    Ok (t, `End (`Success (`String "destroyed: removed waiter")))

let killall t create =
  let vms = Vmm_trie.all t.resources.Vmm_resources.unikernels in
  in_shutdown := true ;
  let t, xs = List.fold_left
      (fun (t, acc) (id, _) ->
         let (t, a) = register t id create in
         (t, a :: acc))
      (t, []) vms in
  List.iter Vmm_unix.destroy (List.map snd vms) ;
  t, xs

let empty = {
  console_counter = 1L ;
  stats_counter = 1L ;
  resources = Vmm_resources.empty ;
  waiters = String_map.empty ;
  restarting = String_set.empty ;
}

let init_block_devices t =
  match Vmm_unix.find_block_devices () with
  | Error (`Msg msg) ->
    Logs.warn (fun m -> m "couldn't find block devices %s" msg) ;
    t
  | Ok devs ->
    let resources =
      List.fold_left (fun r (id, size) ->
          match Vmm_resources.insert_block r id size with
          | Error (`Msg msg) ->
            Logs.err (fun m -> m "couldn't insert block device %s (%dMB): %s" (Name.to_string id) size msg) ;
            r
          | Ok r -> r)
        t.resources devs
    in
    { t with resources }

type 'a create =
  Vmm_commands.wire *
  ('a t -> ('a t * Vmm_commands.wire * Vmm_commands.res * Name.t * Unikernel.t, [ `Msg of string ]) result) *
  (unit -> Vmm_commands.res)

let restore_unikernels () =
  match Vmm_unix.restore () with
  | Error `NoFile ->
    Logs.warn (fun m -> m "no state dump found, starting with no unikernels") ;
    Ok Vmm_trie.empty
  | Error (`Msg msg) -> Error (`Msg ("while reading state: " ^ msg))
  | Ok data ->
    match Vmm_asn.unikernels_of_cstruct data with
    | Error (`Msg msg) -> Error (`Msg ("couldn't parse state: " ^ msg))
    | Ok unikernels ->
      Logs.info (fun m -> m "restored %d unikernels" (List.length (Vmm_trie.all unikernels))) ;
      Ok unikernels

let setup_stats t name vm =
  let stat_out =
    let name = match Vmm_unix.vm_device vm with
      | Error _ -> ""
      | Ok name -> name
    and ifs = Unikernel.(List.combine (List.map (fun (x,_,_) -> x) vm.config.bridges) vm.taps)
    in
    `Stats_add (name, vm.Unikernel.pid, ifs)
  in
  let header = Vmm_commands.header ~sequence:t.stats_counter name in
  let t = { t with stats_counter = Int64.succ t.stats_counter } in
  t, (header, `Command (`Stats_cmd stat_out))

let remove_stats t name =
  let header = Vmm_commands.header ~sequence:t.stats_counter name in
  let t = { t with stats_counter = Int64.succ t.stats_counter } in
  (t, (header, `Command (`Stats_cmd `Stats_remove)))

let handle_create t name vm_config =
  let* () =
    match Vmm_resources.find_vm t.resources name with
    | Some _ -> Error (`Msg "VM with same name is already running")
    | None -> Ok ()
  in
  Logs.debug (fun m -> m "now checking resource policies") ;
  let* () = Vmm_resources.check_vm t.resources name vm_config in
  (* prepare VM: save VM image to disk, create fifo, ... *)
  let* taps, digest = Vmm_unix.prepare name vm_config in
  let pp_tap ppf (a, b, mac) =
    Fmt.pf ppf "%s -> %s%a" a b Fmt.(option ((any "@") ++ Macaddr.pp)) mac
  in
  Logs.debug (fun m -> m "prepared vm with taps %a"
                 Fmt.(list ~sep:(any ",@ ") pp_tap) taps) ;
  let cons_out =
    let header = Vmm_commands.header ~sequence:t.console_counter name in
    (header, `Command (`Console_cmd `Console_add))
  in
  let success t =
    (* actually execute the vm:
       - check for safety that executing it would not exceed any resources
       - execute it
       - update resources
       --> if either the first or second fails, then the fail continuation
           below needs to be called *)
    let* () = Vmm_resources.check_vm t.resources name vm_config in
    let block_devices =
      List.map (fun (n, device, sector_size) ->
          n, Name.block_name name (Option.value ~default:n device), sector_size)
        vm_config.Unikernel.block_devices
    in
    let* vm = Vmm_unix.exec name vm_config taps block_devices digest in
    Logs.debug (fun m -> m "exec()ed vm") ;
    let resources = Vmm_resources.insert_vm t.resources name vm in
    let t = { t with resources } in
    dump_unikernels t ;
    Logs.info (fun m -> m "created %a: %a" Name.pp name Unikernel.pp vm);
    let t, stat_out = setup_stats t name vm in
    Ok (t, stat_out, `Success (`String "created VM"), name, vm)
  and fail () =
    match Vmm_unix.free_system_resources name (List.map (fun (_,tap,_) -> tap) taps) with
    | Ok () -> `Failure "could not create VM: console failed"
    | Error (`Msg msg) ->
      let m = "could not create VM: console failed, and also " ^ msg ^ " while cleaning resources" in
      `Failure m
  in
  Ok ({ t with console_counter = Int64.succ t.console_counter },
      (cons_out, success, fail))

let handle_shutdown t name vm r =
  (match Vmm_unix.free_system_resources name vm.Unikernel.taps with
   | Ok () -> ()
   | Error (`Msg e) ->
     Logs.err (fun m -> m "%s while shutdown vm %a" e Unikernel.pp vm));
  Logs.info (fun m -> m "unikernel %a (PID %d) stopped with %a"
                Name.pp name vm.Unikernel.pid pp_process_exit r);
  let t, stat_out = remove_stats t name in
  (t, stat_out)

let handle_policy_cmd t id =
  let path = Name.path id in
  (match Name.name id with
   | None -> ()
   | Some x ->
     Logs.warn (fun m -> m "policy command with non-empty name part %S in %a"
                   x Name.pp id));
  function
  | `Policy_remove ->
    Logs.debug (fun m -> m "remove policy %a" Name.pp id) ;
    let* resources = Vmm_resources.remove_policy t.resources path in
    Ok ({ t with resources }, `End (`Success (`String "removed policy")))
  | `Policy_add policy ->
    Logs.debug (fun m -> m "insert policy %a" Name.pp id) ;
    let same_policy = match Vmm_resources.find_policy t.resources path with
      | None -> false
      | Some p' -> Policy.equal policy p'
    in
    if same_policy then
      Ok (t, `Loop (`Success (`String "no modification of policy")))
    else
      let* resources = Vmm_resources.insert_policy t.resources path policy in
      Ok ({ t with resources }, `Loop (`Success (`String "added policy")))
  | `Policy_info ->
    Logs.debug (fun m -> m "policy %a" Name.pp id) ;
    let policies =
      Vmm_trie.fold path t.resources.Vmm_resources.policies
        (fun prefix policy policies-> (prefix, policy) :: policies)
        []
    in
    Ok (t, `End (`Success (`Policies policies)))

let handle_unikernel_cmd t id = function
  | `Old_unikernel_info1 ->
    Logs.debug (fun m -> m "old info1 %a" Name.pp id) ;
    let empty_image vm = { vm.Unikernel.config with image = Cstruct.empty } in
    let vms =
      match Name.name id with
      | None ->
        Vmm_trie.fold (Name.path id) t.resources.Vmm_resources.unikernels
          (fun id vm vms -> (id, empty_image vm) :: vms) []
      | Some _ ->
        Option.fold ~none:[] ~some:(fun vm -> [ id, empty_image vm ])
          (Vmm_trie.find id t.resources.Vmm_resources.unikernels)
    in
    Ok (t, `End (`Success (`Old_unikernels vms)))
  | `Old_unikernel_get ->
    Logs.debug (fun m -> m "old get %a" Name.pp id) ;
    begin match Vmm_trie.find id t.resources.Vmm_resources.unikernels with
      | None -> Error (`Msg "get: no unikernel found")
      | Some u ->
        Ok (t, `End (`Success (`Old_unikernels [ (id, u.Unikernel.config) ])))
    end
  | `Old_unikernel_info2 ->
    Logs.debug (fun m -> m "old info2 %a" Name.pp id) ;
    let infos =
      match Name.name id with
      | None ->
        Vmm_trie.fold (Name.path id) t.resources.Vmm_resources.unikernels
          (fun id vm vms -> (id, Unikernel.info vm) :: vms) []
      | Some _ ->
        Option.fold ~none:[] ~some:(fun vm -> [ id, Unikernel.info vm ])
          (Vmm_trie.find id t.resources.Vmm_resources.unikernels)
    in
    Ok (t, `End (`Success (`Old_unikernel_info infos)))
  | `Unikernel_info ->
    Logs.debug (fun m -> m "info %a" Name.pp id) ;
    let infos =
      match Name.name id with
      | None ->
        Vmm_trie.fold (Name.path id) t.resources.Vmm_resources.unikernels
          (fun id vm vms -> (id, Unikernel.info vm) :: vms) []
      | Some _ ->
        Option.fold ~none:[] ~some:(fun vm -> [ id, Unikernel.info vm ])
          (Vmm_trie.find id t.resources.Vmm_resources.unikernels)
    in
    Ok (t, `End (`Success (`Unikernel_info infos)))
  | `Unikernel_get compress_level ->
    Logs.debug (fun m -> m "get %a" Name.pp id) ;
    begin match Vmm_trie.find id t.resources.Vmm_resources.unikernels with
      | None -> Error (`Msg "get: no unikernel found")
      | Some u ->
        let cfg = u.Unikernel.config in
        let img = cfg.Unikernel.image in
        let* compress, img =
          if cfg.Unikernel.compressed then
            if compress_level > 0 then
              Ok (true, img)
            else
              let* blob = Vmm_compress.uncompress_cs img in
              Ok (false, blob)
          else
          if compress_level = 0 then
            Ok (false, img)
          else
            Ok (true, Vmm_compress.compress_cs compress_level img)
        in
        let r = `Unikernel_image (compress, img) in
        Ok (t, `End (`Success r))
    end
  | `Unikernel_create vm_config -> Ok (t, `Create (id, vm_config))
  | `Unikernel_force_create vm_config ->
    begin
      let resources =
        match Vmm_resources.remove_vm t.resources id with
        | Error _ -> t.resources | Ok r -> r
      in
      let* () = Vmm_resources.check_vm resources id vm_config in
      match Vmm_resources.find_vm t.resources id with
      | None ->
        ignore (stop_create t id);
        Ok (t, `Create (id, vm_config))
      | Some vm ->
        (match Vmm_unix.destroy vm with
         | exception Unix.Unix_error _ -> ()
         | () -> ());
        Ok (t, `Wait_and_create (id, (id, vm_config)))
    end
  | `Unikernel_restart ->
    begin
      match Vmm_resources.find_vm t.resources id with
      | None -> stop_create t id
      | Some vm ->
        Ok (t, `Wait_and_create (id, (id, vm.Unikernel.config)))
    end
  | `Unikernel_destroy ->
    match Vmm_resources.find_vm t.resources id with
    | None -> stop_create t id
    | Some vm ->
      let answer =
        try
          Vmm_unix.destroy vm ; "destroyed unikernel"
        with
          Unix.Unix_error _ -> "kill failed"
      in
      let s ex =
        let data = Fmt.str "%a %s %a" Name.pp id answer pp_process_exit ex in
        `Success (`String data)
      in
      Ok (t, `Wait (id, s))

let handle_block_cmd t id = function
  | `Block_remove ->
    Logs.debug (fun m -> m "removing block %a" Name.pp id) ;
    begin match Vmm_resources.find_block t.resources id with
      | None -> Error (`Msg "remove block: not found")
      | Some (_, true) -> Error (`Msg "remove block: is in use")
      | Some (_, false) ->
        let* () = Vmm_unix.destroy_block id in
        let* resources = Vmm_resources.remove_block t.resources id in
        Ok ({ t with resources }, `End (`Success (`String "removed block")))
    end
  | `Block_add (size, compressed, data) ->
    begin
      Logs.debug (fun m -> m "insert block %a: %dMB (data: %a)"
                     Name.pp id size
                     Fmt.(option ~none:(any "none provided") int)
                     (Option.map Cstruct.length data));
      match Vmm_resources.find_block t.resources id with
      | Some _ -> Error (`Msg "block device with same name already exists")
      | None ->
        let* () = Vmm_resources.check_block t.resources id size in
        let* data =
          match data with
          | None -> Ok None
          | Some img ->
            let* img =
              if compressed then
                Vmm_compress.uncompress_cs img
              else
                Ok img
            in
            let* size_in_bytes = Vmm_unix.bytes_of_mb size in
            if size_in_bytes >= Cstruct.length img then
              Ok (Some img)
            else
              Error (`Msg "data exceeds block size")
        in
        let* () = Vmm_unix.create_block ?data id size in
        let* resources = Vmm_resources.insert_block t.resources id size in
        Ok ({ t with resources }, `End (`Success (`String "added block device")))
    end
  | `Block_set (compressed, data) ->
    begin match Vmm_resources.find_block t.resources id with
      | None -> Error (`Msg "set block: not found")
      | Some (_, true) -> Error (`Msg "set block: is in use")
      | Some (size, false) ->
        let* data =
          if compressed then
            Vmm_compress.uncompress_cs data
          else
            Ok data
        in
        let* size_in_bytes = Vmm_unix.bytes_of_mb size in
        let* () =
          if size_in_bytes >= Cstruct.length data then
            Ok ()
          else
            Error (`Msg "data exceeds block size")
        in
        let* () = Vmm_unix.destroy_block id in
        let* () = Vmm_unix.create_block ~data id size in
        Ok (t, `End (`Success (`String "set block device")))
    end
  | `Block_dump level ->
    begin match Vmm_resources.find_block t.resources id with
      | None -> Error (`Msg "dump block: not found")
      | Some (_, true) -> Error (`Msg "dump block: is in use")
      | Some (_, false) ->
        let* data = Vmm_unix.dump_block id in
        let compress, data =
          if level = 0 then
            false, data
          else
            true, Vmm_compress.compress_cs level data
        in
        Ok (t, `End (`Success (`Block_device_image (compress, data))))
    end
  | `Block_info ->
    Logs.debug (fun m -> m "block %a" Name.pp id) ;
    let blocks =
      match Name.name id with
      | None ->
        Vmm_trie.fold (Name.path id) t.resources.Vmm_resources.block_devices
          (fun prefix (size, active) blocks -> (prefix, size, active) :: blocks)
          []
      | Some _ ->
        Option.fold ~none:[] ~some:(fun (size, active) -> [ id, size, active ])
          (Vmm_trie.find id t.resources.Vmm_resources.block_devices)
    in
    Ok (t, `End (`Success (`Block_devices blocks)))

let handle_stats_initial t stats_counter =
  let t = { t with stats_counter = Int64.succ stats_counter } in
  let t, data =
    let unikernels = Vmm_trie.all t.resources.Vmm_resources.unikernels in
    List.fold_left (fun (t, acc) (name, vm) ->
        let t, out = setup_stats t name vm in
        (t, out :: acc))
      (t, []) unikernels
  in
  Ok (t, `Replace_stats (`Success `Empty, data))

let handle_command t (header, payload) =
  let msg_to_err = function
    | Ok x -> Ok x
    | Error (`Msg msg) ->
      Logs.err (fun m -> m "error while processing command: %s" msg) ;
      Error (`Failure msg)
  and id = header.Vmm_commands.name
  in
  msg_to_err (
    match payload with
    | `Command (`Policy_cmd pc) -> handle_policy_cmd t id pc
    | `Command (`Unikernel_cmd vc) -> handle_unikernel_cmd t id vc
    | `Command (`Block_cmd bc) -> handle_block_cmd t id bc
    | `Command (`Stats_cmd `Stats_initial) ->
      handle_stats_initial t header.Vmm_commands.sequence
    | _ ->
      Logs.err (fun m -> m "ignoring %a"
                   (Vmm_commands.pp_wire ~verbose:false) (header, payload)) ;
      Error (`Msg "unknown command"))
OCaml

Innovation. Community. Security.