ligo/src/lib_shell/worker.ml

431 lines
15 KiB
OCaml
Raw Normal View History

2018-01-22 18:25:48 +04:00
(**************************************************************************)
(* *)
2018-02-06 00:17:03 +04:00
(* Copyright (c) 2014 - 2018. *)
2018-01-22 18:25:48 +04:00
(* Dynamic Ledger Solutions, Inc. <contact@tezos.com> *)
(* *)
(* All rights reserved. No warranty, explicit or implicit, provided. *)
(* *)
(**************************************************************************)
module type NAME = sig
val base : string list
type t
val encoding : t Data_encoding.t
val pp : Format.formatter -> t -> unit
end
module type EVENT = sig
type t
val level : t -> Logging.level
2018-01-25 14:32:51 +04:00
val encoding : t Data_encoding.t
2018-01-22 18:25:48 +04:00
val pp : Format.formatter -> t -> unit
end
module type REQUEST = sig
type 'a t
type view
val view : 'a t -> view
val encoding : view Data_encoding.t
val pp : Format.formatter -> view -> unit
end
module type TYPES = sig
type state
type parameters
type view
val view : state -> parameters -> view
val encoding : view Data_encoding.t
val pp : Format.formatter -> view -> unit
end
module Make
(Name : NAME)
(Event : EVENT)
(Request : REQUEST)
(Types : TYPES) = struct
let base_name = String.concat "." Name.base
type message = Message: 'a Request.t * 'a tzresult Lwt.u option -> message
type 'a queue and bounded and infinite
type dropbox
type _ buffer_kind =
| Queue : infinite queue buffer_kind
| Bounded : { size : int } -> bounded queue buffer_kind
| Dropbox :
{ merge : (dropbox t ->
any_request ->
any_request option ->
any_request option) }
-> dropbox buffer_kind
and any_request = Any_request : _ Request.t -> any_request
and _ buffer =
| Queue_buffer : (Time.t * message) Lwt_pipe.t -> infinite queue buffer
| Bounded_buffer : (Time.t * message) Lwt_pipe.t -> bounded queue buffer
| Dropbox_buffer : (Time.t * message) Lwt_dropbox.t -> dropbox buffer
and 'kind t = {
limits : Worker_types.limits ;
2018-01-22 18:25:48 +04:00
timeout : float option ;
parameters : Types.parameters ;
mutable (* only for init *) worker : unit Lwt.t ;
mutable (* only for init *) state : Types.state option ;
buffer : 'kind buffer ;
event_log : (Logging.level * Event.t Ring.t) list ;
2018-02-26 17:11:10 +04:00
logger : (module Logging.LOG) ;
2018-01-22 18:25:48 +04:00
canceler : Lwt_canceler.t ;
name : Name.t ;
id : int ;
mutable status : Worker_types.worker_status ;
2018-01-22 18:25:48 +04:00
mutable current_request : (Time.t * Time.t * Request.view) option ;
table : 'kind table ;
}
and 'kind table = {
buffer_kind : 'kind buffer_kind ;
mutable last_id : int ;
instances : (Name.t, 'kind t) Hashtbl.t ;
zombies : (int, 'kind t) Hashtbl.t
}
type error += Closed of Name.t
let () =
register_error_kind `Permanent
~id:("worker." ^ base_name ^ ".closed")
~title:("Worker " ^ base_name ^ " closed")
~description:
("An operation on a " ^ base_name ^
" worker could not complete \
before it was shut down.")
~pp: (fun ppf name ->
Format.fprintf ppf
"Worker %s[%a] has been shut down."
base_name Name.pp name)
Data_encoding.(obj1 (req "worker_id" Name.encoding))
2018-02-16 04:26:24 +04:00
(function Closed chain_id -> Some chain_id | _ -> None)
(fun chain_id -> Closed chain_id)
2018-01-22 18:25:48 +04:00
let queue_item ?u r =
Time.now (),
Message (r, u)
let drop_request (w : dropbox t) request =
let Dropbox { merge } = w.table.buffer_kind in
let Dropbox_buffer message_box = w.buffer in
try
match
match Lwt_dropbox.peek message_box with
| None ->
merge w (Any_request request) None
| Some (_, Message (old, _)) ->
Lwt.ignore_result (Lwt_dropbox.take message_box) ;
merge w (Any_request request) (Some (Any_request old))
with
| None -> ()
| Some (Any_request neu) ->
Lwt_dropbox.put message_box (Time.now (), Message (neu, None))
with Lwt_dropbox.Closed -> ()
let push_request (type a) (w : a queue t) request =
match w.buffer with
| Queue_buffer message_queue ->
Lwt_pipe.push message_queue (queue_item request)
| Bounded_buffer message_queue ->
Lwt_pipe.push message_queue (queue_item request)
let push_request_now (w : infinite queue t) request =
let Queue_buffer message_queue = w.buffer in
Lwt_pipe.push_now_exn message_queue (queue_item request)
let try_push_request_now (w : bounded queue t) request =
let Bounded_buffer message_queue = w.buffer in
Lwt_pipe.push_now message_queue (queue_item request)
let push_request_and_wait (type a) (w : a queue t) request =
let message_queue = match w.buffer with
| Queue_buffer message_queue -> message_queue
| Bounded_buffer message_queue -> message_queue in
let t, u = Lwt.wait () in
Lwt.catch
(fun () ->
Lwt_pipe.push message_queue (queue_item ~u request) >>= fun () ->
t)
(function
| Lwt_pipe.Closed -> fail (Closed w.name)
| exn -> fail (Exn exn))
let close (type a) (w : a t) =
let wakeup = function
| _, Message (_, Some u) ->
Lwt.wakeup_later u (Error [ Closed w.name ])
| _ -> () in
let close_queue message_queue =
let messages = Lwt_pipe.pop_all_now message_queue in
List.iter wakeup messages ;
Lwt_pipe.close message_queue in
match w.buffer with
| Queue_buffer message_queue -> close_queue message_queue
| Bounded_buffer message_queue -> close_queue message_queue
| Dropbox_buffer message_box ->
Option.iter ~f:wakeup (Lwt_dropbox.peek message_box) ;
Lwt_dropbox.close message_box
let pop (type a) (w : a t) =
let pop_queue message_queue =
match w.timeout with
| None ->
Lwt_pipe.pop message_queue >>= fun m ->
return (Some m)
| Some timeout ->
Lwt_pipe.pop_with_timeout
(Lwt_unix.sleep timeout) message_queue >>= fun m ->
2018-01-22 18:25:48 +04:00
return m in
match w.buffer with
| Queue_buffer message_queue -> pop_queue message_queue
| Bounded_buffer message_queue -> pop_queue message_queue
| Dropbox_buffer message_box ->
match w.timeout with
| None ->
Lwt_dropbox.take message_box >>= fun m ->
return (Some m)
| Some timeout ->
Lwt_dropbox.take_with_timeout
(Lwt_unix.sleep timeout) message_box >>= fun m ->
2018-01-22 18:25:48 +04:00
return m
let trigger_shutdown w =
Lwt.ignore_result (Lwt_canceler.cancel w.canceler)
let canceler { canceler } = canceler
let log_event w evt =
2018-02-26 17:11:10 +04:00
let (module Logger) = w.logger in
2018-01-22 18:25:48 +04:00
let level = Event.level evt in
let log =
match level with
| Debug -> Logger.lwt_debug
| Info -> Logger.lwt_log_info
| Notice -> Logger.lwt_log_notice
| Warning -> Logger.lwt_warn
| Error -> Logger.lwt_log_error
| Fatal -> Logger.lwt_fatal_error in
2018-02-26 17:11:10 +04:00
log "@[<v 0>%a@]" Event.pp evt >>= fun () ->
if level >= w.limits.backlog_level then
Ring.add (List.assoc level w.event_log) evt ;
2018-01-22 18:25:48 +04:00
Lwt.return_unit
let record_event w evt =
Lwt.ignore_result (log_event w evt)
module type HANDLERS = sig
type self
val on_launch :
self -> Name.t -> Types.parameters -> Types.state Lwt.t
val on_request :
self -> 'a Request.t -> 'a tzresult Lwt.t
val on_no_request :
self -> unit tzresult Lwt.t
val on_close :
self -> unit Lwt.t
val on_error :
self -> Request.view -> Worker_types.request_status -> error list -> unit tzresult Lwt.t
2018-01-22 18:25:48 +04:00
val on_completion :
self -> 'a Request.t -> 'a -> Worker_types.request_status -> unit Lwt.t
2018-01-22 18:25:48 +04:00
end
let create_table buffer_kind =
{ buffer_kind ;
last_id = 0 ;
instances = Hashtbl.create 10 ;
zombies = Hashtbl.create 10 }
let worker_loop (type kind) handlers (w : kind t) =
let (module Handlers : HANDLERS with type self = kind t) = handlers in
2018-02-26 17:11:10 +04:00
let (module Logger) = w.logger in
2018-01-22 18:25:48 +04:00
let do_close errs =
let t0 = match w.status with
| Running t0 -> t0
| _ -> assert false in
w.status <- Closing (t0, Time.now ()) ;
close w ;
Lwt_canceler.cancel w.canceler >>= fun () ->
w.status <- Closed (t0, Time.now (), errs) ;
Hashtbl.remove w.table.instances w.name ;
2018-02-26 17:11:10 +04:00
Handlers.on_close w >>= fun () ->
w.state <- None ;
2018-01-22 18:25:48 +04:00
Hashtbl.add w.table.zombies w.id w ;
Lwt.ignore_result
(Lwt_unix.sleep w.limits.zombie_memory >>= fun () ->
List.iter (fun (_, ring) -> Ring.clear ring) w.event_log ;
Lwt_unix.sleep (w.limits.zombie_lifetime -. w.limits.zombie_memory) >>= fun () ->
Hashtbl.remove w.table.zombies w.id ;
Lwt.return ()) ;
Lwt.return_unit in
let rec loop () =
begin
protect ~canceler:w.canceler begin fun () ->
2018-01-22 18:25:48 +04:00
pop w
end >>=? function
| None -> Handlers.on_no_request w
| Some (pushed, Message (request, u)) ->
let current_request = Request.view request in
let treated = Time.now () in
w.current_request <- Some (pushed, treated, current_request) ;
2018-02-26 17:11:10 +04:00
Logger.debug "@[<v 2>Request:@,%a@]"
2018-01-22 18:25:48 +04:00
Request.pp current_request ;
match u with
| None ->
Handlers.on_request w request >>=? fun res ->
let completed = Time.now () in
w.current_request <- None ;
Handlers.on_completion w
request res Worker_types.{ pushed ; treated ; completed } >>= fun () ->
2018-01-22 18:25:48 +04:00
return ()
| Some u ->
Handlers.on_request w request >>= fun res ->
Lwt.wakeup_later u res ;
Lwt.return res >>=? fun res ->
let completed = Time.now () in
w.current_request <- None ;
Handlers.on_completion w
request res Worker_types.{ pushed ; treated ; completed } >>= fun () ->
2018-01-22 18:25:48 +04:00
return ()
end >>= function
| Ok () ->
loop ()
| Error [Canceled | Exn Lwt_pipe.Closed | Exn Lwt_dropbox.Closed ] ->
2018-02-26 17:11:10 +04:00
Logger.lwt_log_notice "Worker terminated" >>= fun () ->
2018-01-22 18:25:48 +04:00
do_close None
| Error errs ->
begin match w.current_request with
| Some (pushed, treated, request) ->
let completed = Time.now () in
w.current_request <- None ;
Handlers.on_error w
request Worker_types.{ pushed ; treated ; completed } errs
2018-01-22 18:25:48 +04:00
| None -> assert false
end >>= function
| Ok () ->
loop ()
| Error errs ->
Logger.lwt_log_error
2018-02-26 17:11:10 +04:00
"@[<v 0>Worker crashed:@,%a@]"
(Format.pp_print_list Error_monad.pp) errs >>= fun () ->
2018-01-22 18:25:48 +04:00
do_close (Some errs) in
loop ()
let launch
: type kind.
kind table -> ?timeout:float ->
Worker_types.limits -> Name.t -> Types.parameters ->
2018-01-22 18:25:48 +04:00
(module HANDLERS with type self = kind t) ->
kind t Lwt.t
= fun table ?timeout limits name parameters (module Handlers) ->
2018-02-26 17:11:10 +04:00
let name_s =
Format.asprintf "%a" Name.pp name in
let full_name =
if name_s = "" then base_name else Format.asprintf "%s(%s)" base_name name_s in
let id =
table.last_id <- table.last_id + 1 ;
table.last_id in
let id_name =
if name_s = "" then base_name else Format.asprintf "%s(%d)" base_name id in
2018-01-22 18:25:48 +04:00
if Hashtbl.mem table.instances name then
2018-02-26 17:11:10 +04:00
invalid_arg (Format.asprintf "Lwt_worker.launch: duplicate worker %s" full_name) ;
2018-01-22 18:25:48 +04:00
let canceler = Lwt_canceler.create () in
let buffer : kind buffer =
match table.buffer_kind with
| Queue ->
Queue_buffer (Lwt_pipe.create ())
| Bounded { size } ->
Bounded_buffer (Lwt_pipe.create ~size:(size, (fun _ -> 1)) ())
| Dropbox _ ->
Dropbox_buffer (Lwt_dropbox.create ()) in
let event_log =
let levels =
[ Logging.Debug ; Info ; Notice ; Warning ; Error ; Fatal ] in
List.map (fun l -> l, Ring.create limits.backlog_size) levels in
2018-02-26 17:11:10 +04:00
let module Logger = Logging.Make(struct let name = id_name end) in
2018-01-22 18:25:48 +04:00
let w = { limits ; parameters ; name ; canceler ;
2018-02-26 17:11:10 +04:00
table ; buffer ; logger = (module Logger) ;
state = None ; id ;
2018-01-22 18:25:48 +04:00
worker = Lwt.return_unit ;
event_log ; timeout ;
current_request = None ;
status = Launching (Time.now ())} in
2018-02-26 17:11:10 +04:00
begin
if id_name = base_name then
Logger.lwt_log_notice "Worker started"
else
Logger.lwt_log_notice "Worker started for %s" name_s
end >>= fun () ->
2018-01-22 18:25:48 +04:00
Hashtbl.add table.instances name w ;
Handlers.on_launch w name parameters >>= fun state ->
w.status <- Running (Time.now ()) ;
w.state <- Some state ;
w.worker <-
Lwt_utils.worker
2018-02-26 17:11:10 +04:00
full_name
2018-01-22 18:25:48 +04:00
~run:(fun () -> worker_loop (module Handlers) w)
~cancel:(fun () -> Lwt_canceler.cancel w.canceler) ;
Lwt.return w
let shutdown w =
2018-02-26 17:11:10 +04:00
let (module Logger) = w.logger in
Logger.lwt_debug "Triggering shutdown" >>= fun () ->
2018-01-22 18:25:48 +04:00
Lwt_canceler.cancel w.canceler >>= fun () ->
w.worker
let state w =
2018-02-26 17:11:10 +04:00
match w.state, w.status with
| None, Launching _ ->
2018-01-22 18:25:48 +04:00
invalid_arg
2018-02-26 17:11:10 +04:00
(Format.asprintf
"Lwt_worker.state (%s[%a]): \
state called before worker was initialized"
base_name Name.pp w.name)
| None, (Closing _ | Closed _) ->
invalid_arg
(Format.asprintf
"Lwt_worker.state (%s[%a]): \
state called after worker was terminated"
base_name Name.pp w.name)
| None, _ -> assert false
| Some state, _ -> state
2018-01-22 18:25:48 +04:00
let last_events w =
List.map
(fun (level, ring) -> (level, Ring.elements ring))
w.event_log
let pending_requests (type a) (w : a queue t) =
let message_queue = match w.buffer with
| Queue_buffer message_queue -> message_queue
| Bounded_buffer message_queue -> message_queue in
List.map
(function (t, Message (req, _)) -> t, Request.view req)
(Lwt_pipe.peek_all message_queue)
let status { status } = status
let current_request { current_request } = current_request
let view w =
Types.view (state w) w.parameters
let list { instances } =
Hashtbl.fold
(fun n w acc -> (n, w) :: acc)
instances []
let protect { canceler } ?on_error f =
protect ?on_error ~canceler f
2018-01-22 18:25:48 +04:00
end