ligo/src/lib_shell/prevalidator.ml

583 lines
21 KiB
OCaml
Raw Normal View History

2016-09-08 21:13:10 +04:00
(**************************************************************************)
(* *)
2018-02-06 00:17:03 +04:00
(* Copyright (c) 2014 - 2018. *)
2016-09-08 21:13:10 +04:00
(* Dynamic Ledger Solutions, Inc. <contact@tezos.com> *)
(* *)
(* All rights reserved. No warranty, explicit or implicit, provided. *)
(* *)
(**************************************************************************)
open Prevalidator_worker_state
type limits = {
max_refused_operations : int ;
operation_timeout : float ;
worker_limits : Worker_types.limits ;
}
module Name = struct
2018-02-16 04:26:24 +04:00
type t = Chain_id.t
let encoding = Chain_id.encoding
let base = [ "prevalidator" ]
2018-02-16 04:26:24 +04:00
let pp = Chain_id.pp_short
end
module Types = struct
(* Invariants:
- an operation is in only one of these sets (map domains):
pv.refusals pv.pending pv.fetching pv.live_operations pv.in_mempool
- pv.in_mempool is the domain of all fields of pv.prevalidation_result
- pv.prevalidation_result.refused = Ø, refused ops are in pv.refused
- the 'applied' operations in pv.validation_result are in reverse order. *)
type state = {
2018-02-16 04:26:24 +04:00
chain_db : Distributed_db.chain_db ;
limits : limits ;
mutable predecessor : State.Block.t ;
mutable timestamp : Time.t ;
mutable live_blocks : Block_hash.Set.t ; (* just a cache *)
mutable live_operations : Operation_hash.Set.t ; (* just a cache *)
refused : Operation_hash.t Ring.t ;
mutable refusals : error list Operation_hash.Map.t ;
mutable fetching : Operation_hash.Set.t ;
mutable pending : Operation.t Operation_hash.Map.t ;
mutable mempool : Mempool.t ;
mutable in_mempool : Operation_hash.Set.t ;
mutable validation_result : error Preapply_result.t ;
mutable validation_state : Prevalidation.prevalidation_state tzresult ;
mutable advertisement : [ `Pending of Mempool.t | `None ] ;
mutable rpc_directory : state RPC_directory.t tzresult Lwt.t lazy_t ;
}
2018-02-16 04:26:24 +04:00
type parameters = limits * Distributed_db.chain_db
include Worker_state
let view (state : state) _ : view =
let domain map =
Operation_hash.Map.fold
(fun elt _ acc -> Operation_hash.Set.add elt acc)
map Operation_hash.Set.empty in
{ head = State.Block.hash state.predecessor ;
timestamp = state.timestamp ;
fetching = state.fetching ;
pending = domain state.pending ;
applied =
List.rev
(List.map (fun (h, _) -> h)
state.validation_result.applied) ;
delayed =
Operation_hash.Set.union
(domain state.validation_result.branch_delayed)
(domain state.validation_result.branch_refused) }
end
module Worker = Worker.Make (Name) (Event) (Request) (Types)
open Types
type t = Worker.infinite Worker.queue Worker.t
type error += Closed = Worker.Closed
let debug w =
Format.kasprintf (fun msg -> Worker.record_event w (Debug msg))
2016-09-08 21:13:10 +04:00
let empty_rpc_directory : unit RPC_directory.t =
RPC_directory.register
RPC_directory.empty
(Block_services.Empty.S.Mempool.pending_operations RPC_path.open_root)
(fun _pv () () ->
return {
Block_services.Empty.Mempool.applied = [] ;
refused = Operation_hash.Map.empty ;
branch_refused = Operation_hash.Map.empty ;
branch_delayed = Operation_hash.Map.empty ;
unprocessed = Operation_hash.Map.empty ;
})
let rpc_directory protocol =
begin
match Registered_protocol.get protocol with
| None ->
(* FIXME. *)
(* This should not happen: it should be handled in the validator. *)
failwith "Prevalidation: missing protocol '%a' for the current block."
Protocol_hash.pp_short protocol
| Some protocol ->
return protocol
end >>=? fun (module Proto) ->
let module Proto_services = Block_services.Make(Proto)(Proto) in
return @@
RPC_directory.register
RPC_directory.empty
(Proto_services.S.Mempool.pending_operations RPC_path.open_root)
(fun pv () () ->
let map_op op =
let protocol_data =
Data_encoding.Binary.of_bytes_exn
Proto.operation_data_encoding
op.Operation.proto in
{ Proto.shell = op.shell ; protocol_data } in
let map_op_error (op, error) = (map_op op, error) in
return {
Proto_services.Mempool.applied =
List.map
(fun (hash, op) -> (hash, map_op op))
(List.rev pv.validation_result.applied) ;
refused =
Operation_hash.Map.map map_op_error pv.validation_result.refused ;
branch_refused =
Operation_hash.Map.map map_op_error pv.validation_result.branch_refused ;
branch_delayed =
Operation_hash.Map.map map_op_error pv.validation_result.branch_delayed ;
unprocessed =
Operation_hash.Map.map map_op pv.pending ;
})
2018-02-16 04:26:24 +04:00
let list_pendings ?maintain_chain_db ~from_block ~to_block old_mempool =
let rec pop_blocks ancestor block mempool =
let hash = State.Block.hash block in
if Block_hash.equal hash ancestor then
Lwt.return mempool
else
State.Block.all_operations block >>= fun operations ->
Lwt_list.fold_left_s
(Lwt_list.fold_left_s (fun mempool op ->
let h = Operation.hash op in
2018-02-16 04:26:24 +04:00
Lwt_utils.may maintain_chain_db
~f:begin fun chain_db ->
Distributed_db.inject_operation chain_db h op >>= fun _ ->
Lwt.return_unit
end >>= fun () ->
Lwt.return (Operation_hash.Map.add h op mempool)))
mempool operations >>= fun mempool ->
State.Block.predecessor block >>= function
| None -> assert false
| Some predecessor -> pop_blocks ancestor predecessor mempool
in
let push_block mempool block =
State.Block.all_operation_hashes block >|= fun operations ->
2018-02-16 04:26:24 +04:00
Option.iter maintain_chain_db
~f:(fun chain_db ->
List.iter
2018-02-16 04:26:24 +04:00
(List.iter (Distributed_db.Operation.clear_or_cancel chain_db))
operations) ;
List.fold_left
(List.fold_left (fun mempool h -> Operation_hash.Map.remove h mempool))
mempool operations
in
Chain_traversal.new_blocks ~from_block ~to_block >>= fun (ancestor, path) ->
pop_blocks
(State.Block.hash ancestor)
from_block old_mempool >>= fun mempool ->
Lwt_list.fold_left_s push_block mempool path >>= fun new_mempool ->
Chain_traversal.live_blocks
to_block
(State.Block.max_operations_ttl to_block)
>>= fun (live_blocks, live_operations) ->
let new_mempool, outdated =
Operation_hash.Map.partition
(fun _oph op ->
Block_hash.Set.mem op.Operation.shell.branch live_blocks)
new_mempool in
Option.iter maintain_chain_db
~f:(fun chain_db ->
Operation_hash.Map.iter
(fun oph _op -> Distributed_db.Operation.clear_or_cancel chain_db oph)
outdated) ;
Lwt.return (new_mempool, live_blocks, live_operations)
2017-11-17 20:17:48 +04:00
let already_handled pv oph =
Operation_hash.Map.mem oph pv.refusals
2017-11-17 20:17:48 +04:00
|| Operation_hash.Map.mem oph pv.pending
|| Operation_hash.Set.mem oph pv.fetching
|| Operation_hash.Set.mem oph pv.live_operations
|| Operation_hash.Set.mem oph pv.in_mempool
2016-09-08 21:13:10 +04:00
2017-11-17 20:17:48 +04:00
let mempool_of_prevalidation_result (r : error Preapply_result.t) : Mempool.t =
{ Mempool.known_valid = List.map fst r.applied ;
2017-11-17 20:17:48 +04:00
pending =
Operation_hash.Map.fold
(fun k _ s -> Operation_hash.Set.add k s)
r.branch_delayed @@
Operation_hash.Map.fold
(fun k _ s -> Operation_hash.Set.add k s)
r.branch_refused @@
Operation_hash.Set.empty }
2017-11-17 20:17:48 +04:00
let merge_validation_results ~old ~neu =
let open Preapply_result in
let merge _key a b =
match a, b with
| None, None -> None
| Some x, None -> Some x
| _, Some y -> Some y in
let filter_out s m =
List.fold_right (fun (h, _op) -> Operation_hash.Map.remove h) s m in
{ applied = List.rev_append neu.applied old.applied ;
refused = Operation_hash.Map.empty ;
branch_refused =
Operation_hash.Map.merge merge
(* filtering should not be required if the protocol is sound *)
(filter_out neu.applied old.branch_refused)
neu.branch_refused ;
branch_delayed =
Operation_hash.Map.merge merge
(filter_out neu.applied old.branch_delayed)
neu.branch_delayed }
2016-09-08 21:13:10 +04:00
let advertise (w : t) pv mempool =
match pv.advertisement with
| `Pending { Mempool.known_valid ; pending } ->
pv.advertisement <-
`Pending
{ known_valid = known_valid @ mempool.Mempool.known_valid ;
pending = Operation_hash.Set.union pending mempool.pending }
| `None ->
pv.advertisement <- `Pending mempool ;
Lwt.async (fun () ->
Lwt_unix.sleep 0.01 >>= fun () ->
Worker.push_request_now w Advertise ;
Lwt.return_unit)
let handle_unprocessed w pv =
2017-11-17 20:17:48 +04:00
begin match pv.validation_state with
| Error err ->
pv.validation_result <-
{ Preapply_result.empty with
branch_delayed =
Operation_hash.Map.fold
(fun h op m -> Operation_hash.Map.add h (op, err) m)
pv.pending Operation_hash.Map.empty } ;
pv.pending <-
Operation_hash.Map.empty ;
2018-06-26 13:07:12 +04:00
Lwt.return_unit
2017-11-17 20:17:48 +04:00
| Ok validation_state ->
match Operation_hash.Map.cardinal pv.pending with
2018-06-26 13:07:12 +04:00
| 0 -> Lwt.return_unit
| n -> debug w "processing %d operations" n ;
Prevalidation.prevalidate validation_state ~sort:true
(Operation_hash.Map.bindings pv.pending)
>>= fun (validation_state, validation_result) ->
pv.validation_state <-
Ok validation_state ;
pv.in_mempool <-
(Operation_hash.Map.fold
(fun h _ in_mempool -> Operation_hash.Set.add h in_mempool)
pv.pending @@
Operation_hash.Map.fold
(fun h _ in_mempool -> Operation_hash.Set.remove h in_mempool)
pv.validation_result.refused @@
pv.in_mempool) ;
Operation_hash.Map.iter
(fun h (_, errs) ->
Option.iter (Ring.add_and_return_erased pv.refused h)
~f:(fun e -> pv.refusals <- Operation_hash.Map.remove e pv.refusals) ;
pv.refusals <-
Operation_hash.Map.add h errs pv.refusals)
pv.validation_result.refused ;
Operation_hash.Map.iter
2018-02-16 04:26:24 +04:00
(fun oph _ -> Distributed_db.Operation.clear_or_cancel pv.chain_db oph)
pv.validation_result.refused ;
pv.validation_result <-
merge_validation_results
~old:pv.validation_result
~neu:validation_result ;
pv.pending <-
Operation_hash.Map.empty ;
advertise w pv
(mempool_of_prevalidation_result validation_result) ;
2018-06-26 13:07:12 +04:00
Lwt.return_unit
2017-11-17 20:17:48 +04:00
end >>= fun () ->
pv.mempool <-
{ Mempool.known_valid =
List.rev_map fst pv.validation_result.applied ;
2017-11-17 20:17:48 +04:00
pending =
Operation_hash.Map.fold
(fun k _ s -> Operation_hash.Set.add k s)
pv.validation_result.branch_delayed @@
Operation_hash.Map.fold
(fun k _ s -> Operation_hash.Set.add k s)
pv.validation_result.branch_refused @@
Operation_hash.Set.empty } ;
2018-02-16 04:26:24 +04:00
State.Current_mempool.set (Distributed_db.chain_state pv.chain_db)
2017-11-17 20:17:48 +04:00
~head:(State.Block.hash pv.predecessor) pv.mempool >>= fun () ->
2018-06-26 13:07:12 +04:00
Lwt.return_unit
2017-11-17 20:17:48 +04:00
let fetch_operation w pv ?peer oph =
debug w
"fetching operation %a"
Operation_hash.pp_short oph ;
2017-11-17 20:17:48 +04:00
Distributed_db.Operation.fetch
~timeout:pv.limits.operation_timeout
2018-02-16 04:26:24 +04:00
pv.chain_db ?peer oph () >>= function
2017-11-17 20:17:48 +04:00
| Ok op ->
Worker.push_request_now w (Arrived (oph, op)) ;
2017-11-17 20:17:48 +04:00
Lwt.return_unit
| Error [ Distributed_db.Operation.Canceled _ ] ->
debug w
2017-11-17 20:17:48 +04:00
"operation %a included before being prevalidated"
Operation_hash.pp_short oph ;
2017-11-17 20:17:48 +04:00
Lwt.return_unit
| Error _ -> (* should not happen *)
Lwt.return_unit
let on_operation_arrived (pv : state) oph op =
2017-11-17 20:17:48 +04:00
pv.fetching <- Operation_hash.Set.remove oph pv.fetching ;
if not (Block_hash.Set.mem op.Operation.shell.branch pv.live_blocks) then begin
2018-02-16 04:26:24 +04:00
Distributed_db.Operation.clear_or_cancel pv.chain_db oph
2017-11-17 20:17:48 +04:00
(* TODO: put in a specific delayed map ? *)
end else if not (already_handled pv oph) (* prevent double inclusion on flush *) then begin
pv.pending <- Operation_hash.Map.add oph op pv.pending
end
let on_inject pv op =
let oph = Operation.hash op in
begin
if already_handled pv oph then
return pv.validation_result
else
Lwt.return pv.validation_state >>=? fun validation_state ->
Prevalidation.prevalidate
validation_state ~sort:false [ (oph, op) ] >>= fun (_, result) ->
match result.applied with
| [ app_oph, _ ] when Operation_hash.equal app_oph oph ->
2018-02-16 04:26:24 +04:00
Distributed_db.inject_operation pv.chain_db oph op >>= fun (_ : bool) ->
pv.pending <- Operation_hash.Map.add oph op pv.pending ;
return result
| _ ->
return result
end >>=? fun result ->
if List.mem_assoc oph result.applied then
2018-06-26 13:07:12 +04:00
return_unit
else
let try_in_map map proj or_else =
try
Lwt.return (Error (proj (Operation_hash.Map.find oph map)))
with Not_found -> or_else () in
try_in_map pv.refusals (fun h -> h) @@ fun () ->
try_in_map result.refused snd @@ fun () ->
try_in_map result.branch_refused snd @@ fun () ->
try_in_map result.branch_delayed snd @@ fun () ->
if Operation_hash.Set.mem oph pv.live_operations then
failwith "Injected operation %a included in a previous block."
Operation_hash.pp oph
2016-09-08 21:13:10 +04:00
else
failwith "Injected operation %a is not in prevalidation result."
Operation_hash.pp oph
let on_notify w pv peer mempool =
2017-11-17 20:17:48 +04:00
let all_ophs =
List.fold_left
(fun s oph -> Operation_hash.Set.add oph s)
mempool.Mempool.pending mempool.known_valid in
let to_fetch =
Operation_hash.Set.filter
(fun oph -> not (already_handled pv oph))
all_ophs in
pv.fetching <-
Operation_hash.Set.union
to_fetch
pv.fetching ;
Operation_hash.Set.iter
(fun oph -> Lwt.ignore_result (fetch_operation w pv ~peer oph))
2017-11-17 20:17:48 +04:00
to_fetch
2016-09-08 21:13:10 +04:00
let on_flush w pv predecessor =
2017-11-17 20:17:48 +04:00
list_pendings
2018-02-16 04:26:24 +04:00
~maintain_chain_db:pv.chain_db
2017-11-17 20:17:48 +04:00
~from_block:pv.predecessor ~to_block:predecessor
(Preapply_result.operations pv.validation_result)
>>= fun (pending, new_live_blocks, new_live_operations) ->
2017-11-17 20:17:48 +04:00
let timestamp = Time.now () in
Prevalidation.start_prevalidation
~predecessor ~timestamp () >>= fun validation_state ->
begin match validation_state with
| Error _ -> Lwt.return (validation_state, Preapply_result.empty)
| Ok validation_state ->
Prevalidation.prevalidate
validation_state ~sort:false [] >>= fun (state, result) ->
Lwt.return (Ok state, result)
end >>= fun (validation_state, validation_result) ->
debug w "%d operations were not washed by the flush"
(Operation_hash.Map.cardinal pending) ;
State.Block.protocol_hash pv.predecessor >>= fun old_protocol ->
State.Block.protocol_hash predecessor >>= fun new_protocol ->
2017-11-17 20:17:48 +04:00
pv.predecessor <- predecessor ;
pv.live_blocks <- new_live_blocks ;
pv.live_operations <- new_live_operations ;
pv.timestamp <- timestamp ;
pv.mempool <- { known_valid = [] ; pending = Operation_hash.Set.empty };
pv.pending <- pending ;
pv.in_mempool <- Operation_hash.Set.empty ;
pv.validation_result <- validation_result ;
pv.validation_state <- validation_state ;
if not (Protocol_hash.equal old_protocol new_protocol) then
pv.rpc_directory <- lazy (rpc_directory new_protocol) ;
2018-06-26 13:07:12 +04:00
return_unit
2016-09-08 21:13:10 +04:00
let on_advertise pv =
match pv.advertisement with
| `None -> () (* should not happen *)
| `Pending mempool ->
pv.advertisement <- `None ;
2018-02-16 04:26:24 +04:00
Distributed_db.Advertise.current_head pv.chain_db ~mempool pv.predecessor
let on_request
: type r. t -> r Request.t -> r tzresult Lwt.t
= fun w request ->
let pv = Worker.state w in
begin match request with
| Request.Flush hash ->
on_advertise pv ;
(* TODO: rebase the advertisement instead *)
2018-02-16 04:26:24 +04:00
let chain_state = Distributed_db.chain_state pv.chain_db in
State.Block.read chain_state hash >>=? fun block ->
on_flush w pv block >>=? fun () ->
return (() : r)
| Request.Notify (peer, mempool) ->
on_notify w pv peer mempool ;
2018-06-26 13:07:12 +04:00
return_unit
| Request.Inject op ->
on_inject pv op
| Request.Arrived (oph, op) ->
on_operation_arrived pv oph op ;
2018-06-26 13:07:12 +04:00
return_unit
| Request.Advertise ->
on_advertise pv ;
2018-06-26 13:07:12 +04:00
return_unit
end >>=? fun r ->
handle_unprocessed w pv >>= fun () ->
return r
let on_close w =
let pv = Worker.state w in
Operation_hash.Set.iter
2018-02-16 04:26:24 +04:00
(Distributed_db.Operation.clear_or_cancel pv.chain_db)
pv.fetching ;
Lwt.return_unit
2016-09-08 21:13:10 +04:00
2018-02-16 04:26:24 +04:00
let on_launch w _ (limits, chain_db) =
let chain_state = Distributed_db.chain_state chain_db in
Chain.data chain_state >>= fun
{ current_head = predecessor ; current_mempool = mempool ;
live_blocks ; live_operations } ->
State.Block.protocol_hash predecessor >>= fun protocol ->
2017-11-17 20:17:48 +04:00
let timestamp = Time.now () in
Prevalidation.start_prevalidation
~predecessor ~timestamp () >>= fun validation_state ->
begin match validation_state with
| Error _ -> Lwt.return (validation_state, Preapply_result.empty)
| Ok validation_state ->
Prevalidation.prevalidate validation_state ~sort:false []
>>= fun (validation_state, validation_result) ->
2016-09-08 21:13:10 +04:00
2017-11-17 20:17:48 +04:00
Lwt.return (Ok validation_state, validation_result)
end >>= fun (validation_state, validation_result) ->
let fetching =
List.fold_left
(fun s h -> Operation_hash.Set.add h s)
Operation_hash.Set.empty mempool.known_valid in
let pv =
2018-02-16 04:26:24 +04:00
{ limits ; chain_db ;
2017-11-17 20:17:48 +04:00
predecessor ; timestamp ; live_blocks ; live_operations ;
mempool = { known_valid = [] ; pending = Operation_hash.Set.empty };
refused = Ring.create limits.max_refused_operations ;
refusals = Operation_hash.Map.empty ;
2017-11-17 20:17:48 +04:00
fetching ;
pending = Operation_hash.Map.empty ;
in_mempool = Operation_hash.Set.empty ;
validation_result ; validation_state ;
advertisement = `None ;
rpc_directory = lazy (rpc_directory protocol) ;
} in
2017-11-17 20:17:48 +04:00
List.iter
(fun oph -> Lwt.ignore_result (fetch_operation w pv oph))
2017-11-17 20:17:48 +04:00
mempool.known_valid ;
Lwt.return pv
let on_error w r st errs =
Worker.record_event w (Event.Request (r, st, Some errs)) ;
match r with
2018-06-26 13:07:12 +04:00
| Request.(View (Inject _)) -> return_unit
| _ -> Lwt.return (Error errs)
2017-11-17 20:17:48 +04:00
let on_completion w r _ st =
2018-06-26 13:07:12 +04:00
Worker.record_event w (Event.Request (Request.view r, st, None)) ;
Lwt.return_unit
2017-11-17 20:17:48 +04:00
let table = Worker.create_table Queue
2017-11-17 20:17:48 +04:00
2018-02-16 04:26:24 +04:00
let create limits chain_db =
let chain_state = Distributed_db.chain_state chain_db in
let module Handlers = struct
type self = t
let on_launch = on_launch
let on_request = on_request
let on_close = on_close
let on_error = on_error
let on_completion = on_completion
2018-06-26 13:07:12 +04:00
let on_no_request _ = return_unit
end in
Worker.launch table limits.worker_limits
2018-02-16 04:26:24 +04:00
(State.Chain.id chain_state)
(limits, chain_db)
(module Handlers)
let shutdown = Worker.shutdown
let flush w head =
Worker.push_request_and_wait w (Flush head)
let notify_operations w peer mempool =
Worker.push_request_now w (Notify (peer, mempool))
let operations w =
let pv = Worker.state w in
2017-11-17 20:17:48 +04:00
{ pv.validation_result with
applied = List.rev pv.validation_result.applied },
pv.pending
let pending ?block w =
let pv = Worker.state w in
2017-11-17 20:17:48 +04:00
let ops = Preapply_result.operations pv.validation_result in
match block with
| Some to_block ->
list_pendings
~from_block:pv.predecessor ~to_block ops >>= fun (pending, _, _) ->
Lwt.return pending
2017-11-17 20:17:48 +04:00
| None -> Lwt.return ops
let timestamp w =
let pv = Worker.state w in
pv.timestamp
2017-11-17 20:17:48 +04:00
let inject_operation w op =
Worker.push_request_and_wait w (Inject op)
let status = Worker.status
let running_workers () = Worker.list table
let pending_requests t = Worker.pending_requests t
let current_request t = Worker.current_request t
let last_events = Worker.last_events
let rpc_directory : t option RPC_directory.t =
RPC_directory.register_dynamic_directory
RPC_directory.empty
(Block_services.mempool_path RPC_path.open_root)
(function
| None ->
Lwt.return
(RPC_directory.map (fun _ -> Lwt.return_unit) empty_rpc_directory)
| Some w ->
let pv = Worker.state w in
Lazy.force pv.rpc_directory >>= function
| Error _ ->
Lwt.return RPC_directory.empty
| Ok rpc_directory ->
Lwt.return
(RPC_directory.map (fun _ -> Lwt.return pv) rpc_directory))