(* Source file: peer_validator.ml *)
open Peer_validator_worker_state
(** Worker name: a peer validator is identified by a chain identifier paired
    with a peer identifier. *)
module Name = struct
  type t = Chain_id.t * P2p_peer.Id.t

  (* Pair encoding: chain identifier first, peer identifier second. *)
  let encoding = Data_encoding.tup2 Chain_id.encoding P2p_peer.Id.encoding

  (* Base name segments for this kind of worker. *)
  let base = ["validator"; "peer"]

  (* Prints the short form of the chain id, a colon, then the short form of
     the peer id. *)
  let pp fmt ((chain_id, peer_id) : t) =
    Format.fprintf
      fmt
      "%a:%a"
      Chain_id.pp_short
      chain_id
      P2p_peer.Id.pp_short
      peer_id

  (* Two names are equal when both components are equal. *)
  let equal ((chain_a, peer_a) : t) ((chain_b, peer_b) : t) =
    Chain_id.equal chain_a chain_b && P2p_peer.Id.equal peer_a peer_b
end
(** Requests handled by a peer validator. Both requests answer [unit] and
    fail with an error trace. *)
module Request = struct
  include Request

  type (_, _) t =
    | New_head : Block_hash.t * Block_header.t -> (unit, error trace) t
    | New_branch : Block_locator.t * Block_locator.seed -> (unit, error trace) t

  (* Projects a request onto its printable [view]: a head is summarised by
     its hash, a branch by its head hash and the estimated locator length. *)
  let view : type a b. (a, b) t -> view = function
    | New_head (block_hash, _header) -> New_head block_hash
    | New_branch (locator, seed) ->
        let length = Block_locator.estimated_length seed locator in
        New_branch (locator.head_hash, length)
end
(** Parameter and state types of the peer validator worker. *)
module Types = struct
  (* Values supplied when the worker is created. *)
  type parameters = {
    chain_db : Distributed_db.chain_db;
    block_validator : Block_validator.t;
    (* Callback invoked with each newly validated block. *)
    notify_new_block : Block_validator.new_block -> unit;
    (* Callback invoked from the worker [on_close] handler. *)
    notify_termination : unit -> unit;
    limits : Shell_limits.peer_validator_limits;
  }

  (* Per-peer mutable state. *)
  type state = {
    peer_id : P2p_peer.Id.t;
    parameters : parameters;
    (* Bootstrap pipeline currently running for this peer, if any. *)
    mutable pipeline : Bootstrap_pipeline.t option;
    mutable last_validated_head : Block_header.t;
    mutable last_advertised_head : Block_header.t;
  }

  (* Length of the given optional pipeline; [length_zero] when there is
     none. *)
  let pipeline_length pipeline =
    match pipeline with
    | Some running -> Bootstrap_pipeline.length running
    | None -> Bootstrap_pipeline.length_zero
end
(* Event definitions, used below through [Events.(emit ...)]. *)
module Events = Peer_validator_events
(* Worker implementation instantiated over the name, request and state
   modules defined above. *)
module Worker = Worker.MakeSingle (Name) (Request) (Types)
open Types
(* A peer validator is a worker whose request buffer is a dropbox. *)
type t = Worker.dropbox Worker.t
(* Metrics handle shared by all functions of this file, initialised with
   [Name.base]. *)
let metrics = Shell_metrics.Peer_validator.init Name.base
(** [bootstrap_new_branch w unknown_prefix] creates a {!Bootstrap_pipeline}
    for the locator [unknown_prefix] and waits for it to finish.

    The pipeline is recorded in the worker state while it runs and the
    reference is cleared when it completes, when it fails, or when the worker
    canceler fires. Returns [unit] on success; on failure the pipeline is
    canceled and the error is propagated. *)
let bootstrap_new_branch w unknown_prefix =
  let open Lwt_result_syntax in
  let pv = Worker.state w in
  let sender_id = Distributed_db.my_peer_id pv.parameters.chain_db in
  (* The seed names the remote peer as sender and this node as receiver. It
     is only used here to estimate the locator length reported in the
     event. *)
  let seed = {Block_locator.sender_id = pv.peer_id; receiver_id = sender_id} in
  let len = Block_locator.estimated_length seed unknown_prefix in
  let*! () = Events.(emit validating_new_branch) (pv.peer_id, len) in
  let pipeline =
    Bootstrap_pipeline.create
      ~notify_new_block:pv.parameters.notify_new_block
      ~block_header_timeout:pv.parameters.limits.block_header_timeout
      ~block_operations_timeout:pv.parameters.limits.block_operations_timeout
      pv.parameters.block_validator
      pv.peer_id
      pv.parameters.chain_db
      unknown_prefix
  in
  pv.pipeline <- Some pipeline ;
  let worker_canceler = Worker.canceler w in
  (* If the worker is canceled, forget the pipeline and cancel it too. *)
  Lwt_canceler.on_cancel worker_canceler (fun () ->
      pv.pipeline <- None ;
      Bootstrap_pipeline.cancel pipeline) ;
  let* () =
    protect
      ~canceler:worker_canceler
      ~on_error:(fun error ->
        (* Failure path: drop the reference, cancel the pipeline, then
           re-raise the same error. *)
        pv.pipeline <- None ;
        let*! () = Bootstrap_pipeline.cancel pipeline in
        fail error)
      (fun () -> Bootstrap_pipeline.wait pipeline)
  in
  (* Success path: the pipeline is done, clear the reference. *)
  pv.pipeline <- None ;
  let*! () =
    Events.(emit new_branch_validated) (pv.peer_id, unknown_prefix.head_hash)
  in
  return_unit
(** [only_if_fitness_increases w distant_header hash cont] classifies the
    block [hash] (whose header is [distant_header]) and passes the result to
    [cont]:
    - [`Known_valid] when the store already knows the block as valid; the
      header is then recorded as the last validated head of the peer;
    - [`Lower_fitness] when the fitness of [distant_header] is not strictly
      greater than the fitness of the current head; an event is emitted and
      the [Old_heads] counter of the peer metadata is incremented;
    - [`Ok] otherwise. *)
let only_if_fitness_increases w distant_header hash cont =
  let open Lwt_syntax in
  let pv = Worker.state w in
  let chain_store = Distributed_db.chain_store pv.parameters.chain_db in
  let* known_valid = Store.Block.is_known_valid chain_store hash in
  if known_valid then (
    pv.last_validated_head <- distant_header ;
    cont `Known_valid)
  else
    let* current_head = Store.Chain.current_head chain_store in
    if
      Fitness.compare
        distant_header.Block_header.shell.fitness
        (Store.Block.fitness current_head)
      <= 0
    then (
      let* () = Events.(emit ignoring_head) (pv.peer_id, hash) in
      (* Account for the stale head in the metadata of the peer. *)
      let meta =
        Distributed_db.get_peer_metadata pv.parameters.chain_db pv.peer_id
      in
      Peer_metadata.incr meta Old_heads ;
      cont `Lower_fitness)
    else cont `Ok
(** [validate_new_head w hash header] fetches the operations of block [hash]
    from the peer, one request per validation pass declared in [header], and
    submits the block to the block validator.

    After the fetch the fitness check is run again (presumably because the
    local head may have changed in the meantime). If the block is now known
    valid or no longer increases the fitness, the pending operation requests
    are cleared and the function returns [unit].

    Returns the validator errors when the block is [Invalid]. Returns [unit]
    when it is [Valid] or [Invalid_after_precheck]. *)
let validate_new_head w hash (header : Block_header.t) =
  let open Lwt_result_syntax in
  let pv = Worker.state w in
  let block_received = (pv.peer_id, hash) in
  let*! () = Events.(emit fetching_operations_for_head) block_received in
  let* operations =
    List.map_ep
      (fun i ->
        protect ~canceler:(Worker.canceler w) (fun () ->
            Distributed_db.Operations.fetch
              ~timeout:pv.parameters.limits.block_operations_timeout
              pv.parameters.chain_db
              ~peer:pv.peer_id
              (hash, i)
              header.shell.operations_hash))
      (0 -- (header.shell.validation_passes - 1))
  in
  (* Re-check the fitness now that the operations have been fetched. *)
  only_if_fitness_increases w header hash @@ function
  | `Known_valid | `Lower_fitness ->
      (* Nothing to validate: release the operation requests of every
         validation pass. *)
      List.iter
        (fun i ->
          Distributed_db.Operations.clear_or_cancel
            pv.parameters.chain_db
            (hash, i))
        (0 -- (header.shell.validation_passes - 1)) ;
      return_unit
  | `Ok -> (
      let*! () = Events.(emit requesting_new_head_validation) block_received in
      let*! v =
        Block_validator.validate
          ~notify_new_block:pv.parameters.notify_new_block
          ~precheck_and_notify:true
          pv.parameters.block_validator
          pv.parameters.chain_db
          hash
          header
          operations
      in
      match v with
      | Invalid errs ->
          (* Propagate the validation errors to the worker error handler. *)
          Lwt.return_error errs
      | Invalid_after_precheck _errs ->
          let*! () =
            Events.(emit ignoring_prechecked_invalid_block) block_received
          in
          (* Reported through the event only; the request itself succeeds. *)
          return_unit
      | Valid ->
          let*! () = Events.(emit new_head_validation_end) block_received in
          let meta =
            Distributed_db.get_peer_metadata pv.parameters.chain_db pv.peer_id
          in
          Peer_metadata.incr meta Valid_blocks ;
          return_unit)
(** [assert_acceptable_head w hash header] succeeds when the chain store
    accepts the block [hash] at the level found in [header], and fails with
    [Validation_errors.Checkpoint_error] (carrying the peer id) otherwise. *)
let assert_acceptable_head w hash (header : Block_header.t) =
  let open Lwt_result_syntax in
  let pv = Worker.state w in
  let chain_store = Distributed_db.chain_store pv.parameters.chain_db in
  let*! acceptable =
    Store.Chain.is_acceptable_block chain_store (hash, header.shell.level)
  in
  fail_unless
    acceptable
    (Validation_errors.Checkpoint_error (hash, Some pv.peer_id))
(** [may_validate_new_head w hash header] decides what to do with a head
    advertised by the peer:
    - block already known valid: emit an event and return [unit];
    - block known invalid: fail with [Known_invalid];
    - predecessor known invalid: commit the block as invalid, then fail with
      [Known_invalid];
    - predecessor not known valid: ask the peer for its current branch and
      return [unit];
    - otherwise, when the fitness increases: check that the head is
      acceptable and validate it with {!validate_new_head}. *)
let may_validate_new_head w hash (header : Block_header.t) =
  let open Lwt_result_syntax in
  let pv = Worker.state w in
  let chain_store = Distributed_db.chain_store pv.parameters.chain_db in
  let*! valid_block = Store.Block.is_known_valid chain_store hash in
  let*! invalid_block = Store.Block.is_known_invalid chain_store hash in
  let*! valid_predecessor =
    Store.Block.is_known_valid chain_store header.shell.predecessor
  in
  let*! invalid_predecessor =
    Store.Block.is_known_invalid chain_store header.shell.predecessor
  in
  let block_received = (pv.peer_id, hash) in
  if valid_block then
    let*! () =
      Events.(emit ignoring_previously_validated_block) block_received
    in
    return_unit
  else if invalid_block then
    let*! () = Events.(emit ignoring_invalid_block) block_received in
    tzfail Validation_errors.Known_invalid
  else if invalid_predecessor then
    let*! () = Events.(emit ignoring_invalid_block) block_received in
    (* Record the block itself as invalid before failing. *)
    let* _ =
      Distributed_db.commit_invalid_block
        pv.parameters.chain_db
        hash
        header
        [Validation_errors.Known_invalid]
    in
    tzfail Validation_errors.Known_invalid
  else if not valid_predecessor then (
    let*! () = Events.(emit missing_new_head_predecessor) block_received in
    (* The predecessor is unknown: request the whole branch from the peer. *)
    Distributed_db.Request.current_branch pv.parameters.chain_db pv.peer_id ;
    return_unit)
  else
    only_if_fitness_increases w header hash @@ function
    | `Known_valid | `Lower_fitness -> return_unit
    | `Ok ->
        let* () = assert_acceptable_head w hash header in
        validate_new_head w hash header
(** [may_validate_new_branch w locator] handles a branch advertised by the
    peer. Nothing is done unless the head of [locator] increases the fitness
    and is acceptable. The unknown prefix of the locator is then computed
    against the store and:
    - an empty history under a known valid block needs no work;
    - a single-step history whose only element is the predecessor of the head
      is validated as a plain new head;
    - any other prefix under a known valid block is bootstrapped through
      {!bootstrap_new_branch};
    - no known ancestor fails with [Unknown_ancestor];
    - a known invalid block fails with [Invalid_locator]. *)
let may_validate_new_branch w locator =
  let open Lwt_result_syntax in
  let pv = Worker.state w in
  let {Block_locator.head_header = distant_header; head_hash = distant_hash; _}
      =
    locator
  in
  only_if_fitness_increases w distant_header distant_hash @@ function
  | `Known_valid | `Lower_fitness -> return_unit
  | `Ok -> (
      let* () = assert_acceptable_head w distant_hash distant_header in
      let chain_store = Distributed_db.chain_store pv.parameters.chain_db in
      let block_received = (pv.peer_id, distant_hash) in
      let*! v =
        Block_locator.unknown_prefix
          ~is_known:(Store.Block.validity chain_store)
          locator
      in
      match v with
      | Known_valid, {history = []; _} -> return_unit
      | Known_valid, {history = [x]; head_header; head_hash}
        when Block_hash.equal x head_header.shell.predecessor ->
          (* The branch is one block long: validate it as a head. *)
          validate_new_head w head_hash head_header
      | Known_valid, prefix_locator -> bootstrap_new_branch w prefix_locator
      | Unknown, _ ->
          (* No block of the locator is known locally. *)
          let*! () =
            Events.(emit ignoring_branch_without_common_ancestor) block_received
          in
          tzfail Validation_errors.Unknown_ancestor
      | Known_invalid, _ ->
          let*! () =
            Events.(emit ignoring_branch_with_invalid_locator) block_received
          in
          tzfail (Validation_errors.Invalid_locator (pv.peer_id, locator)))
(** Handler run by the worker when no request arrived: bumps the
    corresponding metric, emits an event carrying the configured new-head
    timeout, and asks the peer for its current head. *)
let on_no_request w =
  let open Lwt_syntax in
  let state = Worker.state w in
  let peer = state.peer_id and params = state.parameters in
  Prometheus.Counter.inc_one metrics.on_no_request ;
  let* () =
    Events.(emit no_new_head_from_peer)
      (peer, params.limits.new_head_request_timeout)
  in
  Distributed_db.Request.current_head_from_peer params.chain_db peer ;
  Lwt.return_unit
(** Request handler of the worker: emits a processing event, then dispatches
    a [New_head] to {!may_validate_new_head} and a [New_branch] to
    {!may_validate_new_branch}. *)
let on_request (type a b) w (req : (a, b) Request.t) : (a, b) result Lwt.t =
  let open Lwt_syntax in
  let pv = Worker.state w in
  match req with
  | Request.New_head (hash, header) ->
      let* () = Events.(emit processing_new_head) (pv.peer_id, hash) in
      may_validate_new_head w hash header
  | Request.New_branch (locator, _seed) ->
      (* The seed is only needed to build the request view; it is not used
         for validation. *)
      let* () =
        Events.(emit processing_new_branch) (pv.peer_id, locator.head_hash)
      in
      may_validate_new_branch w locator
(** Completion handler: increments the completion counter matching the kind
    of request, then emits a [request_completed] event with the request view
    and its status. *)
let on_completion (type a request_error) _w (r : (a, request_error) Request.t) _
    st =
  let completed_counter =
    match r with
    | Request.New_head _ -> metrics.new_head_completed
    | Request.New_branch _ -> metrics.new_branch_completed
  in
  Prometheus.Counter.inc_one completed_counter ;
  Events.(emit request_completed) (Request.view r, st)
(** Error handler of the worker. It inspects the first error of the trace
    [err] raised while processing [request] and decides whether to return
    [Ok ()] or to return the trace as an [Error].
    NOTE(review): how the worker framework reacts to [Ok] versus [Error] is
    not visible in this file - confirm against the worker library.

    Summary by first error:
    - invalid locator / invalid block: greylist the peer, trigger shutdown,
      return the error;
    - system error: log and return [Ok];
    - unavailable protocol: try to fetch and compile it; on success ask the
      peer for its head again, otherwise return the error;
    - unknown ancestor / too short locator: trigger shutdown, return [Ok];
    - operation fetch canceled: [Ok] only for a [New_head] that is now known
      valid, the error otherwise;
    - [Canceled]: trigger shutdown, return [Ok];
    - anything else: log and return the error. *)
let on_error (type a b) w st (request : (a, b) Request.t) (err : b) :
    unit tzresult Lwt.t =
  let open Lwt_syntax in
  let pv = Worker.state w in
  let on_error_trace err =
    let request_view = Request.view request in
    match err with
    | (( Validation_errors.Invalid_locator _
       | Block_validator_errors.Invalid_block _ ) as e)
      :: _ ->
        (* The peer sent invalid data: greylist it and stop this worker. *)
        let* () = Distributed_db.greylist pv.parameters.chain_db pv.peer_id in
        let* () =
          Events.(emit terminating_worker)
            (pv.peer_id, "invalid data received: kickban")
        in
        (match e with
        | Validation_errors.Invalid_locator _ ->
            Prometheus.Counter.inc_one metrics.invalid_locator
        | Block_validator_errors.Invalid_block _ ->
            Prometheus.Counter.inc_one metrics.invalid_block
        | _ -> (* not reachable: [e] comes from the or-pattern above *) ()) ;
        Worker.trigger_shutdown w ;
        let* () = Events.(emit request_error) (request_view, st, err) in
        Lwt.return_error err
    | Block_validator_errors.System_error _ :: _ ->
        (* Counted and logged, but not reported as a failure. *)
        Prometheus.Counter.inc_one metrics.system_error ;
        let* () = Events.(emit request_error) (request_view, st, err) in
        return_ok_unit
    | Block_validator_errors.Unavailable_protocol {protocol; _} :: _ -> (
        Prometheus.Counter.inc_one metrics.unavailable_protocol ;
        let* fetched_and_compiled =
          Block_validator.fetch_and_compile_protocol
            pv.parameters.block_validator
            ~peer:pv.peer_id
            ~timeout:pv.parameters.limits.protocol_timeout
            protocol
        in
        match fetched_and_compiled with
        | Ok _ ->
            (* The protocol is now available: ask the peer for its head
               again. *)
            Distributed_db.Request.current_head_from_peer
              pv.parameters.chain_db
              pv.peer_id ;
            return_ok_unit
        | Error _ ->
            (* The protocol could not be obtained: report the original
               trace. *)
            let* () =
              Events.(emit terminating_worker)
                ( pv.peer_id,
                  Format.asprintf
                    "missing protocol: %a"
                    Protocol_hash.pp
                    protocol )
            in
            let* () = Events.(emit request_error) (request_view, st, err) in
            Lwt.return_error err)
    | (( Validation_errors.Unknown_ancestor
       | Validation_errors.Too_short_locator _ ) as e)
      :: _ ->
        (match e with
        | Validation_errors.Unknown_ancestor ->
            Prometheus.Counter.inc_one metrics.unknown_ancestor
        | Validation_errors.Too_short_locator _ ->
            Prometheus.Counter.inc_one metrics.too_short_locator
        | _ -> (* not reachable: [e] comes from the or-pattern above *) ()) ;
        let* () =
          Events.(emit terminating_worker)
            ( pv.peer_id,
              Format.asprintf "unknown ancestor or too short locator: kick" )
        in
        let* () = Events.(emit insufficient_history) pv.peer_id in
        Worker.trigger_shutdown w ;
        return_ok_unit
    | Distributed_db.Operations.Canceled _ :: _ -> (
        (* An operation fetch was canceled. For a [New_head] request this is
           not a failure when the block is known valid by now. *)
        match request_view with
        | New_head hash -> (
            let chain_store =
              Distributed_db.chain_store pv.parameters.chain_db
            in
            let* b = Store.Block.is_known_valid chain_store hash in
            match b with
            | true ->
                Prometheus.Counter.inc_one
                  metrics.operations_fetching_canceled_new_known_valid_head ;
                return_ok_unit
            | false ->
                Prometheus.Counter.inc_one
                  metrics.operations_fetching_canceled_new_unknown_head ;
                Lwt.return_error err)
        | _ ->
            Prometheus.Counter.inc_one
              metrics.operations_fetching_canceled_new_branch ;
            Lwt.return_error err)
    | Canceled :: _ ->
        (* Reported as a peer disconnection; the worker is shut down. *)
        let* () =
          Events.(emit terminating_worker)
            (pv.peer_id, Format.asprintf "canceled")
        in
        let* () = Peer_validator_events.(emit peer_disconnection) pv.peer_id in
        Worker.trigger_shutdown w ;
        return_ok_unit
    | _ ->
        Prometheus.Counter.inc_one metrics.unknown_error ;
        let* () = Events.(emit request_error) (request_view, st, err) in
        Lwt.return_error err
  in
  (* Matching on the constructor lets the type checker learn that [b] is
     [error trace], which [on_error_trace] requires; both branches do the
     same thing. *)
  match request with
  | New_head _ -> on_error_trace err
  | New_branch _ -> on_error_trace err
(** Close handler: starts disconnecting the peer without waiting for the
    disconnection promise, then calls the termination callback. *)
let on_close w =
  let {peer_id; parameters = {chain_db; notify_termination; _}; _} =
    Worker.state w
  in
  (* The promise returned by [disconnect] is deliberately not awaited. *)
  ignore
    (Distributed_db.disconnect ~reason:"peer validator shutdown" chain_db peer_id
      : unit Lwt.t) ;
  notify_termination () ;
  Lwt.return_unit
(* Launching cannot fail: the error type has no constructor. *)
type launch_error = |
(** Launch handler: builds the initial worker state for the peer found in
    the second component of [name]. Both head fields start at the header of
    the genesis block of the chain store. Also increments the [connections]
    metric. *)
let on_launch _ name parameters : (_, launch_error) result Lwt.t =
  let open Lwt_syntax in
  let chain_store = Distributed_db.chain_store parameters.chain_db in
  let* genesis = Store.Chain.genesis_block chain_store in
  (* [pv] and [notify_new_block] are mutually recursive: the state stores a
     wrapped callback which first records the new block header in
     [pv.last_validated_head] and then calls the callback given by the
     caller. *)
  let rec pv =
    {
      peer_id = snd name;
      parameters = {parameters with notify_new_block};
      pipeline = None;
      last_validated_head = Store.Block.header genesis;
      last_advertised_head = Store.Block.header genesis;
    }
  and notify_new_block ({block; _} as new_block) =
    pv.last_validated_head <- Store.Block.header block ;
    parameters.notify_new_block new_block
  in
  Prometheus.Counter.inc_one metrics.connections ;
  Lwt.return (Ok pv)
(** Worker table backed by a dropbox. [merge] decides which request stays in
    the dropbox when a new one ([neu]) arrives while another ([old]) may
    still be pending, and records the advertised head in the state:
    - a new branch always replaces whatever was pending;
    - a new head replaces a pending head, or fills an empty dropbox, but
      never replaces a pending branch. *)
let table =
  let merge w (Worker.Any_request neu) old =
    let pv = Worker.state w in
    match neu with
    | Request.New_branch (locator, _) ->
        pv.last_advertised_head <- locator.Block_locator.head_header ;
        Some (Worker.Any_request neu)
    | Request.New_head (_, header) -> (
        pv.last_advertised_head <- header ;
        (* A pending branch request takes precedence over a new head. *)
        match old with
        | Some (Worker.Any_request (Request.New_branch _) as old) ->
            Some old
        | Some (Worker.Any_request (Request.New_head _)) ->
            Some (Any_request neu)
        | None -> Some (Any_request neu))
  in
  Worker.create_table (Dropbox {merge})
(** [create ?notify_new_block ?notify_termination limits block_validator
    chain_db peer_id] launches a peer validator worker for [peer_id] on the
    chain of [chain_db] and returns it. Both callbacks default to functions
    that do nothing. The worker timeout is
    [limits.new_head_request_timeout]. *)
let create ?(notify_new_block = fun _ -> ()) ?(notify_termination = fun _ -> ())
    limits block_validator chain_db peer_id =
  let chain_id = Store.Chain.chain_id (Distributed_db.chain_store chain_db) in
  let worker_name = (chain_id, peer_id) in
  let worker_parameters =
    {chain_db; block_validator; notify_new_block; notify_termination; limits}
  in
  (* Handlers defined in this file, packed as a first-class module. *)
  let module Handlers = struct
    type self = t

    type nonrec launch_error = launch_error

    let on_launch = on_launch

    let on_request = on_request

    let on_close = on_close

    let on_error = on_error

    let on_completion = on_completion

    let on_no_request = on_no_request
  end in
  let open Lwt_syntax in
  (* [launch_error] has no constructor, so [Ok] is the only possible case. *)
  let* (Ok worker) =
    Worker.launch
      table
      ~timeout:limits.new_head_request_timeout
      worker_name
      worker_parameters
      (module Handlers)
  in
  Lwt.return worker
(** [notify_branch w locator] puts a [New_branch] request in the dropbox of
    [w]. The accompanying seed names the remote peer as sender and this node
    as receiver. *)
let notify_branch w locator =
  let {peer_id; parameters = {chain_db; _}; _} = Worker.state w in
  let seed : Block_locator.seed =
    {sender_id = peer_id; receiver_id = Distributed_db.my_peer_id chain_db}
  in
  Worker.Dropbox.put_request w (New_branch (locator, seed))
(** [notify_head w hash header] puts a [New_head] request for the block
    [hash] with header [header] in the dropbox of [w]. *)
let notify_head w hash header =
  Worker.Dropbox.put_request w (New_head (hash, header))
(** Shuts the given peer validator down via [Worker.shutdown]. *)
let shutdown worker = Worker.shutdown worker
(** Identifier of the peer this validator is attached to. *)
let peer_id w = (Worker.state w).peer_id
(* Thin re-exports of the generic worker introspection functions. *)
let status = Worker.status
let information = Worker.information
(* All workers currently registered in [table]. *)
let running_workers () = Worker.list table
let current_request t = Worker.current_request t
(** Length of the bootstrap pipeline currently stored in the worker state,
    as computed by [Types.pipeline_length]. *)
let pipeline_length w = Types.pipeline_length (Worker.state w).pipeline
(** Entry points exposed for tests only. *)
module Internal_for_tests = struct
  (* Runs the file-level [validate_new_head] on the worker [t] for the block
     [block_hash] with header [block_header]. *)
  let validate_new_head (t : t) block_hash block_header =
    let open Lwt_result_syntax in
    let* () = validate_new_head t block_hash block_header in
    return_unit
end