[perf] trace pipe operations

Summary: We can fill the gaps in the trace now: they correspond to processes waiting on pipes. This suggests a more efficient protocol would help perf, at least on the small example I tried. Anyhow, it shows it's useful to trace pipe operations. Some small gaps remain but they look like they could be explained by rounding errors. Reviewed By: mbouaziz Differential Revision: D9934437 fbshipit-source-id: 1d5f53a6d
7 years ago · 590f1faac5
parent 5a894df3af
commit 590f1faac5
1 changed files with 68 additions and 41 deletions
--- a/infer/src/base/ProcessPool.ml
+++ b/infer/src/base/ProcessPool.ml
@ -60,7 +60,13 @@ type 'a boss_message =
  | GoHome  (** all tasks done, prepare for teardown *)
 (** convenience function to send data down pipes without forgetting to flush *)
-let marshal_to_pipe fd x = Marshal.to_channel fd x [] ; Out_channel.flush fd
+let marshal_to_pipe fd x =
  PerfEvent.log (fun logger ->
      PerfEvent.log_begin_event logger ~categories:["sys"] ~name:"send to pipe" () ) ;
  Marshal.to_channel fd x [] ;
  Out_channel.flush fd ;
  PerfEvent.(log (fun logger -> log_end_event logger ()))
 (** like [Unix.read] but reads until [len] bytes have been read *)
 let rec really_read ?(pos = 0) ~len fd ~buf =
@ -73,13 +79,45 @@ let rec really_read ?(pos = 0) ~len fd ~buf =
 (** return [true] if the [file_descr] is ready for reading after at most [timeout] has
     elapsed *)
-let wait_for_updates file_descr timeout =
+let wait_for_updates pool buffer =
  let file_descr = pool.children_updates in
  let timeout = if TaskBar.is_interactive pool.task_bar then refresh_timeout else `Never in
  (* Use select(2) so that we can both wait on the pipe of children updates and wait for a
     timeout. The timeout is for giving a chance to the taskbar of refreshing from time to time. *)
  let {Unix.Select_fds.read= read_fds} =
    Unix.select ~read:[file_descr] ~write:[] ~except:[] ~timeout ()
  in
-  match read_fds with _ :: _ :: _ -> assert false | [] -> false | [_file_descr] -> true
+  match read_fds with
  | _ :: _ :: _ ->
      assert false
  | [] ->
      (* not ready *) None
  | [_file_descr] ->
      (* Read one OCaml value at a time. This is done by first reading the header of the marshalled
       value (fixed size), then get the total size of the data from that header, then request a
       read of the full OCaml value.
       This way the buffer is used for only one OCaml value at a time. This is simpler (values do
       not overlap across the end of a read and the beginning of another) and means we do not need
       a large buffer as long as messages are never bigger than the buffer.
       This works somewhat like [Marshal.from_channel] but uses the file descriptor directly
       instead of an [in_channel]. Do *not* read from the pipe via an [in_channel] as they read
       as much as possible eagerly. This can empty the pipe without us having a way to tell that
       there is more to read anymore since the [select] call will return that there is nothing to
       read. *)
      really_read pool.children_updates ~buf:buffer ~len:Marshal.header_size ;
      let data_size = Marshal.data_size buffer 0 in
      really_read pool.children_updates ~buf:buffer ~pos:Marshal.header_size ~len:data_size ;
      Some (Marshal.from_bytes buffer 0)
 let wait_for_updates pool buffer =
  PerfEvent.log (fun logger ->
      PerfEvent.log_begin_event logger ~categories:["sys"] ~name:"wait for event" () ) ;
  let update = wait_for_updates pool buffer in
  PerfEvent.(log (fun logger -> log_end_event logger ())) ;
  update
 let killall pool ~slot status =
@ -106,43 +144,26 @@ let process_updates pool buffer =
  has_dead_child pool
  |> Option.iter ~f:(fun (slot, status) ->
         killall pool ~slot (Unix.Exit_or_signal.to_string_hum status) ) ;
-  let timeout = if TaskBar.is_interactive pool.task_bar then refresh_timeout else `Never in
+  match wait_for_updates pool buffer with
-  if wait_for_updates pool.children_updates timeout then (
+  | Some (UpdateStatus (slot, t, status)) ->
-    (* Read one OCaml value at a time. This is done by first reading the header of the marshalled
+      TaskBar.update_status pool.task_bar ~slot t status
-       value (fixed size), then get the total size of the data from that header, then request a
+  | Some (Crash slot) ->
-       read of the full OCaml value.
+      let {pid} = pool.slots.(slot) in
-
+      (* clean crash, give the child process a chance to cleanup *)
-       This way the buffer is used for only one OCaml value at a time. This is simpler (values do
+      Unix.wait (`Pid pid) |> ignore ;
-       not overlap across the end of a read and the beginning of another) and means we do not need
+      killall pool ~slot "see backtrace above"
-       a large buffer as long as messages are never bigger than the buffer.
+  | Some (Ready slot) -> (
-
+      TaskBar.tasks_done_add pool.task_bar 1 ;
-       This works somewhat like [Marshal.from_channel] but uses the file descriptor directly
+      match pool.tasks with
-       instead of an [in_channel]. Do *not* read from the pipe via an [in_channel] as they read
+      | [] ->
-       as much as possible eagerly. This can empty the pipe without us having a way to tell that
+          TaskBar.update_status pool.task_bar ~slot (Mtime_clock.now ()) "idle" ;
-       there is more to read anymore since the [select] call will return that there is nothing to
+          pool.idle_children <- pool.idle_children + 1
-       read. *)
+      | x :: tasks ->
-    really_read pool.children_updates ~buf:buffer ~len:Marshal.header_size ;
+          pool.tasks <- tasks ;
-    let data_size = Marshal.data_size buffer 0 in
+          let {down_pipe} = pool.slots.(slot) in
-    really_read pool.children_updates ~buf:buffer ~pos:Marshal.header_size ~len:data_size ;
+          marshal_to_pipe down_pipe (Do x) )
-    let update = Marshal.from_bytes buffer 0 in
+  | None ->
-    match update with
+      ()
    | UpdateStatus (slot, t, status) ->
        TaskBar.update_status pool.task_bar ~slot t status
    | Crash slot ->
        let {pid} = pool.slots.(slot) in
        (* clean crash, give the child process a chance to cleanup *)
        Unix.wait (`Pid pid) |> ignore ;
        killall pool ~slot "see backtrace above"
    | Ready slot -> (
        TaskBar.tasks_done_add pool.task_bar 1 ;
        match pool.tasks with
        | [] ->
            TaskBar.update_status pool.task_bar ~slot (Mtime_clock.now ()) "idle" ;
            pool.idle_children <- pool.idle_children + 1
        | x :: tasks ->
            pool.tasks <- tasks ;
            let {down_pipe} = pool.slots.(slot) in
            marshal_to_pipe down_pipe (Do x) ) )
 (** terminate all worker processes *)
@ -220,7 +241,13 @@ let fork_child ~child_prelude ~slot (updates_r, updates_w) ~f =
      in
      ProcessPoolState.update_status := update_status ;
      let orders_ic = Unix.in_channel_of_descr to_child_r in
-      let receive_from_parent () = Marshal.from_channel orders_ic in
+      let receive_from_parent () =
        PerfEvent.log (fun logger ->
            PerfEvent.log_begin_event logger ~categories:["sys"] ~name:"receive from pipe" () ) ;
        let x = Marshal.from_channel orders_ic in
        PerfEvent.(log (fun logger -> log_end_event logger ())) ;
        x
      in
      child_loop ~slot send_to_parent receive_from_parent ~f ;
      Out_channel.close updates_oc ;
      In_channel.close orders_ic ;