test: better tracing and scalability for echo client/server

This commit is contained in:
Simon Cruanes 2025-05-02 13:48:54 -04:00
parent 74f87af96c
commit b0a29618e7
No known key found for this signature in database
GPG key ID: EBFFF6F283F3A2B4
4 changed files with 131 additions and 47 deletions

View file

@ -0,0 +1,6 @@
notes about system limits in Linux:
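- `ulimit -n 100000` raises the max number of open file descriptors (FDs) to 100000 for the current shell and every process started from it; going above the hard limit (`ulimit -Hn`) requires root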
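- `/proc/sys/net/core/netdev_max_backlog` controls the size of the kernel's queue of received packets that are waiting to be processed (used when an interface receives packets faster than the kernel can handle them), raise it (default is 1000)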
- `/proc/sys/net/core/somaxconn` is the upper limit on a socket's accept backlog: a larger value given to `listen()` is silently capped to it, so raise it (default is 4096 since Linux 5.4, 128 on older kernels)

View file

@ -1,4 +1,4 @@
(executables (executables
(names echo_server echo_client) (names echo_server echo_client)
(libraries moonpool moonpool.fib nanoev.picos nanoev-posix iostream (libraries moonpool moonpool.fib nanoev-picos nanoev-posix iostream
trace.core trace-tef)) trace.core trace-tef))

View file

@ -1,6 +1,7 @@
module Trace = Trace_core module Trace = Trace_core
module F = Moonpool_fib module F = Moonpool_fib
module IO = Nanoev_picos module IO = Nanoev_picos
module Sem = Picos_std_sync.Semaphore.Counting
[@@@ocaml.alert "-deprecated"] [@@@ocaml.alert "-deprecated"]
@ -8,8 +9,12 @@ let ( let@ ) = ( @@ )
let spf = Printf.sprintf let spf = Printf.sprintf
let pf = Printf.printf let pf = Printf.printf
let verbose = ref false let verbose = ref false
let reset_line = "\x1b[2K\r"
let n_loops_per_task = 100
let main ~runner:_ ~port ~unix_sock ~n ~n_conn () =
Sys.set_signal Sys.sigpipe Sys.Signal_ignore;
let main ~port ~unix_sock ~n ~n_conn () =
pf "connect on %s n=%d n_conn=%d\n%!" pf "connect on %s n=%d n_conn=%d\n%!"
(if unix_sock = "" then (if unix_sock = "" then
spf "localhost:%d" port spf "localhost:%d" port
@ -24,57 +29,91 @@ let main ~port ~unix_sock ~n ~n_conn () =
Unix.ADDR_UNIX unix_sock Unix.ADDR_UNIX unix_sock
in in
let remaining = Atomic.make n in
let all_done = Atomic.make 0 in
Printf.printf "connecting to port %d\n%!" port; Printf.printf "connecting to port %d\n%!" port;
let rec run_task () = let all_done = Atomic.make false in
let n = Atomic.fetch_and_add remaining (-1) in let n_queries = Atomic.make 0 in
(* limit simultaneous number of connections *)
let sem = Sem.make n_conn in
let n_active_conns = Atomic.make 0 in
let progress_loop () =
while not (Atomic.get all_done) do
let n_queries = Atomic.get n_queries in
let n_conns = Atomic.get n_active_conns in
(* progress *)
Printf.printf "%sdone %d queries, %d active connections%!" reset_line
n_queries n_conns;
Trace.counter_int ~level:Info "n-conns" n_conns;
Trace.counter_int ~level:Info "n-queries" n_queries;
let gc = Gc.quick_stat () in
Trace.counter_int ~level:Info "gc.major" gc.major_collections;
Trace.counter_int ~level:Info "gc.minor" gc.minor_collections;
Trace.counter_int ~level:Info "gc.heap-size" (gc.heap_words * 64);
Thread.delay 0.2
done
in
ignore (Thread.create progress_loop () : Thread.t);
let run_task () =
let _task_sp = let _task_sp =
Trace.enter_manual_toplevel_span ~__FILE__ ~__LINE__ "run-task" Trace.enter_manual_toplevel_span ~__FILE__ ~__LINE__ "run-task"
~data:(fun () -> [ "n", `Int n ])
in in
if n > 0 then ( Sem.acquire sem;
( (* let@ _sp = Trace.with_span ~__FILE__ ~__LINE__ "connect.client" in *) ( IO.Net_client.with_connect addr @@ fun ic oc ->
IO.Net_client.with_connect addr Atomic.incr n_active_conns;
@@ fun ic oc -> let buf = Bytes.create 32 in
let buf = Bytes.create 32 in
for _j = 1 to 100 do for _j = 1 to n_loops_per_task do
let _sp = (*let _sp =
Trace.enter_manual_sub_span ~parent:(Trace.ctx_of_span _task_sp) Trace.enter_manual_sub_span ~parent:_task_sp ~__FILE__ ~__LINE__
~__FILE__ ~__LINE__ "write.loop" ~data:(fun () -> "write.loop" ~data:(fun () -> [ "iter", `Int _j ])
[ "iter", `Int _j ]) in*)
in Atomic.incr n_queries;
Iostream.Out.output_string oc "hello";
Iostream.Out_buf.flush oc;
(* read back what we wrote *) Iostream.Out.output_string oc "hello";
Iostream.In.really_input ic buf 0 (String.length "hello"); Iostream.Out_buf.flush oc;
Trace.exit_manual_span _sp;
F.yield () (* read back what we wrote *)
done ); Iostream.In.really_input ic buf 0 (String.length "hello");
(* Trace.exit_manual_span _sp; *)
F.yield ()
done;
Atomic.decr n_active_conns;
Sem.release sem );
(* run another task *)
F.spawn_ignore run_task
) else (
(* if we're the last to exit, resolve the promise *)
let n_already_done = Atomic.fetch_and_add all_done 1 in
if n_already_done = n_conn - 1 then Printf.printf "all done\n%!"
);
Trace.exit_manual_span _task_sp Trace.exit_manual_span _task_sp
in in
let t_start = Mtime_clock.now () in
(* start the first [n_conn] tasks *) (* start the first [n_conn] tasks *)
let fibers = List.init n_conn (fun _ -> F.spawn run_task) in let fibers = List.init (n * n_conn) (fun _ -> F.spawn run_task) in
List.iter F.await fibers; List.iter F.await fibers;
Atomic.set all_done true;
let t_stop = Mtime_clock.now () in
let elapsed_s =
(Mtime.span t_start t_stop |> Mtime.Span.to_uint64_ns |> Int64.to_float)
*. 1e-9
in
(* exit when [fut_exit] is resolved *) (* exit when [fut_exit] is resolved *)
Printf.printf "done with main\n%!" Printf.printf
"%sdone with main (time=%.4fs, n queries=%d, expect=%d, %.3f req/s)\n%!"
reset_line elapsed_s (Atomic.get n_queries)
(n * n_conn * n_loops_per_task)
(float (Atomic.get n_queries) /. elapsed_s)
let () = let () =
let@ () = Trace_tef.with_setup () in let@ () = Trace_tef.with_setup () in
Trace.set_current_level Info;
Trace.set_thread_name "main"; Trace.set_thread_name "main";
let port = ref 1234 in let port = ref 1234 in
@ -96,5 +135,5 @@ let () =
let@ () = let@ () =
Nanoev_picos.Background_thread.with_setup (Nanoev_posix.create ()) Nanoev_picos.Background_thread.with_setup (Nanoev_posix.create ())
in in
F.main @@ fun _runner -> F.main @@ fun runner ->
main ~port:!port ~unix_sock:!unix_sock ~n:!n ~n_conn:!n_conn () main ~runner ~port:!port ~unix_sock:!unix_sock ~n:!n ~n_conn:!n_conn ()

View file

@ -8,13 +8,16 @@ let ( let@ ) = ( @@ )
let pf = Printf.printf let pf = Printf.printf
let spf = Printf.sprintf let spf = Printf.sprintf
let verbose = ref false let verbose = ref false
let n_reply_response = Atomic.make 0
let str_of_sockaddr = function let str_of_sockaddr = function
| Unix.ADDR_UNIX s -> s | Unix.ADDR_UNIX s -> s
| Unix.ADDR_INET (addr, port) -> | Unix.ADDR_INET (addr, port) ->
spf "%s:%d" (Unix.string_of_inet_addr addr) port spf "%s:%d" (Unix.string_of_inet_addr addr) port
let main ~port ~unix_sock ~runner () = let main ~port ~unix_sock ~max_conns ~runner () =
Sys.set_signal Sys.sigpipe Sys.Signal_ignore;
pf "serve on %s\n%!" pf "serve on %s\n%!"
(if unix_sock = "" then (if unix_sock = "" then
spf "localhost:%d" port spf "localhost:%d" port
@ -24,12 +27,15 @@ let main ~port ~unix_sock ~runner () =
let addr = let addr =
if unix_sock = "" then if unix_sock = "" then
Unix.ADDR_INET (Unix.inet_addr_loopback, port) Unix.ADDR_INET (Unix.inet_addr_loopback, port)
else else (
(* remove leftover unix socket file, if any *)
(try Sys.remove unix_sock with _ -> ());
Unix.ADDR_UNIX unix_sock Unix.ADDR_UNIX unix_sock
)
in in
let server = let server =
IO.Net_server.establish addr IO.Net_server.establish ?max_connections:max_conns addr
~spawn:(fun f -> Moonpool.spawn ~on:runner f) ~spawn:(fun f -> Moonpool.spawn ~on:runner f)
~client_handler:(fun client_addr ic oc -> ~client_handler:(fun client_addr ic oc ->
let _sp = let _sp =
@ -42,31 +48,63 @@ let main ~port ~unix_sock ~runner () =
let buf = Bytes.create 256 in let buf = Bytes.create 256 in
let continue = ref true in let continue = ref true in
while !continue do while !continue do
let n = Iostream.In.input ic buf 0 (Bytes.length buf) in match Iostream.In.input ic buf 0 (Bytes.length buf) with
if n = 0 then | exception exn ->
continue := false continue := false;
else ( Printf.eprintf "error in client handler: %s\n%!"
(Printexc.to_string exn)
| 0 -> continue := false
| n ->
Atomic.incr n_reply_response;
Iostream.Out.output oc buf 0 n; Iostream.Out.output oc buf 0 n;
Iostream.Out_buf.flush oc Iostream.Out_buf.flush oc;
) Picos.Fiber.yield ()
done; done;
Trace.exit_manual_span _sp; Trace.exit_manual_span _sp;
if !verbose then if !verbose then
pf "done with client on %s\n%!" (str_of_sockaddr client_addr)) pf "done with client on %s\n%!" (str_of_sockaddr client_addr))
in in
Printf.printf "max number of connections: %d\n%!"
(IO.Net_server.max_connections server);
if Trace.enabled () then
ignore
(Thread.create
(fun () ->
while IO.Net_server.running server do
Trace.counter_int ~level:Info "n-conns"
(IO.Net_server.n_active_connections server);
let gc = Gc.quick_stat () in
Trace.counter_int ~level:Info "gc.major" gc.major_collections;
Trace.counter_int ~level:Info "gc.minor" gc.minor_collections;
Trace.counter_int ~level:Info "n-reply-response"
(Atomic.get n_reply_response);
Trace.counter_int ~level:Info "gc.heap-size" (gc.heap_words * 64);
Thread.delay 0.2
done)
()
: Thread.t);
IO.Net_server.join server; IO.Net_server.join server;
IO.Net_server.shutdown server; IO.Net_server.shutdown server;
print_endline "exit" print_endline "exit"
let () = let () =
let@ () = Trace_tef.with_setup () in let@ () = Trace_tef.with_setup () in
Trace.set_current_level Info;
let port = ref 1234 in let port = ref 1234 in
let unix_sock = ref "" in let unix_sock = ref "" in
let max_conns = ref None in
let opts = let opts =
[ [
"-p", Arg.Set_int port, " port"; "-p", Arg.Set_int port, " port";
"--unix", Arg.Set_string unix_sock, " unix socket"; "--unix", Arg.Set_string unix_sock, " unix socket";
( "--max-conns",
Arg.Int (fun i -> max_conns := Some i),
" max number of connections" );
"-v", Arg.Set verbose, " verbose"; "-v", Arg.Set verbose, " verbose";
] ]
|> Arg.align |> Arg.align
@ -76,4 +114,5 @@ let () =
let@ () = let@ () =
Nanoev_picos.Background_thread.with_setup (Nanoev_posix.create ()) Nanoev_picos.Background_thread.with_setup (Nanoev_posix.create ())
in in
F.main @@ fun runner -> main ~port:!port ~unix_sock:!unix_sock ~runner () F.main @@ fun runner ->
main ~port:!port ~unix_sock:!unix_sock ~max_conns:!max_conns ~runner ()