Files
agentic-kvc/v2/exp_a_tier_latency/results/rdma.json
Gahow Wang dc8e6dd5a8 v2 exp(a): add remote KV-store (RDMA) tier
Extends the hit-latency microbench to a 4th tier: a remote global-KV-store
hit over RDMA, the Mooncake-Store mechanism. Two kv_both MooncakeConnector
instances (run_rdma.sh); for each prefix length, instance B serves the
request by pulling instance A's cached prefix over RDMA (do_remote_prefill,
via microbench/fresh_setup/mb2_kv_transfer.py) instead of recomputing -- the
timed pull is the remote-hit latency.

Result (TTFT p50, 11 reps): strict tier ordering
GPU(HBM) < CPU(local DRAM) < remote-RDMA-store << miss, gaps growing with
context. At 64k: GPU 0.11s, CPU 0.27s, RDMA 0.97s, miss 15.2s -> miss/RDMA
15.8x, RDMA/CPU 3.6x, CPU/GPU 2.4x. So a global RDMA store is a real win
over recompute (the blog's 46x) but pays the NIC tax (~5-7 GB/s effective)
and sits a tier below local CPU and two below GPU -- reinforcing
GPU-hit-first. README + figure updated to four tiers.

Co-Authored-By: Claude Opus 4.8 <noreply@anthropic.com>
2026-05-30 12:48:37 +08:00

1013 lines
34 KiB
JSON

{
"model": "/home/admin/cpfs/wjh/models/Qwen/Qwen3-Coder-30B-A3B-Instruct",
"kv_bytes_per_token": 98304,
"src_host": "127.0.0.1",
"src_port": 8000,
"dst_host": "127.0.0.1",
"dst_port": 8001,
"config_label": "rdma-intra-node",
"raw": [
{
"input_tokens": 1024,
"session": "42945df8aa2947dea7856aec043953c4",
"t_step1_client_unix": 1780113654.6796737,
"t_step2_client_unix": 1780113655.3103006,
"t_step2_end_unix": 1780113655.7742817,
"t_prefill_s": 0.630586825980572,
"t_transfer_s": 0.46393222000915557,
"t_followup_s": 0.09882230299990624,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 1024,
"session": "574133556117480ea4433033ee16ef7d",
"t_step1_client_unix": 1780113655.8735948,
"t_step2_client_unix": 1780113655.9512424,
"t_step2_end_unix": 1780113656.0120106,
"t_prefill_s": 0.07761351700173691,
"t_transfer_s": 0.06073612501495518,
"t_followup_s": 0.047241352003766224,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 1024,
"session": "74de5f623dda4e3ab9bef978237c058a",
"t_step1_client_unix": 1780113656.0597408,
"t_step2_client_unix": 1780113656.136515,
"t_step2_end_unix": 1780113656.1980197,
"t_prefill_s": 0.07674612698610872,
"t_transfer_s": 0.06146429298678413,
"t_followup_s": 0.04567234200658277,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 1024,
"session": "ae5339f421184215a06ee0406d70c6db",
"t_step1_client_unix": 1780113656.2442205,
"t_step2_client_unix": 1780113656.3202548,
"t_step2_end_unix": 1780113656.3829181,
"t_prefill_s": 0.07600510100019164,
"t_transfer_s": 0.06263405701611191,
"t_followup_s": 0.045199740008683875,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 1024,
"session": "108018399ef64e66a9780f032bd5f1d2",
"t_step1_client_unix": 1780113656.4285796,
"t_step2_client_unix": 1780113656.5039103,
"t_step2_end_unix": 1780113656.5650918,
"t_prefill_s": 0.07530323401442729,
"t_transfer_s": 0.06115360799594782,
"t_followup_s": 0.047417668014531955,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 1024,
"session": "4f147b3685f348599ee6d31f592d3d68",
"t_step1_client_unix": 1780113656.613002,
"t_step2_client_unix": 1780113656.688678,
"t_step2_end_unix": 1780113656.7499766,
"t_prefill_s": 0.07563983497675508,
"t_transfer_s": 0.061254432977875695,
"t_followup_s": 0.05035233299713582,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 1024,
"session": "7185314a355d4fb1a7be63667bb5d532",
"t_step1_client_unix": 1780113656.8008058,
"t_step2_client_unix": 1780113656.876437,
"t_step2_end_unix": 1780113656.9365327,
"t_prefill_s": 0.0756044389854651,
"t_transfer_s": 0.0600691509898752,
"t_followup_s": 0.04694663899135776,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 1024,
"session": "a75befce806b49ca8b4bc839d398a836",
"t_step1_client_unix": 1780113656.9840212,
"t_step2_client_unix": 1780113657.0596485,
"t_step2_end_unix": 1780113657.121014,
"t_prefill_s": 0.07559421702171676,
"t_transfer_s": 0.061336473998380825,
"t_followup_s": 0.04504776999237947,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 1024,
"session": "5eed050534974087b585636f8626d36b",
"t_step1_client_unix": 1780113657.1665282,
"t_step2_client_unix": 1780113657.2422314,
"t_step2_end_unix": 1780113657.3042758,
"t_prefill_s": 0.07567335499334149,
"t_transfer_s": 0.062015656993025914,
"t_followup_s": 0.044170998997287825,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 1024,
"session": "38ad990f52254bf39487a0ba49780d8b",
"t_step1_client_unix": 1780113657.3489134,
"t_step2_client_unix": 1780113657.425841,
"t_step2_end_unix": 1780113657.485667,
"t_prefill_s": 0.07690018997527659,
"t_transfer_s": 0.05979751900304109,
"t_followup_s": 0.047392740001669154,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 1024,
"session": "d01e4123b1b54d5e8578ec06bcb198f0",
"t_step1_client_unix": 1780113657.533507,
"t_step2_client_unix": 1780113657.6109633,
"t_step2_end_unix": 1780113657.673547,
"t_prefill_s": 0.07741417599027045,
"t_transfer_s": 0.0625474060070701,
"t_followup_s": 0.04817350400844589,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 2048,
"session": "62ff1956604d459e84052715e7ed8ba7",
"t_step1_client_unix": 1780113657.7226295,
"t_step2_client_unix": 1780113657.9077578,
"t_step2_end_unix": 1780113657.985153,
"t_prefill_s": 0.18509869498666376,
"t_transfer_s": 0.07735455100191757,
"t_followup_s": 0.046408719004830346,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 2048,
"session": "ec7b97db9dae4bc888c91b65c5efabba",
"t_step1_client_unix": 1780113658.0324116,
"t_step2_client_unix": 1780113658.1642551,
"t_step2_end_unix": 1780113658.2397475,
"t_prefill_s": 0.1318151500017848,
"t_transfer_s": 0.07546432898379862,
"t_followup_s": 0.04965048600570299,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 2048,
"session": "082ed4f2baec4107acf0dbebabbcf32f",
"t_step1_client_unix": 1780113658.2902431,
"t_step2_client_unix": 1780113658.4218829,
"t_step2_end_unix": 1780113658.494315,
"t_prefill_s": 0.1316128930193372,
"t_transfer_s": 0.07240396799170412,
"t_followup_s": 0.04556456100544892,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 2048,
"session": "890e243bc7f742c19a899cd19160e6ce",
"t_step1_client_unix": 1780113658.540683,
"t_step2_client_unix": 1780113658.6717823,
"t_step2_end_unix": 1780113658.7469842,
"t_prefill_s": 0.13105839598574676,
"t_transfer_s": 0.07517452799947932,
"t_followup_s": 0.04641962700407021,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 2048,
"session": "e4ca5aef90be4b45bc2222ad3c637581",
"t_step1_client_unix": 1780113658.7943006,
"t_step2_client_unix": 1780113658.9255776,
"t_step2_end_unix": 1780113659.0016084,
"t_prefill_s": 0.13125143098295666,
"t_transfer_s": 0.07600446898140945,
"t_followup_s": 0.04827121601556428,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 2048,
"session": "64e21909088043e98e7532361d747128",
"t_step1_client_unix": 1780113659.0507092,
"t_step2_client_unix": 1780113659.1820831,
"t_step2_end_unix": 1780113659.2554085,
"t_prefill_s": 0.13133879398810677,
"t_transfer_s": 0.07329847698565573,
"t_followup_s": 0.050039641006151214,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 2048,
"session": "8d3cb21a4f1a4daa94d31a48d969188a",
"t_step1_client_unix": 1780113659.3063629,
"t_step2_client_unix": 1780113659.437705,
"t_step2_end_unix": 1780113659.5105412,
"t_prefill_s": 0.13131436699768528,
"t_transfer_s": 0.07280980699579231,
"t_followup_s": 0.045990444981725886,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 2048,
"session": "a949f45bf00e4b6f9e282a48d2f54ae9",
"t_step1_client_unix": 1780113659.5574262,
"t_step2_client_unix": 1780113659.6894715,
"t_step2_end_unix": 1780113659.763246,
"t_prefill_s": 0.13201635199948214,
"t_transfer_s": 0.07374655400053598,
"t_followup_s": 0.04740602700621821,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 2048,
"session": "a1350bc4af1d4a95a8d7870aac6c30d4",
"t_step1_client_unix": 1780113659.8115327,
"t_step2_client_unix": 1780113659.94307,
"t_step2_end_unix": 1780113660.0165753,
"t_prefill_s": 0.13151001499500126,
"t_transfer_s": 0.07347742197453044,
"t_followup_s": 0.054559190990403295,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 2048,
"session": "0cbada3f1cf34ad98150c7cd05df9e81",
"t_step1_client_unix": 1780113660.0719872,
"t_step2_client_unix": 1780113660.2065787,
"t_step2_end_unix": 1780113660.2800386,
"t_prefill_s": 0.13456111898995005,
"t_transfer_s": 0.07343242000206374,
"t_followup_s": 0.04842582900892012,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 2048,
"session": "086166dcac9f4cf587152003a665dd6d",
"t_step1_client_unix": 1780113660.3293216,
"t_step2_client_unix": 1780113660.4612148,
"t_step2_end_unix": 1780113660.5348513,
"t_prefill_s": 0.13186514400877059,
"t_transfer_s": 0.07360914399032481,
"t_followup_s": 0.04667951900046319,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 4096,
"session": "e16840958b4e42378aa2f474224f7c47",
"t_step1_client_unix": 1780113660.5832062,
"t_step2_client_unix": 1780113660.8487082,
"t_step2_end_unix": 1780113660.9490895,
"t_prefill_s": 0.26547358598327264,
"t_transfer_s": 0.10033372900215909,
"t_followup_s": 0.04891211100039072,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 4096,
"session": "8119bfc1b947496e8434bc2dd780ddf2",
"t_step1_client_unix": 1780113660.9995859,
"t_step2_client_unix": 1780113661.2600472,
"t_step2_end_unix": 1780113661.3582017,
"t_prefill_s": 0.2604305710119661,
"t_transfer_s": 0.09812465400318615,
"t_followup_s": 0.0544344789814204,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 4096,
"session": "cb517bfea1ac46058ffbf918582c74d4",
"t_step1_client_unix": 1780113661.414242,
"t_step2_client_unix": 1780113661.674581,
"t_step2_end_unix": 1780113661.7718108,
"t_prefill_s": 0.2603055170038715,
"t_transfer_s": 0.09719818198936991,
"t_followup_s": 0.0503446809889283,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 4096,
"session": "89eabc4ad0534b4a934b1e852050c6f5",
"t_step1_client_unix": 1780113661.823718,
"t_step2_client_unix": 1780113662.0844855,
"t_step2_end_unix": 1780113662.1830976,
"t_prefill_s": 0.2607354299980216,
"t_transfer_s": 0.09858069600886665,
"t_followup_s": 0.04950785997789353,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 4096,
"session": "b644572bba324d829a249aaeeb22ee54",
"t_step1_client_unix": 1780113662.2342994,
"t_step2_client_unix": 1780113662.4946663,
"t_step2_end_unix": 1780113662.5922973,
"t_prefill_s": 0.26033472700510174,
"t_transfer_s": 0.09760292299324647,
"t_followup_s": 0.05018276898772456,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 4096,
"session": "01faaeab31bd4feb9b27bd03e5ee75b1",
"t_step1_client_unix": 1780113662.6441038,
"t_step2_client_unix": 1780113662.9044588,
"t_step2_end_unix": 1780113663.0019135,
"t_prefill_s": 0.26032789101009257,
"t_transfer_s": 0.09742468598415144,
"t_followup_s": 0.0510591670172289,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 4096,
"session": "87a72e6be33b46c29035ea566f1c79cc",
"t_step1_client_unix": 1780113663.0545735,
"t_step2_client_unix": 1780113663.315426,
"t_step2_end_unix": 1780113663.415479,
"t_prefill_s": 0.2608224749856163,
"t_transfer_s": 0.10002275300212204,
"t_followup_s": 0.05161238700384274,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 4096,
"session": "28b5629f8b04451d9404f5dd15b860a0",
"t_step1_client_unix": 1780113663.4687288,
"t_step2_client_unix": 1780113663.7299144,
"t_step2_end_unix": 1780113663.8311837,
"t_prefill_s": 0.26115050600492395,
"t_transfer_s": 0.10123400299926288,
"t_followup_s": 0.04951982302009128,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 4096,
"session": "ed022f1b155c4fe191032d8c917124c5",
"t_step1_client_unix": 1780113663.882292,
"t_step2_client_unix": 1780113664.1436367,
"t_step2_end_unix": 1780113664.2428293,
"t_prefill_s": 0.2613153549900744,
"t_transfer_s": 0.0991641900036484,
"t_followup_s": 0.05027229798724875,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 4096,
"session": "cb09310c2178452cb2ecda3f4c4f4642",
"t_step1_client_unix": 1780113664.2947013,
"t_step2_client_unix": 1780113664.5561187,
"t_step2_end_unix": 1780113664.6587803,
"t_prefill_s": 0.2613755869970191,
"t_transfer_s": 0.10260535500128753,
"t_followup_s": 0.054842573998030275,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 4096,
"session": "26a14c40b7424663ad5bf012e04b0d48",
"t_step1_client_unix": 1780113664.7152772,
"t_step2_client_unix": 1780113664.9784563,
"t_step2_end_unix": 1780113665.0804708,
"t_prefill_s": 0.2631347790011205,
"t_transfer_s": 0.10197760400478728,
"t_followup_s": 0.05454107699915767,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 8192,
"session": "28aa179a55b04b6e826df76997e49965",
"t_step1_client_unix": 1780113665.1381943,
"t_step2_client_unix": 1780113665.725791,
"t_step2_end_unix": 1780113665.8781552,
"t_prefill_s": 0.587549192016013,
"t_transfer_s": 0.15232679099426605,
"t_followup_s": 0.05964333200245164,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 8192,
"session": "c947ef89013d420faf4784bd0e0d5532",
"t_step1_client_unix": 1780113665.9409757,
"t_step2_client_unix": 1780113666.5288377,
"t_step2_end_unix": 1780113666.677537,
"t_prefill_s": 0.5878257739823312,
"t_transfer_s": 0.14866453199647367,
"t_followup_s": 0.05501791799906641,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 8192,
"session": "c71d8f7e44454f208391211b91409f34",
"t_step1_client_unix": 1780113666.7356484,
"t_step2_client_unix": 1780113667.3223348,
"t_step2_end_unix": 1780113667.475447,
"t_prefill_s": 0.5866534260276239,
"t_transfer_s": 0.15308237000135705,
"t_followup_s": 0.06039133798913099,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 8192,
"session": "d2f1c3b53ea8409ca49d5b6bcc7bea2a",
"t_step1_client_unix": 1780113667.5389588,
"t_step2_client_unix": 1780113668.1259756,
"t_step2_end_unix": 1780113668.2758486,
"t_prefill_s": 0.5869663549819961,
"t_transfer_s": 0.14983698999276385,
"t_followup_s": 0.05716336300247349,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 8192,
"session": "2b5edf5a21cc44f5929a722322d89d52",
"t_step1_client_unix": 1780113668.3363352,
"t_step2_client_unix": 1780113668.9260604,
"t_step2_end_unix": 1780113669.079605,
"t_prefill_s": 0.5896447559935041,
"t_transfer_s": 0.15350710399798118,
"t_followup_s": 0.05581469400203787,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 8192,
"session": "3d29eed43ca644ab998a89ae996521a0",
"t_step1_client_unix": 1780113669.1385791,
"t_step2_client_unix": 1780113669.7260985,
"t_step2_end_unix": 1780113669.8774042,
"t_prefill_s": 0.5874853960121982,
"t_transfer_s": 0.15127158901304938,
"t_followup_s": 0.057220480986870825,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 8192,
"session": "657303232eec4008abdc80cb69e27508",
"t_step1_client_unix": 1780113669.937695,
"t_step2_client_unix": 1780113670.5248249,
"t_step2_end_unix": 1780113670.6737514,
"t_prefill_s": 0.5870937670115381,
"t_transfer_s": 0.14888012100709602,
"t_followup_s": 0.059168930019950494,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 8192,
"session": "3560bebf9f7d4138b33cd30dd16aacfd",
"t_step1_client_unix": 1780113670.7366655,
"t_step2_client_unix": 1780113671.3249788,
"t_step2_end_unix": 1780113671.477699,
"t_prefill_s": 0.5882545940112323,
"t_transfer_s": 0.1526875200215727,
"t_followup_s": 0.06097331500495784,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 8192,
"session": "a8bb4afeb02b4ff99eac92226f0d5f58",
"t_step1_client_unix": 1780113671.5417728,
"t_step2_client_unix": 1780113672.1291869,
"t_step2_end_unix": 1780113672.280071,
"t_prefill_s": 0.5873805590090342,
"t_transfer_s": 0.15085255599115044,
"t_followup_s": 0.057901772001059726,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 8192,
"session": "68c32fca0260409c8a632ff617513587",
"t_step1_client_unix": 1780113672.3411584,
"t_step2_client_unix": 1780113672.9282277,
"t_step2_end_unix": 1780113673.0856972,
"t_prefill_s": 0.5870382410066668,
"t_transfer_s": 0.15743795299204066,
"t_followup_s": 0.05747991299722344,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 8192,
"session": "b95e321ef53e4383b302c2db7ebcca73",
"t_step1_client_unix": 1780113673.1462142,
"t_step2_client_unix": 1780113673.7336242,
"t_step2_end_unix": 1780113673.8830152,
"t_prefill_s": 0.5873774820065591,
"t_transfer_s": 0.149357913993299,
"t_followup_s": 0.05543989400030114,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 16384,
"session": "0979f595e2b44f3285b4242fda1ee3df",
"t_step1_client_unix": 1780113673.9444556,
"t_step2_client_unix": 1780113675.5027504,
"t_step2_end_unix": 1780113675.7646046,
"t_prefill_s": 1.558238979021553,
"t_transfer_s": 0.2618165699823294,
"t_followup_s": 0.07395038701361045,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 16384,
"session": "14c8c786b4a846149945ea141f705863",
"t_step1_client_unix": 1780113675.8444831,
"t_step2_client_unix": 1780113677.3960428,
"t_step2_end_unix": 1780113677.6459343,
"t_prefill_s": 1.5515160829818342,
"t_transfer_s": 0.249856763985008,
"t_followup_s": 0.06939491498633288,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 16384,
"session": "31d3cb21ac8d4ced89ab33ce4fb7589b",
"t_step1_client_unix": 1780113677.721303,
"t_step2_client_unix": 1780113679.2696404,
"t_step2_end_unix": 1780113679.5167441,
"t_prefill_s": 1.548295495013008,
"t_transfer_s": 0.24705595700652339,
"t_followup_s": 0.06773578398860991,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 16384,
"session": "a9d5cbce333f4c21afaa8bdbeab31bf3",
"t_step1_client_unix": 1780113679.5905588,
"t_step2_client_unix": 1780113681.1353347,
"t_step2_end_unix": 1780113681.37527,
"t_prefill_s": 1.5447358399978839,
"t_transfer_s": 0.23989686000277288,
"t_followup_s": 0.06704856699798256,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 16384,
"session": "e58110ad40cc46e0b15b222ebf0cbe86",
"t_step1_client_unix": 1780113681.4499586,
"t_step2_client_unix": 1780113682.9963198,
"t_step2_end_unix": 1780113683.2421525,
"t_prefill_s": 1.5463133199955337,
"t_transfer_s": 0.2457908419892192,
"t_followup_s": 0.06450486500398256,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 16384,
"session": "fbec8cdaac0c4ef8a028c68e49311b9a",
"t_step1_client_unix": 1780113683.3127434,
"t_step2_client_unix": 1780113684.8600428,
"t_step2_end_unix": 1780113685.106106,
"t_prefill_s": 1.5472517309826799,
"t_transfer_s": 0.2460192689904943,
"t_followup_s": 0.06439224901259877,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 16384,
"session": "7598055ceec1423d9b1d88c6200a1c21",
"t_step1_client_unix": 1780113685.1769145,
"t_step2_client_unix": 1780113686.732929,
"t_step2_end_unix": 1780113687.0007024,
"t_prefill_s": 1.5559708710061386,
"t_transfer_s": 0.2677336060150992,
"t_followup_s": 0.06560050300322473,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 16384,
"session": "f0512699fd10499ebb2421087d5138cc",
"t_step1_client_unix": 1780113687.0725183,
"t_step2_client_unix": 1780113688.6251225,
"t_step2_end_unix": 1780113688.9931352,
"t_prefill_s": 1.5525663039879873,
"t_transfer_s": 0.3679773240000941,
"t_followup_s": 0.07065863799653016,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 16384,
"session": "818876ee380f4a8f9258ddff7554e718",
"t_step1_client_unix": 1780113689.0700693,
"t_step2_client_unix": 1780113690.6202304,
"t_step2_end_unix": 1780113690.976204,
"t_prefill_s": 1.5501246719795745,
"t_transfer_s": 0.3559349720017053,
"t_followup_s": 0.06182111200178042,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 16384,
"session": "440b924a8dc44a57a60a8d8790b83425",
"t_step1_client_unix": 1780113691.0440626,
"t_step2_client_unix": 1780113692.600122,
"t_step2_end_unix": 1780113692.9298801,
"t_prefill_s": 1.5560206689988263,
"t_transfer_s": 0.3297227440052666,
"t_followup_s": 0.06168726898613386,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 16384,
"session": "bf7c1545c5a048b497c4934e849d9b77",
"t_step1_client_unix": 1780113692.9983332,
"t_step2_client_unix": 1780113694.549985,
"t_step2_end_unix": 1780113694.902612,
"t_prefill_s": 1.5515996039903257,
"t_transfer_s": 0.3525931639887858,
"t_followup_s": 0.06388000200968236,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 32768,
"session": "3ea99ff99c034fadaae11e0a18cbcd12",
"t_step1_client_unix": 1780113694.978447,
"t_step2_client_unix": 1780113699.5872533,
"t_step2_end_unix": 1780113700.3202353,
"t_prefill_s": 4.608766862016637,
"t_transfer_s": 0.7329461979970802,
"t_followup_s": 0.08203631298965774,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 32768,
"session": "160f663843cc4da4a4c1968620e74bbe",
"t_step1_client_unix": 1780113700.4144092,
"t_step2_client_unix": 1780113705.0188375,
"t_step2_end_unix": 1780113705.7512634,
"t_prefill_s": 4.604390962980688,
"t_transfer_s": 0.7323910310224164,
"t_followup_s": 0.08162634400650859,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 32768,
"session": "44be5da3d4d9421ea682b02af879f038",
"t_step1_client_unix": 1780113705.8446133,
"t_step2_client_unix": 1780113710.446565,
"t_step2_end_unix": 1780113711.1756835,
"t_prefill_s": 4.60191403501085,
"t_transfer_s": 0.7290820410125889,
"t_followup_s": 0.08314321600482799,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 32768,
"session": "76fb5e99bda74949ab48c2a806796e20",
"t_step1_client_unix": 1780113711.2712142,
"t_step2_client_unix": 1780113715.8831358,
"t_step2_end_unix": 1780113716.605932,
"t_prefill_s": 4.611884240992367,
"t_transfer_s": 0.7227587410015985,
"t_followup_s": 0.08411424100631848,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 32768,
"session": "2698392640df43d98c5b88ec14603ab4",
"t_step1_client_unix": 1780113716.7025611,
"t_step2_client_unix": 1780113721.3066654,
"t_step2_end_unix": 1780113721.9864836,
"t_prefill_s": 4.60406794998562,
"t_transfer_s": 0.6797809940180741,
"t_followup_s": 0.0797950770065654,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 32768,
"session": "3a317d68c23d48a6b464cbb7471f1b15",
"t_step1_client_unix": 1780113722.078643,
"t_step2_client_unix": 1780113726.683183,
"t_step2_end_unix": 1780113727.3790748,
"t_prefill_s": 4.604500039014965,
"t_transfer_s": 0.6958539690240286,
"t_followup_s": 0.0791638570080977,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 32768,
"session": "ef55cea31d1d4c9faa3095c6572b3158",
"t_step1_client_unix": 1780113727.4699852,
"t_step2_client_unix": 1780113732.0734339,
"t_step2_end_unix": 1780113732.6349242,
"t_prefill_s": 4.603411051008152,
"t_transfer_s": 0.5614562759874389,
"t_followup_s": 0.07942970001022331,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 32768,
"session": "51111cf4420040aabc709ec95b69299c",
"t_step1_client_unix": 1780113732.726002,
"t_step2_client_unix": 1780113737.3279588,
"t_step2_end_unix": 1780113737.768525,
"t_prefill_s": 4.6019097800017335,
"t_transfer_s": 0.4405296350014396,
"t_followup_s": 0.07934816100168973,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 32768,
"session": "a4218f26139940b7a63c574c58c0cc78",
"t_step1_client_unix": 1780113737.8595614,
"t_step2_client_unix": 1780113742.4654746,
"t_step2_end_unix": 1780113742.9027445,
"t_prefill_s": 4.605869954015361,
"t_transfer_s": 0.43722251401050016,
"t_followup_s": 0.08265988298808224,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 32768,
"session": "ef166eea7c0241a0b6683c9b9be98e26",
"t_step1_client_unix": 1780113742.9973059,
"t_step2_client_unix": 1780113747.60252,
"t_step2_end_unix": 1780113748.0344896,
"t_prefill_s": 4.605175297008827,
"t_transfer_s": 0.43193520401837304,
"t_followup_s": 0.08029142298619263,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 32768,
"session": "510b2beab0934d4191ce4c4b4fb8bb20",
"t_step1_client_unix": 1780113748.1287684,
"t_step2_client_unix": 1780113752.728051,
"t_step2_end_unix": 1780113753.1700265,
"t_prefill_s": 4.599246629979461,
"t_transfer_s": 0.4419387440138962,
"t_followup_s": 0.08067455000127666,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 65536,
"session": "d51ed2927db344808d34fac0c09d5d29",
"t_step1_client_unix": 1780113753.274224,
"t_step2_client_unix": 1780113768.560607,
"t_step2_end_unix": 1780113769.367652,
"t_prefill_s": 15.286344999010907,
"t_transfer_s": 0.8070085129875224,
"t_followup_s": 0.11767313402378932,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 65536,
"session": "a7af94a6de9547b4b943c986b7e6f001",
"t_step1_client_unix": 1780113769.5093763,
"t_step2_client_unix": 1780113784.8304524,
"t_step2_end_unix": 1780113785.7471335,
"t_prefill_s": 15.31890859498526,
"t_transfer_s": 0.9138955899979919,
"t_followup_s": 0.1327741070126649,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 65536,
"session": "48300f75fbb347e6859a6a0585dcc04e",
"t_step1_client_unix": 1780113785.9058163,
"t_step2_client_unix": 1780113801.193769,
"t_step2_end_unix": 1780113802.842876,
"t_prefill_s": 15.287883285986027,
"t_transfer_s": 1.6490699610149022,
"t_followup_s": 0.10919595797895454,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 65536,
"session": "c61d6f9f29024284b284f54d907d5fc9",
"t_step1_client_unix": 1780113802.975333,
"t_step2_client_unix": 1780113818.271725,
"t_step2_end_unix": 1780113820.8995724,
"t_prefill_s": 15.296337511012098,
"t_transfer_s": 2.6278096020105295,
"t_followup_s": 0.12072346499189734,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 65536,
"session": "52ef9ee529ef44d7b6140535833c05a3",
"t_step1_client_unix": 1780113821.0437183,
"t_step2_client_unix": 1780113836.3338494,
"t_step2_end_unix": 1780113838.7353442,
"t_prefill_s": 15.290092708019074,
"t_transfer_s": 2.4014571599836927,
"t_followup_s": 0.11354603400104679,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 65536,
"session": "99730c3c4684499286c1831c027e3b39",
"t_step1_client_unix": 1780113838.8726406,
"t_step2_client_unix": 1780113854.1566162,
"t_step2_end_unix": 1780113855.7166855,
"t_prefill_s": 15.283936669002287,
"t_transfer_s": 1.560034744994482,
"t_followup_s": 0.11488680701586418,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 65536,
"session": "6f072e8c09734c2cb3ff771c538b80c5",
"t_step1_client_unix": 1780113855.8550732,
"t_step2_client_unix": 1780113871.1431854,
"t_step2_end_unix": 1780113872.1094413,
"t_prefill_s": 15.288075597025454,
"t_transfer_s": 0.9662203160114586,
"t_followup_s": 0.11588297100388445,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 65536,
"session": "6bd7c6a2a8614f0a8ab32ad7b6fdc6da",
"t_step1_client_unix": 1780113872.2491899,
"t_step2_client_unix": 1780113887.532155,
"t_step2_end_unix": 1780113888.451564,
"t_prefill_s": 15.282926287996816,
"t_transfer_s": 0.9193728909885976,
"t_followup_s": 0.11174739900161512,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 65536,
"session": "03936c26f94947539251b7a8fe429eb5",
"t_step1_client_unix": 1780113888.5874689,
"t_step2_client_unix": 1780113903.8650937,
"t_step2_end_unix": 1780113904.6822457,
"t_prefill_s": 15.277585066010943,
"t_transfer_s": 0.8171155720192473,
"t_followup_s": 0.11233539402019233,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 65536,
"session": "fbef8e1b6fd94f28b8e0edbc86135cf5",
"t_step1_client_unix": 1780113904.8176143,
"t_step2_client_unix": 1780113920.1035478,
"t_step2_end_unix": 1780113921.0166585,
"t_prefill_s": 15.285897619993193,
"t_transfer_s": 0.9130747889867052,
"t_followup_s": 0.13272951598628424,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
},
{
"input_tokens": 65536,
"session": "526e3b3a3df64dea9e513e7bb9c3da53",
"t_step1_client_unix": 1780113921.172305,
"t_step2_client_unix": 1780113936.4544415,
"t_step2_end_unix": 1780113937.868287,
"t_prefill_s": 15.282098516006954,
"t_transfer_s": 1.4137536820198875,
"t_followup_s": 0.11649087502155453,
"cached_followup": 0,
"pull_completion_tokens": 1,
"ok": false
}
],
"summary": []
}