diff --git a/crates/xserv-server/src/engine.rs b/crates/xserv-server/src/engine.rs index 60a2055..253b072 100644 --- a/crates/xserv-server/src/engine.rs +++ b/crates/xserv-server/src/engine.rs @@ -396,9 +396,12 @@ fn emit_token(tokenizer: &Tokenizer, seq: &mut Sequence, token_id: u32) { if tokenizer.eos_token_id() == Some(token_id) { let tail = tokenizer.flush_decode_stream(&mut seq.decode_buffer); send_token_if_nonempty(seq, tail); - try_send_event(seq, GenerateEvent::Done { - finish_reason: "stop".to_string(), - }); + try_send_event( + seq, + GenerateEvent::Done { + finish_reason: "stop".to_string(), + }, + ); return; } @@ -407,9 +410,12 @@ fn emit_token(tokenizer: &Tokenizer, seq: &mut Sequence, token_id: u32) { let tail = tokenizer.flush_decode_stream(&mut seq.decode_buffer); send_token_if_nonempty(seq, text); send_token_if_nonempty(seq, tail); - try_send_event(seq, GenerateEvent::Done { - finish_reason: "length".to_string(), - }); + try_send_event( + seq, + GenerateEvent::Done { + finish_reason: "length".to_string(), + }, + ); } else { send_token_if_nonempty(seq, text); } diff --git a/crates/xserv-server/src/pp_engine.rs b/crates/xserv-server/src/pp_engine.rs index 05b98a0..42615cb 100644 --- a/crates/xserv-server/src/pp_engine.rs +++ b/crates/xserv-server/src/pp_engine.rs @@ -318,7 +318,12 @@ pub fn run_pp( /// Returns false if the send would block (client too slow) or the client is /// gone — the caller stops generating so the coordinator thread is free to /// admit the next request instead of blocking on one slow consumer. -fn emit_text(tokenizer: &Tokenizer, req: &GenerateRequest, token_id: u32, buf: &mut Vec) -> bool { +fn emit_text( + tokenizer: &Tokenizer, + req: &GenerateRequest, + token_id: u32, + buf: &mut Vec, +) -> bool { if tokenizer.is_eos(token_id) { return true; } diff --git a/crates/xserv-server/src/tp_engine.rs b/crates/xserv-server/src/tp_engine.rs index d8c3fb8..29c3f73 100644 --- a/crates/xserv-server/src/tp_engine.rs +++ b/crates/xserv-server/src/tp_engine.rs @@ -346,7 +346,12 @@ pub fn run_tp( /// Returns false if the send would block (client too slow) or the client is /// gone — the caller stops generating so the serial coordinator thread is free /// to admit the next request instead of blocking on one slow consumer. -fn emit_text(tokenizer: &Tokenizer, req: &GenerateRequest, token_id: u32, buf: &mut Vec) -> bool { +fn emit_text( + tokenizer: &Tokenizer, + req: &GenerateRequest, + token_id: u32, + buf: &mut Vec, +) -> bool { if tokenizer.is_eos(token_id) { return true; }