KeiSeiKit-1.0/_primitives/_rust/kei-llm-llamacpp/tests/generate_stream.rs
Parfii-bot a4e667de10 KeiSeiKit-public — clean state
Single-commit clean baseline after security scrub of niche-tells,
project codenames, internal jargon, and contributor-email leaks.

Contents:
- 100 Rust crates (_primitives/_rust/)
- 37 agent manifests (_manifests/) + generated specs (_generated/)
- 67 user-invocable skills (skills/)
- 33 hooks (hooks/)
- Composition blocks (_blocks/)
- Documentation (docs/, README.md)
- TS adapter packages (_ts_packages/)
- Assembler (_assembler/)
- Roles (_roles/)
- Templates (_templates/)
- Forgejo CI (.forgejo/)

Author: Denis Parfionovich <info@greendragon.info>

License: see LICENSE.
2026-05-01 12:09:03 +08:00

37 lines
1.3 KiB
Rust

//! MockRunner emits N lines as if llama-cli streamed N tokens.
//! Stream API yields N+1 chunks (N tokens, then a `done: true` marker).
mod common;
use kei_llm_llamacpp::stream::generate_stream;
use kei_llm_llamacpp::GenerateOpts;
/// Scripts the mock runner with three token lines followed by a
/// `llama_perf_context_print` footer line, then checks that
/// `generate_stream` returns exactly four chunks: one per token line plus a
/// trailing `done` marker, with the footer line absent from the output.
#[tokio::test]
async fn generate_stream_yields_tokens_plus_done() {
    // A throwaway one-byte file stands in for the model path handed to the call.
    let scratch = tempfile::tempdir().unwrap();
    let model_path = scratch.path().join("dummy.gguf");
    std::fs::write(&model_path, b"x").unwrap();

    // Lines the mock will emit: three tokens, then a perf footer line.
    let scripted_lines = vec![
        "Hello".into(),
        " ".into(),
        "world".into(),
        "llama_perf_context_print: footer ignored".into(),
    ];
    let mock = common::MockRunner::new();
    mock.push(common::Behaviour::Stream(scripted_lines));

    let opts = GenerateOpts::default();
    let chunks = generate_stream(&mock, "llama-cli", &model_path, "p", &opts)
        .await
        .unwrap();

    // Three token chunks and one done marker; the footer line yields no chunk.
    assert_eq!(chunks.len(), 4, "got {} chunks: {chunks:?}", chunks.len());

    // The length check above guarantees these indices are in bounds.
    let (first, third, last) = (&chunks[0], &chunks[2], &chunks[3]);

    assert_eq!(first.delta, "Hello");
    assert_eq!(first.tokens_so_far, 1);
    assert!(!first.done);

    assert_eq!(third.delta, "world");
    assert_eq!(third.tokens_so_far, 3);

    // The terminal marker repeats the final token count rather than advancing it.
    assert!(last.done, "last chunk must be done=true");
    assert_eq!(last.tokens_so_far, 3, "tokens_so_far frozen at last token count");
}