feat(cli): [stale] tag on plain ask citations (fb-32)

Mirror of Task 9's search-output rendering: yellow [stale] on TTY,
plain text otherwise. JSON path inherits via serde on AnswerCitation.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
This commit is contained in:
th-kim0823
2026-05-09 02:34:58 +09:00
parent 15cdc97cae
commit aeee7ed771
2 changed files with 372 additions and 20 deletions

View File

@@ -614,26 +614,12 @@ fn run(cli: &Cli) -> anyhow::Result<()> {
// `근거:` header.
let print_citations = *show_citations && !*hide_citations;
if print_citations && !ans.citations.is_empty() {
println!();
println!("근거:");
for (idx, c) in ans.citations.iter().enumerate() {
let marker = c
.marker
.clone()
.unwrap_or_else(|| format!("{}", idx + 1));
println!(" [{}] {}", marker, c.citation.to_uri());
}
// p9-fb-20: retrieval 메타는 citation 별 점수가
// AnswerCitation 에 없는 (`top_score` 만 retrieval-
// 전체 max) 한계상 한 줄로 분리. per-citation score
// 노출은 facade + AnswerCitation 의 미래 확장 후.
println!(
"(retrieval: top_score={:.2}, k={}, used={}/{})",
ans.retrieval.top_score,
ans.retrieval.k,
ans.retrieval.chunks_used,
ans.retrieval.chunks_returned,
);
// p9-fb-32: yellow `[stale]` prefix on TTY (mirrors
// the search renderer's pattern in `Cmd::Search`).
use std::io::IsTerminal;
let color = std::io::stdout().is_terminal();
let mut out = std::io::stdout().lock();
render_ask_plain_citations(&mut out, &ans, color)?;
}
}
// Refusal → exit 1.
@@ -878,6 +864,54 @@ fn run(cli: &Cli) -> anyhow::Result<()> {
}
}
/// p9-fb-32: render the plain (non-JSON) citation block for `kebab ask`.
/// Mirrors the `Cmd::Search` plain renderer's `[stale]` convention —
/// yellow ANSI on TTY, plain text otherwise. Detection uses stdlib
/// `IsTerminal` at the call site; this function takes the resolved
/// `color` boolean so tests can pin both branches deterministically.
///
/// Skipping the empty / no-citation path is the caller's responsibility
/// (matches the original inline guard at the call site).
fn render_ask_plain_citations(
w: &mut impl std::io::Write,
ans: &kebab_core::Answer,
color: bool,
) -> std::io::Result<()> {
writeln!(w)?;
writeln!(w, "근거:")?;
for (idx, c) in ans.citations.iter().enumerate() {
let marker = c
.marker
.clone()
.unwrap_or_else(|| format!("{}", idx + 1));
// p9-fb-32: `[stale]` prefix on the URI for citations whose
// `stale: true`. Yellow on TTY, plain otherwise — mirrors the
// search-plain renderer in `Cmd::Search`.
let stale_tag = if c.stale {
if color {
"\x1b[33m[stale]\x1b[0m "
} else {
"[stale] "
}
} else {
""
};
writeln!(w, " [{}] {}{}", marker, stale_tag, c.citation.to_uri())?;
}
// p9-fb-20: retrieval 메타는 citation 별 점수가 AnswerCitation 에
// 없는 (`top_score` 만 retrieval-전체 max) 한계상 한 줄로 분리.
// per-citation score 노출은 facade + AnswerCitation 의 미래 확장 후.
writeln!(
w,
"(retrieval: top_score={:.2}, k={}, used={}/{})",
ans.retrieval.top_score,
ans.retrieval.k,
ans.retrieval.chunks_used,
ans.retrieval.chunks_returned,
)?;
Ok(())
}
fn print_schema_text(s: &kebab_app::SchemaV1) {
println!("kebab v{}", s.kebab_version);
println!();
@@ -955,3 +989,107 @@ fn confirm_destructive(
Ok(matches!(s.as_str(), "y" | "yes"))
}
#[cfg(test)]
mod tests {
//! p9-fb-32: unit tests for `render_ask_plain_citations`. The
//! integration end-to-end (`tests/wire_ask_stale.rs`) is gated on
//! a real Ollama, so we cover the renderer's `[stale]` logic here
//! against a synthetic `Answer` instead.
use super::*;
use kebab_core::{
Answer, AnswerCitation, AnswerRetrievalSummary, Citation, ModelRef,
PromptTemplateVersion, SearchMode, TokenUsage, TraceId, WorkspacePath,
};
use time::OffsetDateTime;
fn mk_answer(citations: Vec<AnswerCitation>) -> Answer {
Answer {
answer: "ans".into(),
citations,
grounded: true,
refusal_reason: None,
model: ModelRef {
id: "test".into(),
provider: "test".into(),
dimensions: None,
},
embedding: None,
prompt_template_version: PromptTemplateVersion("rag-v1".into()),
retrieval: AnswerRetrievalSummary {
trace_id: TraceId("ret_test".into()),
mode: SearchMode::Lexical,
k: 5,
score_gate: 0.30,
top_score: 0.80,
chunks_returned: 1,
chunks_used: 1,
},
usage: TokenUsage {
prompt_tokens: 0,
completion_tokens: 0,
latency_ms: 0,
},
created_at: OffsetDateTime::now_utc(),
conversation_id: None,
turn_index: None,
}
}
fn mk_citation(path: &str, stale: bool) -> AnswerCitation {
AnswerCitation {
marker: Some("1".into()),
citation: Citation::Line {
path: WorkspacePath::new(path.into()).unwrap(),
start: 1,
end: 1,
section: None,
},
indexed_at: OffsetDateTime::now_utc(),
stale,
}
}
#[test]
fn plain_marks_stale_citation_no_color() {
let ans = mk_answer(vec![mk_citation("a.md", true)]);
let mut buf = Vec::new();
render_ask_plain_citations(&mut buf, &ans, false).unwrap();
let out = String::from_utf8(buf).unwrap();
assert!(
out.contains("[stale]"),
"expected `[stale]` marker in plain output, got:\n{out}"
);
// No ANSI when color = false.
assert!(
!out.contains("\x1b["),
"unexpected ANSI escape in non-color output:\n{out}"
);
}
#[test]
fn plain_marks_stale_citation_color_uses_yellow_ansi() {
let ans = mk_answer(vec![mk_citation("a.md", true)]);
let mut buf = Vec::new();
render_ask_plain_citations(&mut buf, &ans, true).unwrap();
let out = String::from_utf8(buf).unwrap();
// Yellow ANSI + reset around the `[stale]` token, mirroring the
// search-plain renderer in `Cmd::Search`.
assert!(
out.contains("\x1b[33m[stale]\x1b[0m"),
"expected yellow [stale] ANSI sequence in color output, got:\n{out:?}"
);
}
#[test]
fn plain_no_stale_tag_for_fresh_citation() {
let ans = mk_answer(vec![mk_citation("a.md", false)]);
let mut buf = Vec::new();
render_ask_plain_citations(&mut buf, &ans, true).unwrap();
let out = String::from_utf8(buf).unwrap();
assert!(
!out.contains("[stale]"),
"unexpected `[stale]` marker for fresh citation:\n{out}"
);
}
}

View File

@@ -0,0 +1,214 @@
//! p9-fb-32: CLI ask output — JSON path emits `indexed_at` + `stale`
//! on each citation; plain output prefixes stale citations with
//! `[stale]` (yellow on TTY).
//!
//! These end-to-end checks exercise `kebab ask`, which requires a real
//! Ollama on `127.0.0.1:11434` (same constraint as
//! `kebab-app/tests/ask_smoke.rs`). Both tests are therefore
//! `#[ignore]` by default — run with
//! `cargo test -p kebab-cli --test wire_ask_stale -- --ignored`
//! against a live Ollama.
//!
//! The `[stale]` rendering logic itself is also covered by a unit test
//! in `kebab-cli/src/main.rs` (`tests::plain_marks_stale_citation_*`)
//! that constructs a synthetic `Answer` and pipes it through
//! `render_ask_plain_citations` — that path is the always-on guard.
use std::fs;
use std::path::{Path, PathBuf};
use std::process::Command;
/// Build a `config.toml` text under `dir`. `workspace_root` and
/// `data_dir` live inside `dir`. `stale_threshold_days` is plumbed
/// into `[search]` so the staleness post-process can fire.
fn write_config(dir: &Path, stale_threshold_days: u32) -> (PathBuf, PathBuf, PathBuf) {
let workspace = dir.join("workspace");
let data = dir.join("data");
fs::create_dir_all(&workspace).unwrap();
fs::create_dir_all(&data).unwrap();
let cfg_path = dir.join("config.toml");
fs::write(
&cfg_path,
format!(
r#"schema_version = 1
[workspace]
root = "{workspace}"
exclude = [".git/**"]
[storage]
data_dir = "{data}"
sqlite = "{{data_dir}}/kebab.sqlite"
vector_dir = "{{data_dir}}/lancedb"
asset_dir = "{{data_dir}}/assets"
artifact_dir = "{{data_dir}}/artifacts"
model_dir = "{{data_dir}}/models"
runs_dir = "{{data_dir}}/runs"
copy_threshold_mb = 100
[indexing]
max_parallel_extractors = 2
max_parallel_embeddings = 1
watch_filesystem = false
[chunking]
target_tokens = 80
overlap_tokens = 20
respect_markdown_headings = true
chunker_version = "md-heading-v1"
[models.embedding]
provider = "none"
model = "none"
version = "v0"
dimensions = 0
batch_size = 1
[models.llm]
provider = "ollama"
model = "gemma4:e4b"
context_tokens = 4096
endpoint = "http://127.0.0.1:11434"
temperature = 0.0
seed = 0
[search]
default_k = 10
hybrid_fusion = "rrf"
rrf_k = 60
snippet_chars = 220
stale_threshold_days = {stale_threshold_days}
[rag]
prompt_template_version = "rag-v1"
score_gate = 0.30
explain_default = false
max_context_tokens = 8000
"#,
workspace = workspace.display(),
data = data.display(),
stale_threshold_days = stale_threshold_days,
),
)
.unwrap();
(cfg_path, workspace, data)
}
fn ingest(cfg: &Path, workspace: &Path) {
let bin = env!("CARGO_BIN_EXE_kebab");
let out = Command::new(bin)
.args([
"--config",
cfg.to_str().unwrap(),
"ingest",
"--root",
workspace.to_str().unwrap(),
])
.output()
.unwrap();
assert!(
out.status.success(),
"ingest failed: stderr={}",
String::from_utf8_lossy(&out.stderr)
);
}
/// Run `kebab ask` in lexical mode (no embedding required). `json`
/// toggles `--json`. The caller asserts on the resulting stdout.
fn run_ask_lexical(cfg: &Path, query: &str, json: bool) -> std::process::Output {
let bin = env!("CARGO_BIN_EXE_kebab");
let mut cmd = Command::new(bin);
cmd.arg("--config").arg(cfg);
if json {
cmd.arg("--json");
}
cmd.args(["ask", "--mode", "lexical", query]);
cmd.output().unwrap()
}
/// Rewrite `documents.updated_at` for one workspace path to
/// `now - days_ago` (RFC3339 UTC). Mirrors
/// `kebab-app/tests/common/mod.rs::backdate_document_updated_at`.
fn backdate_updated_at(data_dir: &Path, workspace_path: &str, days_ago: i64) {
let backdated = (time::OffsetDateTime::now_utc() - time::Duration::days(days_ago))
.format(&time::format_description::well_known::Rfc3339)
.expect("format backdated updated_at");
let db_path = data_dir.join("kebab.sqlite");
let conn = rusqlite::Connection::open(&db_path).expect("open kebab.sqlite");
let updated = conn
.execute(
"UPDATE documents SET updated_at = ?1 WHERE workspace_path = ?2",
rusqlite::params![backdated, workspace_path],
)
.expect("UPDATE documents.updated_at");
assert_eq!(
updated, 1,
"backdate_updated_at: expected to update exactly 1 row for {workspace_path}, got {updated}"
);
}
#[test]
#[ignore = "requires real Ollama on 127.0.0.1:11434"]
fn ask_json_citations_include_indexed_at_and_stale() {
let dir = tempfile::tempdir().unwrap();
let (cfg, workspace, data) = write_config(dir.path(), 30);
fs::write(workspace.join("a.md"), "# T\n\napples are fruit\n").unwrap();
ingest(&cfg, &workspace);
backdate_updated_at(&data, "a.md", 60);
// ask returns exit 1 on refusal; the JSON envelope still goes to
// stdout. Don't assert on `status.success()` — accept either path
// and require the citations array to be present + structurally valid.
let out = run_ask_lexical(&cfg, "what about apples", true);
let stdout = String::from_utf8_lossy(&out.stdout);
let answer: serde_json::Value = serde_json::from_str(stdout.trim())
.unwrap_or_else(|e| panic!("expected JSON answer, got {stdout:?}: {e}"));
let cits = answer["citations"]
.as_array()
.unwrap_or_else(|| panic!("expected citations array, got {answer}"));
if let Some(cit) = cits.first() {
// Schema fields are always present on a structurally-valid
// AnswerCitation (serde-derived per Task 2 + Task 8).
assert!(
cit.get("indexed_at").is_some(),
"missing indexed_at on citation: {cit}"
);
assert!(
cit.get("stale").is_some(),
"missing stale on citation: {cit}"
);
assert_eq!(
cit["stale"], true,
"doc backdated 60d at threshold 30d must be stale: {cit}"
);
}
// If the model refused with zero citations the schema-shape claim
// is vacuously true; the unit-test path
// (`tests::plain_marks_stale_citation_*` in main.rs) is the
// always-on guard.
}
#[test]
#[ignore = "requires real Ollama on 127.0.0.1:11434"]
fn ask_plain_marks_stale_citation() {
let dir = tempfile::tempdir().unwrap();
let (cfg, workspace, data) = write_config(dir.path(), 30);
fs::write(workspace.join("a.md"), "# T\n\napples are fruit\n").unwrap();
ingest(&cfg, &workspace);
backdate_updated_at(&data, "a.md", 60);
// Refusal exits 1 — that's still fine here, the renderer prints
// the citation block before the refusal exit when citations exist.
// If the model refused with zero citations, this test is
// best-effort (skip the assert): the unit-test path in main.rs
// (`tests::plain_marks_stale_citation_*`) is the always-on guard.
let out = run_ask_lexical(&cfg, "what about apples", false);
let stdout = String::from_utf8_lossy(&out.stdout);
if stdout.contains("근거:") {
assert!(
stdout.contains("[stale]"),
"stale tag missing in plain ask output:\n{stdout}"
);
}
}