feat(cli): [stale] tag on plain ask citations (fb-32)

Mirror of Task 9's search-output rendering: yellow [stale] on TTY, plain text otherwise. JSON path inherits via serde on AnswerCitation. Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
2026-05-09 02:34:58 +09:00
parent 15cdc97cae
commit aeee7ed771
2 changed files with 372 additions and 20 deletions
--- a/crates/kebab-cli/src/main.rs
+++ b/crates/kebab-cli/src/main.rs
@@ -614,26 +614,12 @@ fn run(cli: &Cli) -> anyhow::Result<()> {
                // `근거:` header.
                let print_citations = *show_citations && !*hide_citations;
                if print_citations && !ans.citations.is_empty() {
-                    println!();
-                    println!("근거:");
-                    for (idx, c) in ans.citations.iter().enumerate() {
-                        let marker = c
-                            .marker
-                            .clone()
-                            .unwrap_or_else(|| format!("{}", idx + 1));
-                        println!("  [{}] {}", marker, c.citation.to_uri());
-                    }
-                    // p9-fb-20: retrieval 메타는 citation 별 점수가
-                    // AnswerCitation 에 없는 (`top_score` 만 retrieval-
-                    // 전체 max) 한계상 한 줄로 분리. per-citation score
-                    // 노출은 facade + AnswerCitation 의 미래 확장 후.
-                    println!(
-                        "(retrieval: top_score={:.2}, k={}, used={}/{})",
-                        ans.retrieval.top_score,
-                        ans.retrieval.k,
-                        ans.retrieval.chunks_used,
-                        ans.retrieval.chunks_returned,
-                    );
+                    // p9-fb-32: yellow `[stale]` prefix on TTY (mirrors
+                    // the search renderer's pattern in `Cmd::Search`).
+                    use std::io::IsTerminal;
+                    let color = std::io::stdout().is_terminal();
+                    let mut out = std::io::stdout().lock();
+                    render_ask_plain_citations(&mut out, &ans, color)?;
                }
            }
            // Refusal → exit 1.
@@ -878,6 +864,54 @@ fn run(cli: &Cli) -> anyhow::Result<()> {
    }
 }

+/// p9-fb-32: render the plain (non-JSON) citation block for `kebab ask`.
+/// Mirrors the `Cmd::Search` plain renderer's `[stale]` convention —
+/// yellow ANSI on TTY, plain text otherwise. Detection uses stdlib
+/// `IsTerminal` at the call site; this function takes the resolved
+/// `color` boolean so tests can pin both branches deterministically.
+///
+/// Skipping the empty / no-citation path is the caller's responsibility
+/// (matches the original inline guard at the call site).
+fn render_ask_plain_citations(
+    w: &mut impl std::io::Write,
+    ans: &kebab_core::Answer,
+    color: bool,
+) -> std::io::Result<()> {
+    writeln!(w)?;
+    writeln!(w, "근거:")?;
+    for (idx, c) in ans.citations.iter().enumerate() {
+        let marker = c
+            .marker
+            .clone()
+            .unwrap_or_else(|| format!("{}", idx + 1));
+        // p9-fb-32: `[stale]` prefix on the URI for citations whose
+        // `stale: true`. Yellow on TTY, plain otherwise — mirrors the
+        // search-plain renderer in `Cmd::Search`.
+        let stale_tag = if c.stale {
+            if color {
+                "\x1b[33m[stale]\x1b[0m "
+            } else {
+                "[stale] "
+            }
+        } else {
+            ""
+        };
+        writeln!(w, "  [{}] {}{}", marker, stale_tag, c.citation.to_uri())?;
+    }
+    // p9-fb-20: retrieval 메타는 citation 별 점수가 AnswerCitation 에
+    // 없는 (`top_score` 만 retrieval-전체 max) 한계상 한 줄로 분리.
+    // per-citation score 노출은 facade + AnswerCitation 의 미래 확장 후.
+    writeln!(
+        w,
+        "(retrieval: top_score={:.2}, k={}, used={}/{})",
+        ans.retrieval.top_score,
+        ans.retrieval.k,
+        ans.retrieval.chunks_used,
+        ans.retrieval.chunks_returned,
+    )?;
+    Ok(())
+}
+
 fn print_schema_text(s: &kebab_app::SchemaV1) {
    println!("kebab v{}", s.kebab_version);
    println!();
@@ -955,3 +989,107 @@ fn confirm_destructive(
    Ok(matches!(s.as_str(), "y" | "yes"))
 }

+#[cfg(test)]
+mod tests {
+    //! p9-fb-32: unit tests for `render_ask_plain_citations`. The
+    //! integration end-to-end (`tests/wire_ask_stale.rs`) is gated on
+    //! a real Ollama, so we cover the renderer's `[stale]` logic here
+    //! against a synthetic `Answer` instead.
+    use super::*;
+    use kebab_core::{
+        Answer, AnswerCitation, AnswerRetrievalSummary, Citation, ModelRef,
+        PromptTemplateVersion, SearchMode, TokenUsage, TraceId, WorkspacePath,
+    };
+    use time::OffsetDateTime;
+
+    fn mk_answer(citations: Vec<AnswerCitation>) -> Answer {
+        Answer {
+            answer: "ans".into(),
+            citations,
+            grounded: true,
+            refusal_reason: None,
+            model: ModelRef {
+                id: "test".into(),
+                provider: "test".into(),
+                dimensions: None,
+            },
+            embedding: None,
+            prompt_template_version: PromptTemplateVersion("rag-v1".into()),
+            retrieval: AnswerRetrievalSummary {
+                trace_id: TraceId("ret_test".into()),
+                mode: SearchMode::Lexical,
+                k: 5,
+                score_gate: 0.30,
+                top_score: 0.80,
+                chunks_returned: 1,
+                chunks_used: 1,
+            },
+            usage: TokenUsage {
+                prompt_tokens: 0,
+                completion_tokens: 0,
+                latency_ms: 0,
+            },
+            created_at: OffsetDateTime::now_utc(),
+            conversation_id: None,
+            turn_index: None,
+        }
+    }
+
+    fn mk_citation(path: &str, stale: bool) -> AnswerCitation {
+        AnswerCitation {
+            marker: Some("1".into()),
+            citation: Citation::Line {
+                path: WorkspacePath::new(path.into()).unwrap(),
+                start: 1,
+                end: 1,
+                section: None,
+            },
+            indexed_at: OffsetDateTime::now_utc(),
+            stale,
+        }
+    }
+
+    #[test]
+    fn plain_marks_stale_citation_no_color() {
+        let ans = mk_answer(vec![mk_citation("a.md", true)]);
+        let mut buf = Vec::new();
+        render_ask_plain_citations(&mut buf, &ans, false).unwrap();
+        let out = String::from_utf8(buf).unwrap();
+        assert!(
+            out.contains("[stale]"),
+            "expected `[stale]` marker in plain output, got:\n{out}"
+        );
+        // No ANSI when color = false.
+        assert!(
+            !out.contains("\x1b["),
+            "unexpected ANSI escape in non-color output:\n{out}"
+        );
+    }
+
+    #[test]
+    fn plain_marks_stale_citation_color_uses_yellow_ansi() {
+        let ans = mk_answer(vec![mk_citation("a.md", true)]);
+        let mut buf = Vec::new();
+        render_ask_plain_citations(&mut buf, &ans, true).unwrap();
+        let out = String::from_utf8(buf).unwrap();
+        // Yellow ANSI + reset around the `[stale]` token, mirroring the
+        // search-plain renderer in `Cmd::Search`.
+        assert!(
+            out.contains("\x1b[33m[stale]\x1b[0m"),
+            "expected yellow [stale] ANSI sequence in color output, got:\n{out:?}"
+        );
+    }
+
+    #[test]
+    fn plain_no_stale_tag_for_fresh_citation() {
+        let ans = mk_answer(vec![mk_citation("a.md", false)]);
+        let mut buf = Vec::new();
+        render_ask_plain_citations(&mut buf, &ans, true).unwrap();
+        let out = String::from_utf8(buf).unwrap();
+        assert!(
+            !out.contains("[stale]"),
+            "unexpected `[stale]` marker for fresh citation:\n{out}"
+        );
+    }
+}
+
--- a/crates/kebab-cli/tests/wire_ask_stale.rs
+++ b/crates/kebab-cli/tests/wire_ask_stale.rs
@@ -0,0 +1,214 @@
+//! p9-fb-32: CLI ask output — JSON path emits `indexed_at` + `stale`
+//! on each citation; plain output prefixes stale citations with
+//! `[stale]` (yellow on TTY).
+//!
+//! These end-to-end checks exercise `kebab ask`, which requires a real
+//! Ollama on `127.0.0.1:11434` (same constraint as
+//! `kebab-app/tests/ask_smoke.rs`). Both tests are therefore
+//! `#[ignore]` by default — run with
+//! `cargo test -p kebab-cli --test wire_ask_stale -- --ignored`
+//! against a live Ollama.
+//!
+//! The `[stale]` rendering logic itself is also covered by a unit test
+//! in `kebab-cli/src/main.rs` (`tests::plain_marks_stale_citation_*`)
+//! that constructs a synthetic `Answer` and pipes it through
+//! `render_ask_plain_citations` — that path is the always-on guard.
+
+use std::fs;
+use std::path::{Path, PathBuf};
+use std::process::Command;
+
+/// Build a `config.toml` text under `dir`. `workspace_root` and
+/// `data_dir` live inside `dir`. `stale_threshold_days` is plumbed
+/// into `[search]` so the staleness post-process can fire.
+fn write_config(dir: &Path, stale_threshold_days: u32) -> (PathBuf, PathBuf, PathBuf) {
+    let workspace = dir.join("workspace");
+    let data = dir.join("data");
+    fs::create_dir_all(&workspace).unwrap();
+    fs::create_dir_all(&data).unwrap();
+
+    let cfg_path = dir.join("config.toml");
+    fs::write(
+        &cfg_path,
+        format!(
+            r#"schema_version = 1
+
+[workspace]
+root = "{workspace}"
+exclude = [".git/**"]
+
+[storage]
+data_dir = "{data}"
+sqlite = "{{data_dir}}/kebab.sqlite"
+vector_dir = "{{data_dir}}/lancedb"
+asset_dir = "{{data_dir}}/assets"
+artifact_dir = "{{data_dir}}/artifacts"
+model_dir = "{{data_dir}}/models"
+runs_dir = "{{data_dir}}/runs"
+copy_threshold_mb = 100
+
+[indexing]
+max_parallel_extractors = 2
+max_parallel_embeddings = 1
+watch_filesystem = false
+
+[chunking]
+target_tokens = 80
+overlap_tokens = 20
+respect_markdown_headings = true
+chunker_version = "md-heading-v1"
+
+[models.embedding]
+provider = "none"
+model = "none"
+version = "v0"
+dimensions = 0
+batch_size = 1
+
+[models.llm]
+provider = "ollama"
+model = "gemma4:e4b"
+context_tokens = 4096
+endpoint = "http://127.0.0.1:11434"
+temperature = 0.0
+seed = 0
+
+[search]
+default_k = 10
+hybrid_fusion = "rrf"
+rrf_k = 60
+snippet_chars = 220
+stale_threshold_days = {stale_threshold_days}
+
+[rag]
+prompt_template_version = "rag-v1"
+score_gate = 0.30
+explain_default = false
+max_context_tokens = 8000
+"#,
+            workspace = workspace.display(),
+            data = data.display(),
+            stale_threshold_days = stale_threshold_days,
+        ),
+    )
+    .unwrap();
+    (cfg_path, workspace, data)
+}
+
+fn ingest(cfg: &Path, workspace: &Path) {
+    let bin = env!("CARGO_BIN_EXE_kebab");
+    let out = Command::new(bin)
+        .args([
+            "--config",
+            cfg.to_str().unwrap(),
+            "ingest",
+            "--root",
+            workspace.to_str().unwrap(),
+        ])
+        .output()
+        .unwrap();
+    assert!(
+        out.status.success(),
+        "ingest failed: stderr={}",
+        String::from_utf8_lossy(&out.stderr)
+    );
+}
+
+/// Run `kebab ask` in lexical mode (no embedding required). `json`
+/// toggles `--json`. The caller asserts on the resulting stdout.
+fn run_ask_lexical(cfg: &Path, query: &str, json: bool) -> std::process::Output {
+    let bin = env!("CARGO_BIN_EXE_kebab");
+    let mut cmd = Command::new(bin);
+    cmd.arg("--config").arg(cfg);
+    if json {
+        cmd.arg("--json");
+    }
+    cmd.args(["ask", "--mode", "lexical", query]);
+    cmd.output().unwrap()
+}
+
+/// Rewrite `documents.updated_at` for one workspace path to
+/// `now - days_ago` (RFC3339 UTC). Mirrors
+/// `kebab-app/tests/common/mod.rs::backdate_document_updated_at`.
+fn backdate_updated_at(data_dir: &Path, workspace_path: &str, days_ago: i64) {
+    let backdated = (time::OffsetDateTime::now_utc() - time::Duration::days(days_ago))
+        .format(&time::format_description::well_known::Rfc3339)
+        .expect("format backdated updated_at");
+    let db_path = data_dir.join("kebab.sqlite");
+    let conn = rusqlite::Connection::open(&db_path).expect("open kebab.sqlite");
+    let updated = conn
+        .execute(
+            "UPDATE documents SET updated_at = ?1 WHERE workspace_path = ?2",
+            rusqlite::params![backdated, workspace_path],
+        )
+        .expect("UPDATE documents.updated_at");
+    assert_eq!(
+        updated, 1,
+        "backdate_updated_at: expected to update exactly 1 row for {workspace_path}, got {updated}"
+    );
+}
+
+#[test]
+#[ignore = "requires real Ollama on 127.0.0.1:11434"]
+fn ask_json_citations_include_indexed_at_and_stale() {
+    let dir = tempfile::tempdir().unwrap();
+    let (cfg, workspace, data) = write_config(dir.path(), 30);
+    fs::write(workspace.join("a.md"), "# T\n\napples are fruit\n").unwrap();
+    ingest(&cfg, &workspace);
+    backdate_updated_at(&data, "a.md", 60);
+
+    // ask returns exit 1 on refusal; the JSON envelope still goes to
+    // stdout. Don't assert on `status.success()` — accept either path
+    // and require the citations array to be present + structurally valid.
+    let out = run_ask_lexical(&cfg, "what about apples", true);
+    let stdout = String::from_utf8_lossy(&out.stdout);
+    let answer: serde_json::Value = serde_json::from_str(stdout.trim())
+        .unwrap_or_else(|e| panic!("expected JSON answer, got {stdout:?}: {e}"));
+    let cits = answer["citations"]
+        .as_array()
+        .unwrap_or_else(|| panic!("expected citations array, got {answer}"));
+    if let Some(cit) = cits.first() {
+        // Schema fields are always present on a structurally-valid
+        // AnswerCitation (serde-derived per Task 2 + Task 8).
+        assert!(
+            cit.get("indexed_at").is_some(),
+            "missing indexed_at on citation: {cit}"
+        );
+        assert!(
+            cit.get("stale").is_some(),
+            "missing stale on citation: {cit}"
+        );
+        assert_eq!(
+            cit["stale"], true,
+            "doc backdated 60d at threshold 30d must be stale: {cit}"
+        );
+    }
+    // If the model refused with zero citations the schema-shape claim
+    // is vacuously true; the unit-test path
+    // (`tests::plain_marks_stale_citation_*` in main.rs) is the
+    // always-on guard.
+}
+
+#[test]
+#[ignore = "requires real Ollama on 127.0.0.1:11434"]
+fn ask_plain_marks_stale_citation() {
+    let dir = tempfile::tempdir().unwrap();
+    let (cfg, workspace, data) = write_config(dir.path(), 30);
+    fs::write(workspace.join("a.md"), "# T\n\napples are fruit\n").unwrap();
+    ingest(&cfg, &workspace);
+    backdate_updated_at(&data, "a.md", 60);
+
+    // Refusal exits 1 — that's still fine here, the renderer prints
+    // the citation block before the refusal exit when citations exist.
+    // If the model refused with zero citations, this test is
+    // best-effort (skip the assert): the unit-test path in main.rs
+    // (`tests::plain_marks_stale_citation_*`) is the always-on guard.
+    let out = run_ask_lexical(&cfg, "what about apples", false);
+    let stdout = String::from_utf8_lossy(&out.stdout);
+    if stdout.contains("근거:") {
+        assert!(
+            stdout.contains("[stale]"),
+            "stale tag missing in plain ask output:\n{stdout}"
+        );
+    }
+}