EffortlessMetrics
diff --git a/ci/hardware/intel-258v/2026-05-08/slm-answer-corpus-qwen25-cpu-clean-provenance.json b/ci/hardware/intel-258v/2026-05-08/slm-answer-corpus-qwen25-cpu-clean-provenance.json
Lines changed: 14 additions & 3 deletions
diff --git a/ci/hardware/intel-258v/2026-05-08/slm-phase-warm-session-qwen25-cpu-profiles/decode_128.json b/ci/hardware/intel-258v/2026-05-08/slm-phase-warm-session-qwen25-cpu-profiles/decode_128.json
Lines changed: 8 additions & 1 deletion
diff --git a/ci/hardware/intel-258v/2026-05-08/slm-phase-warm-session-qwen25-cpu-profiles/prefill_512.json b/ci/hardware/intel-258v/2026-05-08/slm-phase-warm-session-qwen25-cpu-profiles/prefill_512.json
Lines changed: 8 additions & 1 deletion
diff --git a/ci/hardware/intel-258v/2026-05-08/slm-phase-warm-session-qwen25-cpu.json b/ci/hardware/intel-258v/2026-05-08/slm-phase-warm-session-qwen25-cpu.json
Lines changed: 9 additions & 2 deletions
diff --git a/crates/bitnet-cli/src/commands/answer_corpus.rs b/crates/bitnet-cli/src/commands/answer_corpus.rs
Lines changed: 91 additions & 5 deletions
diff --git a/crates/bitnet-cli/src/main.rs b/crates/bitnet-cli/src/main.rs
Lines changed: 16 additions & 0 deletions
diff --git a/docs/tracking/campaigns/intel-258v-platform/CAMPAIGN.md b/docs/tracking/campaigns/intel-258v-platform/CAMPAIGN.md
Lines changed: 1 addition & 0 deletions
@@ -1,10 +1,11 @@
 {
   "artifact_kind": "slm_cpu_answer_corpus",
+  "backend_lane": "dense_slm_cpu",
   "backend": {
     "fallback_used": false,
     "requested_backend": "cpu",
     "runtime_api": "cpu",
-    "selected_backend": "cpu"
+    "selected_backend": "cpu-rust"
   },
   "cases": [
     {
@@ -633,6 +634,7 @@
     ]
   },
   "execution_plan": null,
+  "fallback_used": false,
   "generation": {
     "default_max_new_tokens": 16,
     "deterministic": true,
@@ -657,17 +659,26 @@
     "tokenizer": "gguf_metadata",
     "tokenizer_path": null
   },
-  "prompt_template": {
+  "model_architecture": "qwen2",
+  "model_family": "qwen",
+  "prompt_template": "qwen2.5",
+  "prompt_template_policy": {
     "family": "qwen2.5"
   },
+  "quantization": "Q8_0",
   "quality_summary": {
     "failed": 0,
     "not_run": 0,
     "passed": 3,
     "timeout": 0,
     "total": 3
   },
+  "requested_backend": "cpu",
   "schema_version": "1.0.0",
+  "selected_backend": "cpu-rust",
+  "selected_kernel_or_runtime": "dense-qwen-cpu-reference",
   "speedup_claim": false,
+  "runtime_api": "cpu",
+  "tokenizer_source": "gguf_metadata",
   "timestamp": "2026-05-12T21:48:18.738703300+00:00"
-}
+}
@@ -2,6 +2,7 @@
   "arc140v_claim": false,
   "artifact_kind": "dense_slm_cpu_phase_profile",
   "artifact_path": "ci\\hardware\\intel-258v\\2026-05-08\\slm-phase-warm-session-qwen25-cpu-profiles\\decode_128.json",
+  "backend_lane": "dense_slm_cpu",
   "bitnet_qk256_i2s_claim": false,
   "counts": {
     "n_kv": 26,
@@ -92,6 +93,8 @@
     "tokenizer": "gguf_metadata",
     "vocab_size": 151936
   },
+  "model_architecture": "qwen2",
+  "model_family": "qwen",
   "profile": {
     "backend": {
       "fallback_reason": null,
@@ -197,6 +200,8 @@
   },
   "profile_id": "decode_128",
   "prompt": "Answer with a deterministic continuation: one two three",
+  "prompt_template": "qwen2.5",
+  "quantization": "Q8_0",
   "prompt_render": {
     "add_bos": false,
     "parse_special": true,
@@ -208,6 +213,7 @@
   "runtime_api": "cpu",
   "schema_version": "1.0.0",
   "selected_backend": "cpu-rust",
+  "selected_kernel_or_runtime": "dense-qwen-cpu-reference",
   "session_artifact_path": "ci\\hardware\\intel-258v\\2026-05-08\\slm-phase-warm-session-qwen25-cpu.json",
   "speedup_claim": false,
   "strict_provenance": {
@@ -321,6 +327,7 @@
     "strict": true,
     "type": "gguf_metadata"
   },
+  "tokenizer_source": "gguf_metadata",
   "tokens": {
     "generated": 128,
     "generated_ids": [
@@ -625,4 +632,4 @@
     ],
     "total": 165
   }
-}
+}
@@ -2,6 +2,7 @@
   "arc140v_claim": false,
   "artifact_kind": "dense_slm_cpu_phase_profile",
   "artifact_path": "ci\\hardware\\intel-258v\\2026-05-08\\slm-phase-warm-session-qwen25-cpu-profiles\\prefill_512.json",
+  "backend_lane": "dense_slm_cpu",
   "bitnet_qk256_i2s_claim": false,
   "counts": {
     "n_kv": 26,
@@ -92,6 +93,8 @@
     "tokenizer": "gguf_metadata",
     "vocab_size": 151936
   },
+  "model_architecture": "qwen2",
+  "model_family": "qwen",
   "profile": {
     "backend": {
       "fallback_reason": null,
@@ -197,6 +200,8 @@
   },
   "profile_id": "prefill_512",
   "prompt": "benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token 
benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token 
benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token benchmark token ",
+  "prompt_template": "qwen2.5",
+  "quantization": "Q8_0",
   "prompt_render": {
     "add_bos": false,
     "parse_special": true,
@@ -208,6 +213,7 @@
   "runtime_api": "cpu",
   "schema_version": "1.0.0",
   "selected_backend": "cpu-rust",
+  "selected_kernel_or_runtime": "dense-qwen-cpu-reference",
   "session_artifact_path": "ci\\hardware\\intel-258v\\2026-05-08\\slm-phase-warm-session-qwen25-cpu.json",
   "speedup_claim": false,
   "strict_provenance": {
@@ -321,6 +327,7 @@
     "strict": true,
     "type": "gguf_metadata"
   },
+  "tokenizer_source": "gguf_metadata",
   "tokens": {
     "generated": 1,
     "generated_ids": [
@@ -875,4 +882,4 @@
     ],
     "total": 542
   }
-}
+}
@@ -1,6 +1,7 @@
 {
   "artifact_kind": "dense_slm_cpu_phase_warm_session",
   "artifact_path": "ci\\hardware\\intel-258v\\2026-05-08\\slm-phase-warm-session-qwen25-cpu.json",
+  "backend_lane": "dense_slm_cpu",
   "claim_boundary": {
     "arc140v_claim": false,
     "bitnet_answer_quality_claim": false,
@@ -62,6 +63,10 @@
     "tokenizer": "gguf_metadata",
     "vocab_size": 151936
   },
+  "model_architecture": "qwen2",
+  "model_family": "qwen",
+  "prompt_template": "qwen2.5",
+  "quantization": "Q8_0",
   "profiles": [
     {
       "decode_total_ms": 175.035,
@@ -92,6 +97,7 @@
   "runtime_api": "cpu",
   "schema_version": "1.0.0",
   "selected_backend": "cpu-rust",
+  "selected_kernel_or_runtime": "dense-qwen-cpu-reference",
   "session": {
     "model_loaded_once": true,
     "per_profile_receipt_dir": "ci\\hardware\\intel-258v\\2026-05-08\\slm-phase-warm-session-qwen25-cpu-profiles",
@@ -115,5 +121,6 @@
     "source": "gguf_metadata",
     "strict": true,
     "type": "gguf_metadata"
-  }
-}
+  },
+  "tokenizer_source": "gguf_metadata"
+}
@@ -174,11 +174,46 @@ impl AnswerCorpusCommand {
                 row["kernel"]["selected_kernel"] == "dense-qwen-cpu-reference"
                     && row["kernel"]["family"] == "dense_qwen"
             });
+        let top_level_selected_backend =
+            aggregate_case_str(&rows, &["backend", "selected_backend"])
+                .unwrap_or(device.as_str())
+                .to_string();
+        let top_level_runtime_api = aggregate_case_str(&rows, &["backend", "runtime_api"])
+            .unwrap_or_else(|| answer_corpus_runtime_api(&device))
+            .to_string();
+        let top_level_fallback_used =
+            rows.iter().any(|row| row["backend"]["fallback_used"].as_bool().unwrap_or(true));
+        let top_level_model_family =
+            corpus.model.family.as_deref().unwrap_or("unknown").to_string();
+        let top_level_model_architecture =
+            corpus.model.architecture.as_deref().unwrap_or("unknown").to_string();
+        let top_level_quantization =
+            corpus.model.quant_format.as_deref().unwrap_or("unknown").to_string();
+        let top_level_tokenizer_source = aggregate_case_str(&rows, &["tokenizer", "source"])
+            .unwrap_or(aggregate_tokenizer)
+            .to_string();
+        let top_level_selected_kernel_or_runtime =
+            aggregate_case_str(&rows, &["kernel", "selected_kernel"])
+                .unwrap_or(&top_level_runtime_api)
+                .to_string();
+        let top_level_backend_lane =
+            answer_corpus_backend_lane(&device, slm_answer_path, &top_level_model_family);
 
         let receipt = json!({
             "schema_version": "1.0.0",
             "artifact_kind": artifact_kind,
             "timestamp": chrono::Utc::now().to_rfc3339(),
+            "requested_backend": device.as_str(),
+            "selected_backend": top_level_selected_backend,
+            "runtime_api": top_level_runtime_api,
+            "fallback_used": top_level_fallback_used,
+            "backend_lane": top_level_backend_lane,
+            "model_family": top_level_model_family,
+            "model_architecture": top_level_model_architecture,
+            "quantization": top_level_quantization,
+            "tokenizer_source": top_level_tokenizer_source,
+            "prompt_template": corpus.defaults.prompt_template.as_str(),
+            "selected_kernel_or_runtime": top_level_selected_kernel_or_runtime,
             "corpus": {
                 "path": self.corpus.display().to_string(),
                 "name": corpus.name,
@@ -202,13 +237,13 @@ impl AnswerCorpusCommand {
             },
             "backend": {
                 "requested_backend": device.as_str(),
-                "selected_backend": device.as_str(),
-                "runtime_api": answer_corpus_runtime_api(&device),
-                "fallback_used": false,
+                "selected_backend": top_level_selected_backend,
+                "runtime_api": top_level_runtime_api,
+                "fallback_used": top_level_fallback_used,
             },
             "execution_plan": aggregate_execution_plan,
-            "prompt_template": {
-                "family": corpus.defaults.prompt_template,
+            "prompt_template_policy": {
+                "family": corpus.defaults.prompt_template.as_str(),
             },
             "generation": {
                 "mode": if corpus.defaults.greedy { "greedy" } else { "sampling" },
@@ -612,6 +647,32 @@ fn is_cuda_answer_corpus_device(device: &str) -> bool {
     matches!(device, "cuda" | RTX_5070_TI_CUDA)
 }
 
+/// Picks the backend-lane label for an answer-corpus receipt. The dense SLM CPU
+/// lane needs the SLM answer path, the plain `cpu` device, and the `qwen` family;
+/// anything else falls through to the CUDA, Apple M4 NEON, or BitNet CPU lane.
+fn answer_corpus_backend_lane(
+    device: &str,
+    slm_answer_path: bool,
+    model_family: &str,
+) -> &'static str {
+    match device {
+        "cpu" if slm_answer_path && model_family == "qwen" => "dense_slm_cpu",
+        other if is_cuda_answer_corpus_device(other) => "bitnet_cuda",
+        "apple-m4-cpu-neon" => "apple_m4_cpu_neon",
+        _ => "bitnet_cpu",
+    }
+}
+
+/// Returns the first string found at `path` across `rows`, scanning in order.
+///
+/// `path` is walked key by key from each row; a row is skipped when any key
+/// lookup fails or the value reached at the end is not a string.
+fn aggregate_case_str<'a>(rows: &'a [Value], path: &[&str]) -> Option<&'a str> {
+    rows.iter().find_map(|row| {
+        path.iter().try_fold(row, |node, key| node.get(*key)).and_then(Value::as_str)
+    })
+}
+
 fn prompt_prefill_receipt(run_receipt: &Value) -> Value {
     let prompt_token_count = run_receipt["tokens"]["prompt"].as_u64().unwrap_or_else(|| {
         run_receipt["tokens"]["prompt_ids"]
@@ -1242,6 +1303,31 @@ mod tests {
         assert_eq!(effective_default_timeout_seconds(Some(0), Some(300)), 1);
     }
 
+    /// A dense Qwen CPU row should surface its backend, kernel, and tokenizer
+    /// identity strings and map onto the dense SLM CPU lane.
+    #[test]
+    fn slm_answer_aggregate_identity_uses_dense_cpu_lane() {
+        let dense_row = json!({
+            "backend": {
+                "selected_backend": "cpu-rust",
+                "runtime_api": "cpu",
+                "fallback_used": false,
+            },
+            "kernel": { "selected_kernel": "dense-qwen-cpu-reference" },
+            "tokenizer": { "source": "gguf_metadata" },
+        });
+        let rows = [dense_row];
+        let expectations: [(&[&str], &str); 3] = [
+            (&["backend", "selected_backend"], "cpu-rust"),
+            (&["kernel", "selected_kernel"], "dense-qwen-cpu-reference"),
+            (&["tokenizer", "source"], "gguf_metadata"),
+        ];
+        for (path, expected) in expectations {
+            assert_eq!(aggregate_case_str(&rows, path), Some(expected));
+        }
+        assert_eq!(answer_corpus_backend_lane("cpu", true, "qwen"), "dense_slm_cpu");
+    }
+
     #[test]
     fn cpu_answer_receipt_accepts_strict_cpu_truth() {
         let receipt = json!({
 
@@ -5975,6 +5975,7 @@ async fn run_cpu_phase_warm_session(
             pretokenizer_authority,
             tokenizer.as_ref(),
             dense_slm_model,
+            &prompt_template,
             model_quant_format,
             kernel_family,
             kernel_implementation,
@@ -6021,6 +6022,13 @@ async fn run_cpu_phase_warm_session(
         "runtime_api": backend_identity.runtime_api.as_str(),
         "fallback_used": false,
         "fallback_reason": serde_json::Value::Null,
+        "backend_lane": if dense_slm_model { "dense_slm_cpu" } else { hardware_lane },
+        "model_family": model_family,
+        "model_architecture": model_architecture,
+        "quantization": model_quant_format,
+        "tokenizer_source": tokenizer_source_str,
+        "prompt_template": prompt_template.as_str(),
+        "selected_kernel_or_runtime": selected_kernel.as_str(),
         "session": {
             "model_loaded_once": true,
             "tokenizer_loaded_once": true,
@@ -6253,6 +6261,7 @@ fn cpu_phase_strict_profile_receipt(
     pretokenizer_authority: &str,
     tokenizer: &(dyn bitnet_tokenizers::Tokenizer + Send + Sync),
     dense_slm_model: bool,
+    prompt_template_label: &str,
     model_quant_format: &str,
     kernel_family: &str,
     kernel_implementation: &str,
@@ -6291,6 +6300,13 @@ fn cpu_phase_strict_profile_receipt(
         "runtime_api": backend_identity.runtime_api.as_str(),
         "fallback_used": false,
         "fallback_reason": serde_json::Value::Null,
+        "backend_lane": if dense_slm_model { "dense_slm_cpu" } else { "bitnet_cpu" },
+        "model_family": model_family,
+        "model_architecture": model_architecture,
+        "quantization": model_quant_format,
+        "tokenizer_source": tokenizer_source_str,
+        "prompt_template": prompt_template_label,
+        "selected_kernel_or_runtime": selected_kernel,
         "prompt": run.prompt.as_str(),
         "prompt_render": {
             "template_family": run.prompt_template_family.as_str(),
 
@@ -74,6 +74,7 @@ Validate Core Ultra 7 258V as the BitNet CPU lead and tri-device platform while
 | SLM258V-004 | merged | Record dense Qwen SLM phase timing receipts on the 258V CPU path, keeping dense SLM phase evidence separate from BitNet QK256/I2_S receipts; merged in #4542. |
 | LNL258V-COMPARE-004 | merged | Refresh the same-machine comparison index after the corrected BitNet CPU bundle and dense Qwen SLM CPU answer/phase receipts, preserving independent BitNet CPU, dense SLM CPU, Arc 140V, and NPU claim boundaries; merged in #4545. |
 | CPU258V-032 | merged | Harden the 258V post-fix scalar-vs-AVX2 answer-parity receipt so top-level backend/runtime/fallback/kernel identity is explicit; merged in #4550. |
+| SLM258V-005 | pr_open | Harden dense Qwen SLM answer and phase receipts so top-level backend/runtime/fallback/model identity is explicit before OpenVINO CPU/GPU/NPU acceleration work; open in #4552. |
 
 ## Review Policy