cs249r_book/tools/phase_d/f2_second_pass_manifest.json

[
  {
    "id": "edge-2357",
    "track": "edge",
    "verdict_at_c3": "NEEDS_FIX",
    "yaml_path": "interviews/vault/questions/edge/edge-2357.yaml",
    "criteria": {
      "math_correct": "PASS",
      "cell_fit": "PASS",
      "scenario_realism": "PASS",
      "uniqueness": "PASS",
      "visual_alignment": "WARN"
    },
    "issues": [
      "Visual alt text focuses on internal fragmentation, which the question explicitly excludes."
    ],
    "fix_suggestion": "Update visual alt text to contrast TLB entry count or page walk overhead instead of internal fragmentation."
  },
  {
    "id": "edge-2364",
    "track": "edge",
    "verdict_at_c3": "NEEDS_FIX",
    "yaml_path": "interviews/vault/questions/edge/edge-2364.yaml",
    "criteria": {
      "math_correct": "PASS",
      "cell_fit": "PASS",
      "scenario_realism": "PASS",
      "uniqueness": "PASS",
      "visual_alignment": "WARN"
    },
    "issues": [
      "Visual alt text incorrectly shows a saturated network switch, contradicting the scenario's conclusion that host memory is the bottleneck."
    ],
    "fix_suggestion": "Change visual to show host-memory/L3 cache as the saturated bottleneck, not the network switch."
  },
  {
    "id": "edge-2367",
    "track": "edge",
    "verdict_at_c3": "DROP",
    "yaml_path": "interviews/vault/questions/edge/edge-2367.yaml",
    "criteria": {
      "math_correct": "PASS",
      "cell_fit": "PASS",
      "scenario_realism": "PASS",
      "uniqueness": "PASS",
      "visual_alignment": "ERROR"
    },
    "issues": [
      "Visual alt text shows stages overlapping in a Gantt chart, but the solution explicitly states the multi-context execution is serial and cannot overlap."
    ],
    "fix_suggestion": ""
  },
  {
    "id": "edge-2390",
    "track": "edge",
    "verdict_at_c3": "DROP",
    "yaml_path": "interviews/vault/questions/edge/edge-2390.yaml",
    "criteria": {
      "math_correct": "PASS",
      "cell_fit": "PASS",
      "scenario_realism": "ERROR",
      "uniqueness": "PASS",
      "visual_alignment": "N/A"
    },
    "issues": [
      "Scenario contains a template injection glitch ('4K @interviews/vault/questions/edge/edge-2460.yaml FPS')."
    ],
    "fix_suggestion": ""
  },
  {
    "id": "edge-2401",
    "track": "edge",
    "verdict_at_c3": "NEEDS_FIX",
    "yaml_path": "interviews/vault/questions/edge/edge-2401.yaml",
    "criteria": {
      "math_correct": "PASS",
      "cell_fit": "PASS",
      "scenario_realism": "PASS",
      "uniqueness": "WARN",
      "visual_alignment": "N/A"
    },
    "issues": [
      "Generic PTQ vs QAT question; lacks strong uniqueness specific to Hailo-8 hardware."
    ],
    "fix_suggestion": "Make the scenario more specific to the Hailo-8's quantization toolchain rather than generic Min-Max vs Entropy."
  },
  {
    "id": "edge-2402",
    "track": "edge",
    "verdict_at_c3": "NEEDS_FIX",
    "yaml_path": "interviews/vault/questions/edge/edge-2402.yaml",
    "criteria": {
      "math_correct": "PASS",
      "cell_fit": "PASS",
      "scenario_realism": "PASS",
      "uniqueness": "WARN",
      "visual_alignment": "N/A"
    },
    "issues": [
      "Too similar to edge-2370 (testing Jetson power modes vs bandwidth/compute requirements)."
    ],
    "fix_suggestion": "Differentiate more clearly from edge-2370, perhaps focusing on a different resource constraint like thermal throttling."
  },
  {
    "id": "edge-2406",
    "track": "edge",
    "verdict_at_c3": "DROP",
    "yaml_path": "interviews/vault/questions/edge/edge-2406.yaml",
    "criteria": {
      "math_correct": "ERROR",
      "cell_fit": "PASS",
      "scenario_realism": "PASS",
      "uniqueness": "PASS",
      "visual_alignment": "N/A"
    },
    "issues": [
      "Math error: Computes available FPS by dividing GOPS by utilization (26000/50/0.7 ~= 743) instead of multiplying by utilization (26000*0.7/50 = 364), fundamentally misunderstanding resource utilization and overstating throughput by about 2x."
    ],
    "fix_suggestion": ""
  },
  {
    "id": "edge-2416",
    "track": "edge",
    "verdict_at_c3": "DROP",
    "yaml_path": "interviews/vault/questions/edge/edge-2416.yaml",
    "criteria": {
      "math_correct": "PASS",
      "cell_fit": "PASS",
      "scenario_realism": "PASS",
      "uniqueness": "ERROR",
      "visual_alignment": "N/A"
    },
    "issues": [
      "Near-duplicate of edge-2363: the same scenario with lambda and mu both scaled by 0.5."
    ],
    "fix_suggestion": ""
  },
  {
    "id": "edge-2424",
    "track": "edge",
    "verdict_at_c3": "NEEDS_FIX",
    "yaml_path": "interviews/vault/questions/edge/edge-2424.yaml",
    "criteria": {
      "math_correct": "PASS",
      "cell_fit": "PASS",
      "scenario_realism": "PASS",
      "uniqueness": "WARN",
      "visual_alignment": "N/A"
    },
    "issues": [
      "Standard QAT vs PTQ trade-off question that could apply to any hardware, lacks uniqueness."
    ],
    "fix_suggestion": "Focus more specifically on the Orin deployment tooling (TensorRT) and how to apply PTQ with limited calibration data instead of generic QAT vs PTQ."
  },
  {
    "id": "mobile-1870",
    "track": "mobile",
    "verdict_at_c3": "DROP",
    "yaml_path": "interviews/vault/questions/mobile/mobile-1870.yaml",
    "criteria": {
      "math_correct": "ERROR",
      "cell_fit": "PASS",
      "scenario_realism": "PASS",
      "uniqueness": "PASS",
      "visual_alignment": "WARN"
    },
    "issues": [
      "Math error: Claims K=12 is the minimum queue depth for P_K < 0.01, but K=11 yields P_11 = 0.0077, which is < 0.01."
    ],
    "fix_suggestion": ""
  },
  {
    "id": "mobile-1881",
    "track": "mobile",
    "verdict_at_c3": "NEEDS_FIX",
    "yaml_path": "interviews/vault/questions/mobile/mobile-1881.yaml",
    "criteria": {
      "math_correct": "PASS",
      "cell_fit": "PASS",
      "scenario_realism": "PASS",
      "uniqueness": "PASS",
      "visual_alignment": "WARN"
    },
    "issues": [
      "Visual alt text includes an NPU, which is not part of the problem's described pipeline (Cloud -> Modem -> CPU -> UFS)."
    ],
    "fix_suggestion": "Change visual alt text to show the actual pipeline: Cloud -> 5G Modem -> Crypto Core -> UFS Storage, omitting the NPU."
  },
  {
    "id": "mobile-1891",
    "track": "mobile",
    "verdict_at_c3": "DROP",
    "yaml_path": "interviews/vault/questions/mobile/mobile-1891.yaml",
    "criteria": {
      "math_correct": "PASS",
      "cell_fit": "PASS",
      "scenario_realism": "PASS",
      "uniqueness": "PASS",
      "visual_alignment": "ERROR"
    },
    "issues": [
      "Visual alt text claims a 75ms duration, but the mathematically correct overlapped duration is 400ms."
    ],
    "fix_suggestion": ""
  },
  {
    "id": "mobile-1896",
    "track": "mobile",
    "verdict_at_c3": "NEEDS_FIX",
    "yaml_path": "interviews/vault/questions/mobile/mobile-1896.yaml",
    "criteria": {
      "math_correct": "PASS",
      "cell_fit": "PASS",
      "scenario_realism": "PASS",
      "uniqueness": "PASS",
      "visual_alignment": "WARN"
    },
    "issues": [
      "Visual stacked bar chart is physically misleading for visualizing harmonic mean of bandwidth."
    ],
    "fix_suggestion": "Change visual alt text to describe a time-based chart or throughput gauge rather than stacked bandwidth bars."
  },
  {
    "id": "mobile-1897",
    "track": "mobile",
    "verdict_at_c3": "NEEDS_FIX",
    "yaml_path": "interviews/vault/questions/mobile/mobile-1897.yaml",
    "criteria": {
      "math_correct": "PASS",
      "cell_fit": "PASS",
      "scenario_realism": "PASS",
      "uniqueness": "PASS",
      "visual_alignment": "WARN"
    },
    "issues": [
      "Visual description only specifies incoming edges, missing the downlink traffic which is critical to the scenario."
    ],
    "fix_suggestion": "Update visual alt text to include bidirectional edges reflecting both uplink and downlink traffic."
  },
  {
    "id": "mobile-1903",
    "track": "mobile",
    "verdict_at_c3": "DROP",
    "yaml_path": "interviews/vault/questions/mobile/mobile-1903.yaml",
    "criteria": {
      "math_correct": "PASS",
      "cell_fit": "PASS",
      "scenario_realism": "PASS",
      "uniqueness": "PASS",
      "visual_alignment": "ERROR"
    },
    "issues": [
      "The visual describes a sequential Gantt chart, which contradicts the core concept of a double-buffered overlapping pipeline."
    ],
    "fix_suggestion": ""
  },
  {
    "id": "mobile-1918",
    "track": "mobile",
    "verdict_at_c3": "DROP",
    "yaml_path": "interviews/vault/questions/mobile/mobile-1918.yaml",
    "criteria": {
      "math_correct": "ERROR",
      "cell_fit": "PASS",
      "scenario_realism": "PASS",
      "uniqueness": "PASS",
      "visual_alignment": "N/A"
    },
    "issues": [
      "Energy units are wrong. 5ms at 1W is 5 mJ, not 5.95 mWh. 1 mWh is 3600 mJ."
    ],
    "fix_suggestion": ""
  },
  {
    "id": "mobile-1929",
    "track": "mobile",
    "verdict_at_c3": "DROP",
    "yaml_path": "interviews/vault/questions/mobile/mobile-1929.yaml",
    "criteria": {
      "math_correct": "PASS",
      "cell_fit": "WARN",
      "scenario_realism": "PASS",
      "uniqueness": "WARN",
      "visual_alignment": "N/A"
    },
    "issues": [
      "Math is too simple for an L5 evaluation level.",
      "Scenario heavily duplicates the duty-cycling concept from mobile-1918."
    ],
    "fix_suggestion": ""
  },
  {
    "id": "mobile-1948",
    "track": "mobile",
    "verdict_at_c3": "DROP",
    "yaml_path": "interviews/vault/questions/mobile/mobile-1948.yaml",
    "criteria": {
      "math_correct": "PASS",
      "cell_fit": "PASS",
      "scenario_realism": "ERROR",
      "uniqueness": "PASS",
      "visual_alignment": "N/A"
    },
    "issues": [
      "It is physically impossible to place an LLM KV cache entirely in NPU-local SRAM on mobile SoCs due to extreme size constraints (hundreds of MBs vs <32MB SRAM)."
    ],
    "fix_suggestion": ""
  },
  {
    "id": "mobile-1949",
    "track": "mobile",
    "verdict_at_c3": "DROP",
    "yaml_path": "interviews/vault/questions/mobile/mobile-1949.yaml",
    "criteria": {
      "math_correct": "PASS",
      "cell_fit": "PASS",
      "scenario_realism": "WARN",
      "uniqueness": "WARN",
      "visual_alignment": "N/A"
    },
    "issues": [
      "Highly generic template question lacking specific, hard constraints.",
      "Duplicates standard CPU vs NPU marketing talking points without depth."
    ],
    "fix_suggestion": ""
  },
  {
    "id": "mobile-1982",
    "track": "mobile",
    "verdict_at_c3": "DROP",
    "yaml_path": "interviews/vault/questions/mobile/mobile-1982.yaml",
    "criteria": {
      "math_correct": "PASS",
      "cell_fit": "PASS",
      "scenario_realism": "PASS",
      "uniqueness": "PASS",
      "visual_alignment": "ERROR"
    },
    "issues": [
      "The visual alt text claims the queue drains over 300ms, directly contradicting the mathematical solution of 2720ms."
    ],
    "fix_suggestion": ""
  },
  {
    "id": "mobile-1995",
    "track": "mobile",
    "verdict_at_c3": "DROP",
    "yaml_path": "interviews/vault/questions/mobile/mobile-1995.yaml",
    "criteria": {
      "math_correct": "ERROR",
      "cell_fit": "PASS",
      "scenario_realism": "PASS",
      "uniqueness": "PASS",
      "visual_alignment": "N/A"
    },
    "issues": [
      "The solution completely ignores the 800 us OS preemption cost and the 18% thermal throttling penalty introduced in the prompt."
    ],
    "fix_suggestion": ""
  },
  {
    "id": "mobile-2025",
    "track": "mobile",
    "verdict_at_c3": "NEEDS_FIX",
    "yaml_path": "interviews/vault/questions/mobile/mobile-2025.yaml",
    "criteria": {
      "math_correct": "PASS",
      "cell_fit": "WARN",
      "scenario_realism": "PASS",
      "uniqueness": "PASS",
      "visual_alignment": "N/A"
    },
    "issues": [
      "L6+ level is a massive mismatch for a simple parameter count capacity subtraction problem."
    ],
    "fix_suggestion": "Lower the level to L3 or add advanced system-level architectural constraints to match L6+."
  },
  {
    "id": "mobile-2028",
    "track": "mobile",
    "verdict_at_c3": "DROP",
    "yaml_path": "interviews/vault/questions/mobile/mobile-2028.yaml",
    "criteria": {
      "math_correct": "ERROR",
      "cell_fit": "PASS",
      "scenario_realism": "PASS",
      "uniqueness": "PASS",
      "visual_alignment": "N/A"
    },
    "issues": [
      "The solution entirely fails to compute the budget for the mixed-precision fallback mode explicitly requested in the prompt."
    ],
    "fix_suggestion": ""
  },
  {
    "id": "tinyml-1562",
    "track": "tinyml",
    "verdict_at_c3": "NEEDS_FIX",
    "yaml_path": "interviews/vault/questions/tinyml/tinyml-1562.yaml",
    "criteria": {
      "math_correct": "PASS",
      "cell_fit": "PASS",
      "scenario_realism": "PASS",
      "uniqueness": "PASS",
      "visual_alignment": "WARN"
    },
    "issues": [
      "Visual describes a 1000 MB/s link, ignoring the encoding/TLP overhead explicitly calculated in the math."
    ],
    "fix_suggestion": "Update the visual alt text to reflect the effective 886 MB/s link capacity instead of the raw line rate."
  },
  {
    "id": "tinyml-1634",
    "track": "tinyml",
    "verdict_at_c3": "DROP",
    "yaml_path": "interviews/vault/questions/tinyml/tinyml-1634.yaml",
    "criteria": {
      "math_correct": "WARN",
      "cell_fit": "PASS",
      "scenario_realism": "WARN",
      "uniqueness": "PASS",
      "visual_alignment": "PASS"
    },
    "issues": [
      "Flash write speed of 100KB in 5ms (~20MB/s) is unrealistically fast for a Cortex-M4.",
      "Multiple WARNs result in DROP."
    ],
    "fix_suggestion": ""
  },
  {
    "id": "tinyml-1652",
    "track": "tinyml",
    "verdict_at_c3": "DROP",
    "yaml_path": "interviews/vault/questions/tinyml/tinyml-1652.yaml",
    "criteria": {
      "math_correct": "PASS",
      "cell_fit": "PASS",
      "scenario_realism": "WARN",
      "uniqueness": "WARN",
      "visual_alignment": "PASS"
    },
    "issues": [
      "Ring AllReduce on 3 bare-metal Cortex-M4 nodes is a highly synthetic scenario.",
      "Duplicates standard GPU Ring AllReduce template (uniqueness warning)."
    ],
    "fix_suggestion": ""
  },
  {
    "id": "tinyml-1661",
    "track": "tinyml",
    "verdict_at_c3": "NEEDS_FIX",
    "yaml_path": "interviews/vault/questions/tinyml/tinyml-1661.yaml",
    "criteria": {
      "math_correct": "WARN",
      "cell_fit": "PASS",
      "scenario_realism": "PASS",
      "uniqueness": "PASS",
      "visual_alignment": "PASS"
    },
    "issues": [
      "Solution incorrectly assumes the capacitor can fully discharge to 0V; it should account for the MCU brownout voltage threshold (e.g., ~1.8V)."
    ],
    "fix_suggestion": "Update the math to use E = 0.5 * C * (V_initial^2 - V_brownout^2) to reflect realistic usable energy."
  },
  {
    "id": "tinyml-1681",
    "track": "tinyml",
    "verdict_at_c3": "NEEDS_FIX",
    "yaml_path": "interviews/vault/questions/tinyml/tinyml-1681.yaml",
    "criteria": {
      "math_correct": "PASS",
      "cell_fit": "WARN",
      "scenario_realism": "PASS",
      "uniqueness": "PASS",
      "visual_alignment": "N/A"
    },
    "issues": [
      "Level mismatch: solution provides a rough 1.2x heuristic instead of the explicit L6+ cycle-accurate cost model requested."
    ],
    "fix_suggestion": "Upgrade the solution's mathematical complexity to match L6+ cycle-accurate modeling expectations, or downgrade the level."
  },
  {
    "id": "tinyml-1716",
    "track": "tinyml",
    "verdict_at_c3": "DROP",
    "yaml_path": "interviews/vault/questions/tinyml/tinyml-1716.yaml",
    "criteria": {
      "math_correct": "ERROR",
      "cell_fit": "PASS",
      "scenario_realism": "PASS",
      "uniqueness": "PASS",
      "visual_alignment": "N/A"
    },
    "issues": [
      "Solution completely ignores the 8% DMA contention factor it was explicitly asked to account for."
    ],
    "fix_suggestion": ""
  },
  {
    "id": "tinyml-1721",
    "track": "tinyml",
    "verdict_at_c3": "DROP",
    "yaml_path": "interviews/vault/questions/tinyml/tinyml-1721.yaml",
    "criteria": {
      "math_correct": "ERROR",
      "cell_fit": "PASS",
      "scenario_realism": "PASS",
      "uniqueness": "PASS",
      "visual_alignment": "N/A"
    },
    "issues": [
      "Solution fails to include the 3 uA leakage in the calculation and omits the battery lifetime estimation entirely."
    ],
    "fix_suggestion": ""
  },
  {
    "id": "tinyml-1723",
    "track": "tinyml",
    "verdict_at_c3": "DROP",
    "yaml_path": "interviews/vault/questions/tinyml/tinyml-1723.yaml",
    "criteria": {
      "math_correct": "ERROR",
      "cell_fit": "PASS",
      "scenario_realism": "PASS",
      "uniqueness": "PASS",
      "visual_alignment": "N/A"
    },
    "issues": [
      "Math merely adds single buffer sizes (14.5KB) instead of calculating the SRAM footprint for a true overlapped buffering scheme."
    ],
    "fix_suggestion": ""
  },
  {
    "id": "tinyml-1724",
    "track": "tinyml",
    "verdict_at_c3": "DROP",
    "yaml_path": "interviews/vault/questions/tinyml/tinyml-1724.yaml",
    "criteria": {
      "math_correct": "ERROR",
      "cell_fit": "PASS",
      "scenario_realism": "PASS",
      "uniqueness": "PASS",
      "visual_alignment": "N/A"
    },
    "issues": [
      "Solution ignores half the prompt and completely fails to answer which retention mode wins."
    ],
    "fix_suggestion": ""
  },
  {
    "id": "tinyml-1732",
    "track": "tinyml",
    "verdict_at_c3": "NEEDS_FIX",
    "yaml_path": "interviews/vault/questions/tinyml/tinyml-1732.yaml",
    "criteria": {
      "math_correct": "PASS",
      "cell_fit": "WARN",
      "scenario_realism": "PASS",
      "uniqueness": "PASS",
      "visual_alignment": "N/A"
    },
    "issues": [
      "Solution fails to address the specific L2 mechanics of half-transfer interrupts and pointer swapping asked in the prompt."
    ],
    "fix_suggestion": "Update the solution to explicitly explain the half-transfer and full-transfer interrupts and the pointer swap logic requested."
  }
]