The old src/ppc.rs that re-implemented PPC formatting collapses into a 30-line shim that delegates to xenia-cpu's single-source-of-truth disasm. A new disasm.rs wraps the shared iterator and feeds enriched items (analysis context: function membership, xrefs, mnemonics) into pluggable sinks. Sinks split: text.rs (objdump-like output), json.rs (JSONL stream matching the new xenia dis --json mode), duckdb.rs (the analysis DB ingest). db.rs is restructured into ingest_instructions + write_analysis_results so a run can stop after raw ingest, and a new target_hex column lands on the instructions table. sql_views.rs adds five additive views layered on top of the raw tables. Tests: assert-based JSON-fixture goldens (disasm_goldens) and a PRAGMA-table_info schema golden (db_schema_golden) covering all ingested tables and the SQL views. Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
64 lines
1.9 KiB
Rust
64 lines
1.9 KiB
Rust
//! JSON Lines sink — one structured row per line, constant memory.
|
|
//!
|
|
//! Suited for piping into `jq`, importing into pandas / DuckDB's
|
|
//! `read_json_auto`, or feeding downstream tooling that expects a
|
|
//! line-delimited stream rather than a single megaobject.
|
|
|
|
use std::io::{self, Write};
|
|
|
|
use serde::Serialize;
|
|
|
|
use crate::disasm::RichDisasmItem;
|
|
|
|
#[derive(Serialize)]
|
|
struct JsonRow<'a> {
|
|
addr: u32,
|
|
raw: u32,
|
|
mnemonic: &'a str,
|
|
operands: &'a str,
|
|
disasm: &'a str,
|
|
#[serde(skip_serializing_if = "Option::is_none")]
|
|
ext_mnemonic: Option<&'a str>,
|
|
#[serde(skip_serializing_if = "Option::is_none")]
|
|
ext_operands: Option<&'a str>,
|
|
#[serde(skip_serializing_if = "Option::is_none")]
|
|
ext_disasm: Option<&'a str>,
|
|
#[serde(skip_serializing_if = "Option::is_none")]
|
|
branch_target: Option<u32>,
|
|
section: &'a str,
|
|
#[serde(skip_serializing_if = "Option::is_none")]
|
|
function: Option<u32>,
|
|
#[serde(skip_serializing_if = "Option::is_none")]
|
|
label: Option<&'a str>,
|
|
}
|
|
|
|
/// Write each item as a single JSON object on its own line. Returns the
|
|
/// number of rows written.
|
|
pub fn write_jsonl<'a, W: Write>(
|
|
out: &mut W,
|
|
items: impl IntoIterator<Item = RichDisasmItem<'a>>,
|
|
) -> io::Result<u64> {
|
|
let mut count: u64 = 0;
|
|
for ri in items {
|
|
let t = &ri.item.text;
|
|
let row = JsonRow {
|
|
addr: ri.item.addr,
|
|
raw: ri.item.raw,
|
|
mnemonic: &t.mnemonic,
|
|
operands: &t.operands,
|
|
disasm: &t.disasm,
|
|
ext_mnemonic: t.ext_mnemonic.as_deref(),
|
|
ext_operands: t.ext_operands.as_deref(),
|
|
ext_disasm: t.ext_disasm.as_deref(),
|
|
branch_target: t.branch_target,
|
|
section: ri.section,
|
|
function: ri.function,
|
|
label: ri.label,
|
|
};
|
|
serde_json::to_writer(&mut *out, &row)?;
|
|
out.write_all(b"\n")?;
|
|
count += 1;
|
|
}
|
|
Ok(count)
|
|
}
|