Classify infrastructure short-span outlier families

2026-04-18 14:48:00 -07:00 · 2026-04-18 14:48:00 -07:00 · 1a0653cff1
commit 1a0653cff1
parent d998c08219
3 changed files with 446 additions and 0 deletions
--- a/crates/rrt-runtime/src/smp.rs
+++ b/crates/rrt-runtime/src/smp.rs
@ -1953,9 +1953,95 @@ pub struct SmpSavePlacedStructureDynamicSideBufferPayloadEnvelopeSummary {
    pub name_prelude_candidate_summary:
        Option<SmpSavePlacedStructureDynamicSideBufferNamePreludeCandidateSummary>,
    #[serde(default)]
    pub dominant_profile_span_class_summary:
        Option<SmpSavePlacedStructureDynamicSideBufferDominantProfileSpanClassSummary>,
    #[serde(default)]
    pub sample_rows: Vec<SmpSavePlacedStructureDynamicSideBufferPayloadEnvelopeSample>,
 }
 #[derive(Debug, Clone, PartialEq, Eq, Serialize, Deserialize)]
 pub struct SmpSavePlacedStructureDynamicSideBufferDominantProfileSpanClassSummary {
    pub profile_chunk_len_to_next_name_or_end: usize,
    pub row_count: usize,
    pub unique_name_pair_count: usize,
    pub unique_compact_prefix_pattern_count: usize,
    #[serde(default)]
    pub dominant_candidate_pattern:
        Option<SmpSavePlacedStructureDynamicSideBufferNamePreludeCandidatePattern>,
    #[serde(default)]
    pub dominant_primary_name: Option<String>,
    #[serde(default)]
    pub dominant_secondary_name: Option<String>,
    pub dominant_name_pair_count: usize,
    #[serde(default)]
    pub dominant_prefix_leading_dword: Option<u32>,
    #[serde(default)]
    pub dominant_prefix_leading_dword_hex: Option<String>,
    #[serde(default)]
    pub dominant_prefix_trailing_word: Option<u16>,
    #[serde(default)]
    pub dominant_prefix_trailing_word_hex: Option<String>,
    #[serde(default)]
    pub dominant_prefix_separator_byte: Option<u8>,
    #[serde(default)]
    pub dominant_prefix_separator_byte_hex: Option<String>,
    pub dominant_prefix_count: usize,
    #[serde(default)]
    pub sample_rows: Vec<SmpSavePlacedStructureDynamicSideBufferDominantProfileSpanSample>,
    #[serde(default)]
    pub name_pair_summaries: Vec<SmpSavePlacedStructureDynamicSideBufferDominantProfileSpanNamePairSummary>,
    #[serde(default)]
    pub compact_prefix_pattern_summaries:
        Vec<SmpSavePlacedStructureDynamicSideBufferDominantProfileSpanPrefixSummary>,
    #[serde(default)]
    pub candidate_pattern_summaries:
        Vec<SmpSavePlacedStructureDynamicSideBufferNamePreludeCandidatePattern>,
 }
 #[derive(Debug, Clone, PartialEq, Eq, Serialize, Deserialize)]
 pub struct SmpSavePlacedStructureDynamicSideBufferDominantProfileSpanSample {
    pub sample_index: usize,
    pub name_tag_relative_offset: usize,
    #[serde(default)]
    pub primary_name: Option<String>,
    #[serde(default)]
    pub secondary_name: Option<String>,
    pub prefix_leading_dword: u32,
    pub prefix_leading_dword_hex: String,
    pub prefix_trailing_word: u16,
    pub prefix_trailing_word_hex: String,
    pub prefix_separator_byte: u8,
    pub prefix_separator_byte_hex: String,
    #[serde(default)]
    pub child_count_candidate: Option<u16>,
    #[serde(default)]
    pub child_count_candidate_hex: Option<String>,
    #[serde(default)]
    pub saved_primary_child_byte_candidate: Option<u8>,
    #[serde(default)]
    pub saved_primary_child_byte_candidate_hex: Option<String>,
 }
 #[derive(Debug, Clone, PartialEq, Eq, Serialize, Deserialize)]
 pub struct SmpSavePlacedStructureDynamicSideBufferDominantProfileSpanNamePairSummary {
    #[serde(default)]
    pub primary_name: Option<String>,
    #[serde(default)]
    pub secondary_name: Option<String>,
    pub count: usize,
 }
 #[derive(Debug, Clone, PartialEq, Eq, Serialize, Deserialize)]
 pub struct SmpSavePlacedStructureDynamicSideBufferDominantProfileSpanPrefixSummary {
    pub prefix_leading_dword: u32,
    pub prefix_leading_dword_hex: String,
    pub prefix_trailing_word: u16,
    pub prefix_trailing_word_hex: String,
    pub prefix_separator_byte: u8,
    pub prefix_separator_byte_hex: String,
    pub count: usize,
 }
 #[derive(Debug, Clone, PartialEq, Eq, Serialize, Deserialize)]
 pub struct SmpSavePlacedStructureDynamicSideBufferFixedPolicySummary {
    pub row_count_with_0x1a_policy_chunk: usize,
@ -4314,6 +4400,90 @@ fn build_infrastructure_asset_trace_report(
                        .map(|summary| summary.dominant_trailing_word_count)
                        .unwrap_or_default()
                ),
                side_buffer
                    .and_then(|probe| probe.payload_envelope_summary.as_ref())
                    .and_then(|summary| summary.dominant_profile_span_class_summary.as_ref())
                    .map(|summary| {
                        format!(
                            "the dominant 0x{:x}-byte post-profile class is now narrowed too: dominant name pair is {:?}/{:?} x{}, dominant compact prefix is {}/{}/{} x{}, and dominant prelude candidate is {}/{} x{} across {} rows",
                            summary.profile_chunk_len_to_next_name_or_end,
                            summary.dominant_primary_name,
                            summary.dominant_secondary_name,
                            summary.dominant_name_pair_count,
                            summary
                                .dominant_prefix_leading_dword_hex
                                .as_deref()
                                .unwrap_or("0x00000000"),
                            summary
                                .dominant_prefix_trailing_word_hex
                                .as_deref()
                                .unwrap_or("0x0000"),
                            summary
                                .dominant_prefix_separator_byte_hex
                                .as_deref()
                                .unwrap_or("0x00"),
                            summary.dominant_prefix_count,
                            summary
                                .dominant_candidate_pattern
                                .as_ref()
                                .map(|pattern| pattern.child_count_candidate_hex.as_str())
                                .unwrap_or("0x0000"),
                            summary
                                .dominant_candidate_pattern
                                .as_ref()
                                .map(|pattern| pattern.saved_primary_child_byte_candidate_hex.as_str())
                                .unwrap_or("0x00"),
                            summary
                                .dominant_candidate_pattern
                                .as_ref()
                                .map(|pattern| pattern.count)
                                .unwrap_or_default(),
                            summary.row_count
                        )
                    })
                    .unwrap_or_else(|| {
                        "no dominant post-profile class summary was available for the embedded 0x55f3 spans".to_string()
                    }),
                side_buffer
                    .and_then(|probe| probe.payload_envelope_summary.as_ref())
                    .and_then(|summary| summary.dominant_profile_span_class_summary.as_ref())
                    .map(|summary| {
                        format!(
                            "the dominant post-profile outliers are now explicit too: name-pair counts={:?}, compact-prefix counts={:?}, candidate-pattern counts={:?}",
                            summary
                                .name_pair_summaries
                                .iter()
                                .map(|entry| format!(
                                    "{:?}/{:?}:{}",
                                    entry.primary_name, entry.secondary_name, entry.count
                                ))
                                .collect::<Vec<_>>(),
                            summary
                                .compact_prefix_pattern_summaries
                                .iter()
                                .map(|entry| format!(
                                    "{}/{}/{}:{}",
                                    entry.prefix_leading_dword_hex,
                                    entry.prefix_trailing_word_hex,
                                    entry.prefix_separator_byte_hex,
                                    entry.count
                                ))
                                .collect::<Vec<_>>(),
                            summary
                                .candidate_pattern_summaries
                                .iter()
                                .map(|entry| format!(
                                    "{}/{}:{}",
                                    entry.child_count_candidate_hex,
                                    entry.saved_primary_child_byte_candidate_hex,
                                    entry.count
                                ))
                                .collect::<Vec<_>>()
                        )
                    })
                    .unwrap_or_else(|| {
                        "no dominant post-profile outlier breakdown was available".to_string()
                    }),
                side_buffer
                    .and_then(|probe| probe.payload_envelope_summary.as_ref())
                    .and_then(|summary| summary.name_prelude_candidate_summary.as_ref())
@ -13140,6 +13310,256 @@ fn parse_save_placed_structure_dynamic_side_buffer_probe(
                    )
                    .collect(),
            });
        let dominant_profile_span_class_summary = dominant_profile_chunk_len
            .map(|(dominant_profile_span_len, _)| {
                let dominant_rows = embedded_name_rows
                    .iter()
                    .zip(payload_envelope_rows.iter())
                    .filter_map(|(name_row, envelope_row)| {
                        (envelope_row.profile_chunk_len_to_next_name_or_end
                            == Some(dominant_profile_span_len))
                            .then(|| {
                                let candidate_offset =
                                    name_row.name_tag_relative_offset.checked_sub(3);
                                let child_count_candidate = candidate_offset
                                    .and_then(|offset| read_u16_at(records_payload, offset));
                                let saved_primary_child_byte_candidate = candidate_offset
                                    .and_then(|offset| read_u8_at(records_payload, offset + 2));
                                (
                                    name_row.name_tag_relative_offset,
                                    name_row.primary_name.clone(),
                                    name_row.secondary_name.clone(),
                                    name_row.prefix_leading_dword,
                                    name_row.prefix_trailing_word,
                                    name_row.prefix_separator_byte,
                                    child_count_candidate,
                                    saved_primary_child_byte_candidate,
                                )
                            })
                    })
                    .collect::<Vec<_>>();
                let mut dominant_name_pair_counts =
                    BTreeMap::<(Option<String>, Option<String>), usize>::new();
                let mut dominant_prefix_counts = BTreeMap::<(u32, u16, u8), usize>::new();
                let mut dominant_candidate_pattern_counts = BTreeMap::<(u16, u8), usize>::new();
                for (
                    _,
                    primary_name,
                    secondary_name,
                    prefix_leading_dword,
                    prefix_trailing_word,
                    prefix_separator_byte,
                    child_count_candidate,
                    saved_primary_child_byte_candidate,
                ) in &dominant_rows
                {
                    *dominant_name_pair_counts
                        .entry((primary_name.clone(), secondary_name.clone()))
                        .or_default() += 1;
                    *dominant_prefix_counts
                        .entry((
                            *prefix_leading_dword,
                            *prefix_trailing_word,
                            *prefix_separator_byte,
                        ))
                        .or_default() += 1;
                    if let (Some(child_count_candidate), Some(saved_primary_child_byte_candidate)) =
                        (child_count_candidate, saved_primary_child_byte_candidate)
                    {
                        *dominant_candidate_pattern_counts
                            .entry((*child_count_candidate, *saved_primary_child_byte_candidate))
                            .or_default() += 1;
                    }
                }
                let dominant_name_pair = dominant_name_pair_counts
                    .iter()
                    .max_by(|(left_key, left_count), (right_key, right_count)| {
                        left_count
                            .cmp(right_count)
                            .then_with(|| right_key.cmp(left_key))
                    })
                    .map(|((primary_name, secondary_name), count)| {
                        (primary_name.clone(), secondary_name.clone(), *count)
                    });
                let dominant_prefix = dominant_prefix_counts
                    .iter()
                    .max_by(|(left_key, left_count), (right_key, right_count)| {
                        left_count
                            .cmp(right_count)
                            .then_with(|| right_key.cmp(left_key))
                    })
                    .map(
                        |((prefix_leading_dword, prefix_trailing_word, prefix_separator_byte), count)| {
                            (
                                *prefix_leading_dword,
                                *prefix_trailing_word,
                                *prefix_separator_byte,
                                *count,
                            )
                        },
                    );
                let dominant_candidate_pattern = dominant_candidate_pattern_counts
                    .iter()
                    .max_by(|(left_key, left_count), (right_key, right_count)| {
                        left_count
                            .cmp(right_count)
                            .then_with(|| right_key.cmp(left_key))
                    })
                    .map(
                        |((child_count_candidate, saved_primary_child_byte_candidate), count)| {
                            SmpSavePlacedStructureDynamicSideBufferNamePreludeCandidatePattern {
                                child_count_candidate: *child_count_candidate,
                                child_count_candidate_hex: format!(
                                    "0x{child_count_candidate:04x}"
                                ),
                                saved_primary_child_byte_candidate:
                                    *saved_primary_child_byte_candidate,
                                saved_primary_child_byte_candidate_hex: format!(
                                    "0x{saved_primary_child_byte_candidate:02x}"
                                ),
                                count: *count,
                            }
                        },
                    );
                let name_pair_summaries = dominant_name_pair_counts
                    .iter()
                    .map(|((primary_name, secondary_name), count)| {
                        SmpSavePlacedStructureDynamicSideBufferDominantProfileSpanNamePairSummary {
                            primary_name: primary_name.clone(),
                            secondary_name: secondary_name.clone(),
                            count: *count,
                        }
                    })
                    .take(8)
                    .collect::<Vec<_>>();
                let compact_prefix_pattern_summaries = dominant_prefix_counts
                    .iter()
                    .map(
                        |((prefix_leading_dword, prefix_trailing_word, prefix_separator_byte), count)| {
                            SmpSavePlacedStructureDynamicSideBufferDominantProfileSpanPrefixSummary {
                                prefix_leading_dword: *prefix_leading_dword,
                                prefix_leading_dword_hex: format!(
                                    "0x{prefix_leading_dword:08x}"
                                ),
                                prefix_trailing_word: *prefix_trailing_word,
                                prefix_trailing_word_hex: format!(
                                    "0x{prefix_trailing_word:04x}"
                                ),
                                prefix_separator_byte: *prefix_separator_byte,
                                prefix_separator_byte_hex: format!(
                                    "0x{prefix_separator_byte:02x}"
                                ),
                                count: *count,
                            }
                        },
                    )
                    .take(8)
                    .collect::<Vec<_>>();
                let candidate_pattern_summaries = dominant_candidate_pattern_counts
                    .iter()
                    .map(
                        |((child_count_candidate, saved_primary_child_byte_candidate), count)| {
                            SmpSavePlacedStructureDynamicSideBufferNamePreludeCandidatePattern {
                                child_count_candidate: *child_count_candidate,
                                child_count_candidate_hex: format!(
                                    "0x{child_count_candidate:04x}"
                                ),
                                saved_primary_child_byte_candidate:
                                    *saved_primary_child_byte_candidate,
                                saved_primary_child_byte_candidate_hex: format!(
                                    "0x{saved_primary_child_byte_candidate:02x}"
                                ),
                                count: *count,
                            }
                        },
                    )
                    .take(8)
                    .collect::<Vec<_>>();
                SmpSavePlacedStructureDynamicSideBufferDominantProfileSpanClassSummary {
                    profile_chunk_len_to_next_name_or_end: dominant_profile_span_len,
                    row_count: dominant_rows.len(),
                    unique_name_pair_count: dominant_name_pair_counts.len(),
                    unique_compact_prefix_pattern_count: dominant_prefix_counts.len(),
                    dominant_candidate_pattern,
                    dominant_primary_name: dominant_name_pair
                        .as_ref()
                        .and_then(|(primary_name, _, _)| primary_name.clone()),
                    dominant_secondary_name: dominant_name_pair
                        .as_ref()
                        .and_then(|(_, secondary_name, _)| secondary_name.clone()),
                    dominant_name_pair_count: dominant_name_pair
                        .map(|(_, _, count)| count)
                        .unwrap_or_default(),
                    dominant_prefix_leading_dword: dominant_prefix
                        .map(|(prefix_leading_dword, _, _, _)| prefix_leading_dword),
                    dominant_prefix_leading_dword_hex: dominant_prefix.map(
                        |(prefix_leading_dword, _, _, _)| format!("0x{prefix_leading_dword:08x}"),
                    ),
                    dominant_prefix_trailing_word: dominant_prefix
                        .map(|(_, prefix_trailing_word, _, _)| prefix_trailing_word),
                    dominant_prefix_trailing_word_hex: dominant_prefix.map(
                        |(_, prefix_trailing_word, _, _)| format!("0x{prefix_trailing_word:04x}"),
                    ),
                    dominant_prefix_separator_byte: dominant_prefix
                        .map(|(_, _, prefix_separator_byte, _)| prefix_separator_byte),
                    dominant_prefix_separator_byte_hex: dominant_prefix.map(
                        |(_, _, prefix_separator_byte, _)| format!("0x{prefix_separator_byte:02x}"),
                    ),
                    dominant_prefix_count: dominant_prefix
                        .map(|(_, _, _, count)| count)
                        .unwrap_or_default(),
                    sample_rows: dominant_rows
                        .iter()
                        .take(8)
                        .enumerate()
                        .map(
                            |(
                                sample_index,
                                (
                                    name_tag_relative_offset,
                                    primary_name,
                                    secondary_name,
                                    prefix_leading_dword,
                                    prefix_trailing_word,
                                    prefix_separator_byte,
                                    child_count_candidate,
                                    saved_primary_child_byte_candidate,
                                ),
                            )| {
                                SmpSavePlacedStructureDynamicSideBufferDominantProfileSpanSample {
                                    sample_index,
                                    name_tag_relative_offset: *name_tag_relative_offset,
                                    primary_name: primary_name.clone(),
                                    secondary_name: secondary_name.clone(),
                                    prefix_leading_dword: *prefix_leading_dword,
                                    prefix_leading_dword_hex: format!(
                                        "0x{prefix_leading_dword:08x}"
                                    ),
                                    prefix_trailing_word: *prefix_trailing_word,
                                    prefix_trailing_word_hex: format!(
                                        "0x{prefix_trailing_word:04x}"
                                    ),
                                    prefix_separator_byte: *prefix_separator_byte,
                                    prefix_separator_byte_hex: format!(
                                        "0x{prefix_separator_byte:02x}"
                                    ),
                                    child_count_candidate: *child_count_candidate,
                                    child_count_candidate_hex: child_count_candidate
                                        .map(|value| format!("0x{value:04x}")),
                                    saved_primary_child_byte_candidate:
                                        *saved_primary_child_byte_candidate,
                                    saved_primary_child_byte_candidate_hex:
                                        saved_primary_child_byte_candidate
                                            .map(|value| format!("0x{value:02x}")),
                                }
                            },
                        )
                        .collect(),
                    name_pair_summaries,
                    compact_prefix_pattern_summaries,
                    candidate_pattern_summaries,
                }
            });
        let payload_envelope_summary = Some(
            SmpSavePlacedStructureDynamicSideBufferPayloadEnvelopeSummary {
                row_count_with_policy_tag_before_next_name,
@ -13159,6 +13579,7 @@ fn parse_save_placed_structure_dynamic_side_buffer_probe(
                short_profile_flag_pair_summary: short_profile_flag_pair_summary.clone(),
                fixed_policy_summary: fixed_policy_summary.clone(),
                name_prelude_candidate_summary: name_prelude_candidate_summary.clone(),
                dominant_profile_span_class_summary: dominant_profile_span_class_summary.clone(),
                sample_rows: payload_envelope_rows
                    .iter()
                    .take(8)
@ -23666,6 +24087,7 @@ mod tests {
                                sample_rows: Vec::new(),
                            },
                        ),
                        dominant_profile_span_class_summary: None,
                        sample_rows: Vec::new(),
                    },
                ),
--- a/docs/control-loop-atlas/runtime-roots-camera-and-support-families.md
+++ b/docs/control-loop-atlas/runtime-roots-camera-and-support-families.md
@ -2980,6 +2980,18 @@ The low helper strip beneath that shared family is tighter now too: `0x0052ecd0`
  while the zero-length class is a separate `0x0055 / 0x00` outlier across `18/18` rows and the
  `0x06` class is the only large mixed frontier left. So the next infrastructure pass should focus
  on classifying the mixed `0x06` rows instead of re-proving the pure-prelude `0x03` class.
  That `0x06` class is now narrower too: grounded `q.gms` shows the dominant short-span family as
  `BridgeSTWood_Section.3dp / Infrastructure` with compact prefix `0xff000000 / 0x0001 / 0xff`
  across `62/72` rows and dominant prelude candidate `0x0001 / 0xff` across `63/72` rows. So the
  next infrastructure pass should stop treating all short rows as equally ambiguous and focus on
  the smaller outlier families inside that class, especially the `BallastCap`-style zero-like
  rows and any remaining non-`0x0001 / 0xff` prelude candidates.
  Those outliers are explicit now too: the remaining `10` short-span rows on grounded `q.gms`
  break into `9` `BallastCapST_Cap.3dp / Infrastructure` rows with compact prefix
  `0xf3010100 / 0x0055 / 0x00` and candidate pattern `0x0055 / 0x00`, plus `1`
  `TrackCapST_Cap.3dp / Infrastructure` row with compact prefix `0xff0000ff / 0x0001 / 0xff`.
  So the next infrastructure pass should target the `BallastCap` outlier family first instead of
  spending time on the already-dominant bridge-section class.
  The child loader family is explicit now too: local `.rdata` at `0x005cfd00` proves the
  `Infrastructure` child vtable uses the shared tagged callback strip directly, with
  `+0x40 = 0x00455fc0`, `+0x48 = 0x00455870`, and `+0x4c = 0x00455930`. So the remaining
--- a/docs/rehost-queue.md
+++ b/docs/rehost-queue.md
@ -131,6 +131,18 @@ Working rule:
  with dominant pattern `0x0055 / 0x00` across `18/18` rows and the `0x06` class remains the only
  large mixed frontier. So the next infrastructure slice should focus on classifying the mixed
  `0x06` rows, not on rediscovering the already-grounded pure-prelude `0x03` rows.
 - That `0x06` class is now narrower too: grounded `q.gms` shows the dominant short-span class as
  `BridgeSTWood_Section.3dp / Infrastructure` with compact prefix `0xff000000 / 0x0001 / 0xff`
  across `62/72` rows and dominant prelude candidate `0x0001 / 0xff` across `63/72` rows. So the
  next infrastructure slice should stop treating the `0x06` class as uniformly ambiguous and focus
  on the smaller outlier families inside that class, especially the zero-like `BallastCap`-style
  rows and any remaining non-`0x0001 / 0xff` prelude candidates.
 - Those outliers are explicit now too: the remaining `10` short-span rows on grounded `q.gms`
  break into `9` `BallastCapST_Cap.3dp / Infrastructure` rows with compact prefix
  `0xf3010100 / 0x0055 / 0x00` and candidate pattern `0x0055 / 0x00`, plus `1`
  `TrackCapST_Cap.3dp / Infrastructure` row with compact prefix `0xff0000ff / 0x0001 / 0xff`.
  So the next infrastructure slice should target the `BallastCap` outlier family first, not the
  already-dominant bridge-section class.
 - Reconstruct the save-side region record body on top of the newly corrected non-direct tagged
  region seam (`0x5209/0x520a/0x520b`, stride hint `0x06`, `Marker09` record stems) now that the
  `0x55f3` payload is known to be fully consumed by the embedded profile collection on grounded