Wasm: Parse the Code section to collect metadata for dead function elimination

This commit is contained in:
Brian Carroll 2022-01-11 09:43:14 +00:00
parent 48f14f9a83
commit 61d46be923

View file

@ -667,6 +667,29 @@ pub struct CodeSection<'a> {
pub code_builders: Vec<'a, CodeBuilder<'a>>,
}
#[derive(Debug)]
pub struct DeadCodeMetadata<'a> {
/// Byte offset (in the module) where each function body can be found
code_offsets: Vec<'a, u32>,
/// Vector with one entry per *call*, containing the called function's index
calls: Vec<'a, u32>,
/// Vector with one entry per *function*, indicating its offset in `calls`
calls_offsets: Vec<'a, u32>,
/// Return types of each function (for making almost-empty dummy replacements)
ret_types: Vec<'a, u8>,
}
impl<'a> DeadCodeMetadata<'a> {
pub fn new(arena: &'a Bump, func_count: usize) -> Self {
DeadCodeMetadata {
code_offsets: Vec::with_capacity_in(func_count, arena),
ret_types: Vec::with_capacity_in(func_count, arena),
calls: Vec::with_capacity_in(2 * func_count, arena),
calls_offsets: Vec::with_capacity_in(1 + func_count, arena),
}
}
}
impl<'a> CodeSection<'a> {
/// Serialize the code builders for all functions, and get code relocations with final offsets
pub fn serialize_with_relocs<T: SerialBuffer>(
@ -704,6 +727,61 @@ impl<'a> CodeSection<'a> {
code_builders: Vec::with_capacity_in(0, arena),
}
}
/// Parse a Code section, collecting metadata that we can use to figure out
/// which functions are actually called, and which are not.
/// This would normally be done in a linker optimisation, but we want to be able to
/// use this backend without a linker.
pub fn parse_dead_code_metadata(
arena: &'a Bump,
module_bytes: &[u8],
cursor: &mut usize,
) -> DeadCodeMetadata<'a> {
if module_bytes[*cursor] != SectionId::Code as u8 {
internal_error!("Expected Code section in object file at offset {}", *cursor);
}
*cursor += 1;
let section_size = parse_u32_or_panic(module_bytes, cursor);
let count_start = *cursor;
let section_end = count_start + section_size as usize;
let func_count = parse_u32_or_panic(module_bytes, cursor);
let mut metadata = DeadCodeMetadata::new(arena, func_count as usize);
while *cursor < section_end {
metadata.code_offsets.push(*cursor as u32);
metadata.calls_offsets.push(metadata.calls.len() as u32);
let func_size = parse_u32_or_panic(module_bytes, cursor);
let func_end = *cursor + func_size as usize;
// Local variable declarations
let local_groups_count = parse_u32_or_panic(module_bytes, cursor);
for _ in 0..local_groups_count {
let _group_len = parse_u32_or_panic(module_bytes, cursor);
*cursor += 1; // ValueType
}
// Instructions
while *cursor < func_end {
let opcode_byte: u8 = module_bytes[*cursor];
if opcode_byte == OpCode::CALL as u8 {
*cursor += 1;
let call_index = parse_u32_or_panic(module_bytes, cursor);
metadata.calls.push(call_index as u32);
} else {
OpCode::skip_bytes(module_bytes, cursor);
}
}
}
// Extra entries to mark the end of the last function
metadata.code_offsets.push(*cursor as u32);
metadata.calls_offsets.push(metadata.calls.len() as u32);
metadata
}
}
impl<'a> Serialize for CodeSection<'a> {