waffle/src/ir.rs

476 lines
13 KiB
Rust
Raw Normal View History

2021-11-13 06:16:54 +00:00
//! Intermediate representation for Wasm.
use std::collections::hash_map::Entry;
2021-12-03 07:33:04 +00:00
use crate::{backend::Shape, cfg::CFGInfo, frontend, Operator};
2021-11-14 01:52:30 +00:00
use anyhow::Result;
2021-11-22 01:15:26 +00:00
use fxhash::FxHashMap;
2021-12-03 07:33:04 +00:00
use wasmparser::{FuncType, Type};
2021-11-13 06:16:54 +00:00
/// Identifier of a function signature.
///
/// NOTE(review): presumably an index into `Module::signatures` — confirm against callers.
pub type SignatureId = usize;
/// Identifier of a function.
///
/// NOTE(review): presumably an index into `Module::funcs` — confirm against callers.
pub type FuncId = usize;
/// Identifier of a basic block: its position in `FunctionBody::blocks`.
pub type BlockId = usize;
/// Identifier of an instruction.
pub type InstId = usize;
/// Identifier of a local: its position in `FunctionBody::locals`.
pub type LocalId = u32;
/// Identifier of a global.
pub type GlobalId = u32;
/// Identifier of a table.
pub type TableId = u32;
/// Identifier of a memory.
pub type MemoryId = u32;

/// Sentinel `BlockId` (`usize::MAX`) that never names a real block.
pub const INVALID_BLOCK: BlockId = usize::MAX;
2021-11-13 22:23:22 +00:00
#[derive(Clone, Debug, Default)]
2021-11-13 10:32:05 +00:00
pub struct Module<'a> {
2021-11-14 08:00:34 +00:00
pub orig_bytes: &'a [u8],
2021-11-22 07:12:07 +00:00
pub funcs: Vec<FuncDecl>,
2021-11-13 06:16:54 +00:00
pub signatures: Vec<FuncType>,
pub globals: Vec<Type>,
pub tables: Vec<Type>,
2021-11-13 06:16:54 +00:00
}
#[derive(Clone, Debug)]
2021-11-22 07:12:07 +00:00
pub enum FuncDecl {
2021-11-13 06:16:54 +00:00
Import(SignatureId),
2021-11-22 07:12:07 +00:00
Body(SignatureId, FunctionBody),
2021-11-13 10:32:05 +00:00
}
2021-11-22 07:12:07 +00:00
impl FuncDecl {
2021-11-13 10:32:05 +00:00
pub fn sig(&self) -> SignatureId {
match self {
2021-11-13 11:49:19 +00:00
FuncDecl::Import(sig) => *sig,
FuncDecl::Body(sig, ..) => *sig,
2021-11-13 10:32:05 +00:00
}
}
2021-11-13 06:16:54 +00:00
}
#[derive(Clone, Debug, Default)]
2021-11-22 07:12:07 +00:00
pub struct FunctionBody {
2021-11-13 06:16:54 +00:00
pub locals: Vec<Type>,
2021-11-22 07:12:07 +00:00
pub blocks: Vec<Block>,
2021-12-03 07:33:04 +00:00
/// Sea-of-nodes representation.
pub values: Vec<ValueDef>,
value_dedup: FxHashMap<ValueDef, Value>,
pub types: Vec</* Value, */ Option<Type>>,
}
2021-12-03 07:33:04 +00:00
impl FunctionBody {
pub fn add_block(&mut self) -> BlockId {
let id = self.blocks.len();
self.blocks.push(Block::default());
self.blocks[id].id = id;
id
}
2021-12-03 07:33:04 +00:00
pub fn add_edge(&mut self, from: BlockId, to: BlockId) {
let succ_pos = self.blocks[from].succs.len();
let pred_pos = self.blocks[to].preds.len();
self.blocks[from].succs.push(to);
self.blocks[to].preds.push(from);
self.blocks[from].pos_in_succ_pred.push(pred_pos);
self.blocks[to].pos_in_pred_succ.push(succ_pos);
2021-11-15 07:56:56 +00:00
}
2021-12-03 07:33:04 +00:00
pub fn add_value(&mut self, value: ValueDef, ty: Option<Type>) -> Value {
match self.value_dedup.entry(value.clone()) {
Entry::Occupied(o) => *o.get(),
Entry::Vacant(v) => {
let id = Value(self.values.len() as u32);
self.values.push(value);
self.types.push(ty);
v.insert(id);
id
}
}
}
pub fn set_alias(&mut self, value: Value, to: Value) {
// Resolve the `to` value through all existing aliases.
let to = self.resolve_alias(to);
// Disallow cycles.
if to == value {
panic!("Cannot create an alias cycle");
}
self.values[value.index()] = ValueDef::Alias(to);
}
pub fn resolve_alias(&self, value: Value) -> Value {
let mut result = value;
loop {
if let &ValueDef::Alias(to) = &self.values[result.index()] {
result = to;
} else {
break;
}
}
result
}
pub fn add_mutable_inst(&mut self, ty: Option<Type>, def: ValueDef) -> Value {
let value = Value(self.values.len() as u32);
2021-12-03 07:33:04 +00:00
self.types.push(ty);
self.values.push(def);
value
}
pub fn add_blockparam(&mut self, block: BlockId, ty: Type) {
self.blocks[block].params.push(ty);
}
pub fn add_placeholder(&mut self, ty: Type) -> Value {
self.add_mutable_inst(Some(ty), ValueDef::Placeholder)
}
pub fn replace_placeholder_with_blockparam(&mut self, block: BlockId, value: Value) {
assert!(self.values[value.index()] == ValueDef::Placeholder);
let ty = self.types[value.index()].unwrap();
let index = self.blocks[block].params.len();
self.blocks[block].params.push(ty);
self.values[value.index()] = ValueDef::BlockParam(block, index);
}
pub fn resolve_and_update_alias(&mut self, value: Value) -> Value {
let to = self.resolve_alias(value);
// Short-circuit the chain, union-find-style.
if let &ValueDef::Alias(orig_to) = &self.values[value.index()] {
if orig_to != to {
self.values[value.index()] = ValueDef::Alias(to);
}
}
to
2021-11-15 07:56:56 +00:00
}
2021-12-03 07:33:04 +00:00
pub fn append_to_block(&mut self, block: BlockId, value: Value) {
self.blocks[block].insts.push(value);
2021-11-15 07:56:56 +00:00
}
2021-12-03 07:33:04 +00:00
pub fn end_block(&mut self, block: BlockId, terminator: Terminator) {
terminator.visit_successors(|succ| {
self.add_edge(block, succ);
});
self.blocks[block].terminator = terminator;
2021-11-15 07:56:56 +00:00
}
2021-12-03 07:33:04 +00:00
pub fn add_local(&mut self, ty: Type) -> LocalId {
let id = self.locals.len() as LocalId;
self.locals.push(ty);
id
}
}
2021-12-03 07:33:04 +00:00
/// `body[value]` yields the definition stored for `value`.
impl std::ops::Index<Value> for FunctionBody {
    type Output = ValueDef;

    fn index(&self, index: Value) -> &ValueDef {
        &self.values[index.index()]
    }
}

/// `body[value]` as a mutable place: the definition stored for `value`.
impl std::ops::IndexMut<Value> for FunctionBody {
    fn index_mut(&mut self, index: Value) -> &mut ValueDef {
        &mut self.values[index.index()]
    }
}

/// `body[block_id]` yields the block at that position in `blocks`.
impl std::ops::Index<BlockId> for FunctionBody {
    type Output = Block;

    fn index(&self, index: BlockId) -> &Block {
        &self.blocks[index]
    }
}

/// `body[block_id]` as a mutable place: the block at that position in `blocks`.
impl std::ops::IndexMut<BlockId> for FunctionBody {
    fn index_mut(&mut self, index: BlockId) -> &mut Block {
        &mut self.blocks[index]
    }
}
2021-12-03 07:33:04 +00:00
/// A basic block of a function body.
#[derive(Clone, Debug, Default)]
pub struct Block {
    /// This block's own id; `FunctionBody::add_block` sets it to the block's
    /// position in `FunctionBody::blocks`.
    pub id: BlockId,
    /// Side-effecting values from the sea-of-nodes that are computed, in order.
    pub insts: Vec<Value>,
    /// Terminator: branch or return.
    pub terminator: Terminator,
    /// Successor blocks.
    pub succs: Vec<BlockId>,
    /// For each successor block, our index in its `preds` array.
    pub pos_in_succ_pred: Vec<usize>,
    /// Predecessor blocks.
    pub preds: Vec<BlockId>,
    /// For each predecessor block, our index in its `succs` array.
    pub pos_in_pred_succ: Vec<usize>,
    /// Type of each blockparam.
    pub params: Vec<Type>,
}
2021-12-03 07:33:04 +00:00
/// Compact handle naming one entry of a function body's value table.
///
/// The wrapped `u32` is the entry's index; `u32::MAX` is reserved for the
/// "undefined" handle returned by [`Value::undef`].
#[derive(Clone, Copy, Debug, PartialEq, Eq, PartialOrd, Ord, Hash)]
pub struct Value(u32);

/// Formats the handle as `v<index>`, e.g. `v42`.
impl std::fmt::Display for Value {
    fn fmt(&self, f: &mut std::fmt::Formatter) -> std::fmt::Result {
        write!(f, "v{}", self.0)
    }
}

impl Value {
    /// Returns the reserved "undefined" handle (`u32::MAX`).
    pub fn undef() -> Self {
        Value(u32::MAX)
    }

    /// Returns the handle's index as a `usize`.
    pub fn index(self) -> usize {
        self.0 as usize
    }

    /// Builds a handle from an index.
    ///
    /// # Panics
    ///
    /// Panics if `value` does not fit in a `u32`. A silent truncation here
    /// would make the handle refer to an unrelated value.
    pub fn from_index(value: usize) -> Value {
        assert!(
            value <= u32::MAX as usize,
            "value index {} does not fit in u32",
            value
        );
        Self(value as u32)
    }
}

/// The default handle is the undefined one.
impl std::default::Default for Value {
    fn default() -> Self {
        Value::undef()
    }
}
2021-11-22 01:15:26 +00:00
2021-12-03 07:33:04 +00:00
#[derive(Clone, Debug, PartialEq, Eq, Hash)]
pub enum ValueDef {
Arg(usize),
BlockParam(BlockId, usize),
Operator(Operator, Vec<Value>),
PickOutput(Value, usize),
Alias(Value),
Placeholder,
2021-12-03 07:33:04 +00:00
}
2021-11-22 01:15:26 +00:00
2021-12-03 07:33:04 +00:00
impl ValueDef {
pub fn visit_uses<F: FnMut(Value)>(&self, mut f: F) {
match self {
2021-12-03 07:34:57 +00:00
&ValueDef::Arg { .. } => {}
&ValueDef::BlockParam { .. } => {}
&ValueDef::Operator(_, ref args) => {
2021-12-03 07:33:04 +00:00
for &arg in args {
f(arg);
}
}
&ValueDef::PickOutput(from, ..) => f(from),
&ValueDef::Alias(value) => f(value),
&ValueDef::Placeholder => {}
2021-11-22 01:15:26 +00:00
}
}
2021-11-22 07:12:07 +00:00
2021-12-03 07:33:04 +00:00
pub fn update_uses<F: FnMut(&mut Value)>(&mut self, mut f: F) {
match self {
2021-12-03 07:34:57 +00:00
&mut ValueDef::Arg { .. } => {}
&mut ValueDef::BlockParam { .. } => {}
&mut ValueDef::Operator(_, ref mut args) => {
2021-12-03 07:34:57 +00:00
for arg in args {
2021-12-03 07:33:04 +00:00
f(arg);
}
}
&mut ValueDef::PickOutput(ref mut from, ..) => f(from),
&mut ValueDef::Alias(ref mut value) => f(value),
&mut ValueDef::Placeholder => {}
2021-11-22 01:15:26 +00:00
}
}
}
/// Destination of a branch: a block plus the values passed along with it.
#[derive(Clone, Debug)]
pub struct BlockTarget {
    /// The block being branched to.
    pub block: BlockId,
    /// Values passed to the destination block.
    ///
    /// NOTE(review): presumably one per entry in the destination's `params` —
    /// confirm.
    pub args: Vec<Value>,
}
2021-11-13 11:38:47 +00:00
#[derive(Clone, Debug)]
2021-11-14 08:00:34 +00:00
pub enum Terminator {
2021-11-13 11:38:47 +00:00
Br {
target: BlockTarget,
2021-11-13 11:38:47 +00:00
},
CondBr {
2021-11-22 01:15:26 +00:00
cond: Value,
if_true: BlockTarget,
if_false: BlockTarget,
2021-11-13 11:38:47 +00:00
},
Select {
2021-11-22 01:15:26 +00:00
value: Value,
targets: Vec<BlockTarget>,
default: BlockTarget,
2021-11-13 11:38:47 +00:00
},
Return {
2021-11-22 01:15:26 +00:00
values: Vec<Value>,
2021-11-13 11:38:47 +00:00
},
None,
}
2021-11-14 08:00:34 +00:00
impl std::default::Default for Terminator {
2021-11-13 11:38:47 +00:00
fn default() -> Self {
Terminator::None
}
}
2021-11-14 01:52:30 +00:00
2021-11-14 08:00:34 +00:00
impl Terminator {
pub fn visit_targets<F: FnMut(&BlockTarget)>(&self, mut f: F) {
2021-11-14 08:00:34 +00:00
match self {
2021-12-03 07:33:04 +00:00
Terminator::Return { .. } => {}
Terminator::Br { ref target, .. } => f(target),
2021-11-14 08:00:34 +00:00
Terminator::CondBr {
ref if_true,
ref if_false,
..
2021-11-14 08:00:34 +00:00
} => {
f(if_true);
f(if_false);
2021-11-14 08:00:34 +00:00
}
2021-11-14 04:59:37 +00:00
Terminator::Select {
ref targets,
ref default,
..
} => {
f(default);
for target in targets {
f(target);
}
}
Terminator::None => {}
}
}
pub fn update_targets<F: FnMut(&mut BlockTarget)>(&mut self, mut f: F) {
match self {
Terminator::Return { .. } => {}
Terminator::Br { ref mut target, .. } => f(target),
Terminator::CondBr {
ref mut if_true,
ref mut if_false,
2021-11-14 04:59:37 +00:00
..
} => {
f(if_true);
f(if_false);
}
Terminator::Select {
ref mut targets,
ref mut default,
..
} => {
f(default);
for target in targets {
2021-12-03 07:33:04 +00:00
f(target);
}
2021-11-14 04:59:37 +00:00
}
2021-12-03 07:33:04 +00:00
Terminator::None => {}
2021-11-14 04:59:37 +00:00
}
2021-11-14 01:52:30 +00:00
}
2021-11-22 07:12:07 +00:00
pub fn visit_target<F: FnMut(&BlockTarget)>(&self, index: usize, mut f: F) {
match (index, self) {
(0, Terminator::Br { ref target, .. }) => f(target),
(0, Terminator::CondBr { ref if_true, .. }) => {
f(if_true);
}
(1, Terminator::CondBr { ref if_false, .. }) => {
f(if_false);
}
(0, Terminator::Select { ref default, .. }) => {
f(default);
}
(i, Terminator::Select { ref targets, .. }) if i <= targets.len() => {
f(&targets[i - 1]);
}
_ => panic!("out of bounds"),
}
}
pub fn update_target<F: FnMut(&mut BlockTarget)>(&mut self, index: usize, mut f: F) {
match (index, self) {
(0, Terminator::Br { ref mut target, .. }) => f(target),
(
0,
Terminator::CondBr {
ref mut if_true, ..
},
) => {
f(if_true);
}
(
1,
Terminator::CondBr {
ref mut if_false, ..
},
) => {
f(if_false);
}
(
0,
Terminator::Select {
ref mut default, ..
},
) => {
f(default);
}
(
i,
Terminator::Select {
ref mut targets, ..
},
) if i <= targets.len() => {
f(&mut targets[i - 1]);
}
_ => panic!("out of bounds"),
}
}
pub fn visit_successors<F: FnMut(BlockId)>(&self, mut f: F) {
self.visit_targets(|target| f(target.block));
}
2021-11-22 07:12:07 +00:00
pub fn visit_uses<F: FnMut(Value)>(&self, mut f: F) {
self.visit_targets(|target| {
for &arg in &target.args {
f(arg);
}
});
2021-11-22 07:12:07 +00:00
match self {
&Terminator::CondBr { cond, .. } => f(cond),
&Terminator::Select { value, .. } => f(value),
&Terminator::Return { ref values, .. } => {
for &value in values {
f(value);
}
}
_ => {}
}
}
pub fn update_uses<F: FnMut(&mut Value)>(&mut self, mut f: F) {
self.update_targets(|target| {
for arg in &mut target.args {
f(arg);
}
});
2021-11-22 07:12:07 +00:00
match self {
&mut Terminator::CondBr { ref mut cond, .. } => f(cond),
&mut Terminator::Select { ref mut value, .. } => f(value),
&mut Terminator::Return { ref mut values, .. } => {
for value in values {
f(value);
}
}
_ => {}
}
}
2021-11-14 01:52:30 +00:00
}
2021-12-03 07:33:04 +00:00
impl<'a> Module<'a> {
    /// Builds a module from `bytes` by delegating to `frontend::wasm_to_ir`.
    ///
    /// # Errors
    ///
    /// Returns whatever error `frontend::wasm_to_ir` reports.
    pub fn from_wasm_bytes(bytes: &'a [u8]) -> Result<Self> {
        frontend::wasm_to_ir(bytes)
    }

    /// Consumes the module and returns Wasm bytes.
    ///
    /// Code generation is not implemented yet: CFG info and a shape are
    /// computed for every function body and then discarded, and a copy of
    /// `orig_bytes` is returned.
    pub fn to_wasm_bytes(self) -> Vec<u8> {
        for decl in &self.funcs {
            if let FuncDecl::Body(_, body) = decl {
                let cfg = CFGInfo::new(body);
                let _shape = Shape::compute(body, &cfg);
            }
        }
        // TODO
        self.orig_bytes.to_vec()
    }
}