Wasynth/wasm/src/writer/luajit.rs
2021-12-14 04:31:53 -05:00

753 lines
17 KiB
Rust

use std::{collections::BTreeSet, io::Result};
use parity_wasm::elements::{External, ImportCountType, Instruction, Internal, Module};
use crate::{
analyzer::{localize, memory},
ast::{
builder::{Arities, Builder},
node::{
AnyBinOp, AnyCmpOp, AnyLoad, AnyStore, AnyUnOp, Backward, Br, BrIf, BrTable, Call,
CallIndirect, Else, Expression, Forward, Function, GetGlobal, GetLocal, If, Memorize,
MemoryGrow, MemorySize, Recall, Return, Select, SetGlobal, SetLocal, Statement, Value,
},
},
};
use super::{
shared::{
aux_internal_index, write_f32, write_f64, write_func_name, write_memory_init,
write_parameter_list, write_result_list, write_table_init, write_variable_list,
},
visit::{Transpiler, Writer},
};
/// Writes the Lua form of a constant initializer expression.
///
/// The first instruction in `code` that is a numeric constant or a global
/// read decides the output; every other instruction is skipped. When no such
/// instruction is present, a Lua `error(...)` call is written instead.
fn write_expression(code: &[Instruction], w: Writer) -> Result<()> {
    // FIXME: Badly generated WASM will produce the wrong constant.
    for inst in code {
        match *inst {
            Instruction::I32Const(v) => return write!(w, "{} ", v),
            Instruction::I64Const(v) => return write!(w, "{}LL ", v),
            Instruction::F32Const(bits) => return write_f32(f32::from_bits(bits), w),
            Instruction::F64Const(bits) => return write_f64(f64::from_bits(bits), w),
            Instruction::GetGlobal(i) => return write!(w, "GLOBAL_LIST[{}].value ", i),
            // Anything else carries no value of its own; keep scanning.
            _ => {}
        }
    }

    write!(w, "error(\"mundane expression\")")
}
/// Collapses runs of identical consecutive entries of a jump table.
///
/// Each returned tuple is `(first_index, last_index, value)`, where both
/// indices are inclusive positions in `list` and `value` is the entry shared
/// by that whole run. An empty `list` yields an empty vector.
fn condense_jump_table(list: &[u32]) -> Vec<(usize, usize, u32)> {
    let mut runs: Vec<(usize, usize, u32)> = Vec::new();

    for (position, &target) in list.iter().enumerate() {
        match runs.last_mut() {
            // Same target as the run in progress: stretch its upper bound.
            Some(run) if run.2 == target => run.1 = position,
            // First entry, or the target changed: open a new run.
            _ => runs.push((position, position, target)),
        }
    }

    runs
}
/// Mutable state threaded through every `Driver::visit` call while a single
/// function is being written.
#[derive(Default)]
struct Visitor {
    /// Labels of the blocks currently open, innermost last.
    label_list: Vec<usize>,
    /// The label number that the next `push_label` call will hand out.
    num_label: usize,
    /// Parameter count of the function being written.
    num_param: u32,
}

impl Visitor {
    /// Opens a new block scope and returns the fresh label assigned to it.
    fn push_label(&mut self) -> usize {
        let label = self.num_label;

        self.label_list.push(label);
        self.num_label += 1;

        label
    }

    /// Closes the innermost block scope.
    ///
    /// Panics if no scope is open.
    fn pop_label(&mut self) {
        let innermost = self.label_list.pop();

        innermost.unwrap();
    }

    /// Returns the label of the scope `up` levels out from the innermost one
    /// (`0` is the innermost scope itself).
    ///
    /// Panics if fewer than `up + 1` scopes are open.
    fn get_label(&self, up: u32) -> usize {
        let innermost = self.label_list.len() - 1;
        let position = innermost - up as usize;

        self.label_list[position]
    }
}
/// Implemented by every AST node that can write itself as Lua source.
trait Driver {
/// Writes this node to `w`, using `v` for the label and parameter state of
/// the function currently being written.
fn visit(&self, v: &mut Visitor, w: Writer) -> Result<()>;
}
impl Driver for Recall {
    /// Writes the `reg_N` name selected by `self.var`.
    fn visit(&self, _: &mut Visitor, w: Writer) -> Result<()> {
        let register = &self.var;

        write!(w, "reg_{} ", register)
    }
}
impl Driver for Select {
    /// Writes the selection as the parenthesised Lua expression
    /// `(<cond> and <a> or <b>)`.
    fn visit(&self, v: &mut Visitor, w: Writer) -> Result<()> {
        let (when_true, when_false) = (&self.a, &self.b);

        write!(w, "(")?;
        write_as_condition(&self.cond, v, w)?;

        write!(w, "and ")?;
        when_true.visit(v, w)?;

        write!(w, "or ")?;
        when_false.visit(v, w)?;

        write!(w, ")")
    }
}
/// Writes the Lua name of the WASM local with index `var`.
///
/// Indices below `v.num_param` are written as `param_<var>`; the remaining
/// ones are written as `loc_<n>`, where `n` is `var - v.num_param`.
fn write_variable(var: u32, v: &Visitor, w: Writer) -> Result<()> {
    match var.checked_sub(v.num_param) {
        Some(local) => write!(w, "loc_{} ", local),
        None => write!(w, "param_{} ", var),
    }
}
impl Driver for GetLocal {
    /// Writes a read of the local or parameter named by `self.var`.
    fn visit(&self, v: &mut Visitor, w: Writer) -> Result<()> {
        let index = self.var;

        write_variable(index, v, w)
    }
}
impl Driver for GetGlobal {
    /// Writes a read of the `value` field of the `GLOBAL_LIST` entry at
    /// `self.var`.
    fn visit(&self, _: &mut Visitor, w: Writer) -> Result<()> {
        let global = &self.var;

        write!(w, "GLOBAL_LIST[{}].value ", global)
    }
}
impl Driver for AnyLoad {
    /// Writes a call `load_<op>(memory_at_0, <pointer> + <offset>)`.
    fn visit(&self, v: &mut Visitor, w: Writer) -> Result<()> {
        let name = self.op.as_name();

        write!(w, "load_{}(memory_at_0, ", name)?;
        self.pointer.visit(v, w)?;
        write!(w, "+ {})", self.offset)
    }
}
impl Driver for MemorySize {
    /// Writes a read of the `min` field of the local `memory_at_<memory>`.
    fn visit(&self, _: &mut Visitor, w: Writer) -> Result<()> {
        let memory = &self.memory;

        write!(w, "memory_at_{}.min ", memory)
    }
}
impl Driver for MemoryGrow {
    /// Writes a call `rt.memory.grow(memory_at_<memory>, <value>)`.
    fn visit(&self, v: &mut Visitor, w: Writer) -> Result<()> {
        let memory = &self.memory;

        write!(w, "rt.memory.grow(memory_at_{}, ", memory)?;
        self.value.visit(v, w)?;
        write!(w, ")")
    }
}
impl Driver for Value {
    /// Writes the constant as a Lua literal.
    ///
    /// 64-bit integers get the `LL` suffix; floats are delegated to
    /// `write_f32` / `write_f64`.
    fn visit(&self, _: &mut Visitor, w: Writer) -> Result<()> {
        match *self {
            Self::I32(int) => write!(w, "{} ", int),
            Self::I64(int) => write!(w, "{}LL ", int),
            Self::F32(float) => write_f32(float, w),
            Self::F64(float) => write_f64(float, w),
        }
    }
}
impl Driver for AnyUnOp {
    /// Writes the unary operation as a call `<a>_<b>(<rhs>)`, where `(a, b)`
    /// is the pair returned by `self.op.as_name()`.
    fn visit(&self, v: &mut Visitor, w: Writer) -> Result<()> {
        let name = self.op.as_name();

        write!(w, "{}_{}(", name.0, name.1)?;
        self.rhs.visit(v, w)?;
        write!(w, ")")
    }
}
/// Writes a two-argument call `<op.0>_<op.1>(<lhs>, <rhs>)`.
fn write_bin_call(
    op: (&str, &str),
    lhs: &Expression,
    rhs: &Expression,
    v: &mut Visitor,
    w: Writer,
) -> Result<()> {
    let (head, tail) = op;

    write!(w, "{}_{}(", head, tail)?;
    lhs.visit(v, w)?;
    write!(w, ", ")?;
    rhs.visit(v, w)?;
    write!(w, ")")
}
impl Driver for AnyBinOp {
    /// Writes the binary operation.
    ///
    /// When `as_operator` yields an operator, the result is the
    /// parenthesised infix form `(<lhs> <op> <rhs>)`; otherwise the operation
    /// is written as a call through `write_bin_call`.
    fn visit(&self, v: &mut Visitor, w: Writer) -> Result<()> {
        match self.op.as_operator() {
            Some(symbol) => {
                write!(w, "(")?;
                self.lhs.visit(v, w)?;
                write!(w, "{} ", symbol)?;
                self.rhs.visit(v, w)?;
                write!(w, ")")
            }
            None => write_bin_call(self.op.as_name(), &self.lhs, &self.rhs, v, w),
        }
    }
}
/// Writes a comparison without any surrounding parentheses or integer
/// conversion.
///
/// Uses the infix form `<lhs> <op> <rhs>` when `as_operator` yields an
/// operator, and a `write_bin_call` call otherwise.
fn write_any_cmp(cmp: &AnyCmpOp, v: &mut Visitor, w: Writer) -> Result<()> {
    match cmp.op.as_operator() {
        Some(symbol) => {
            cmp.lhs.visit(v, w)?;
            write!(w, "{} ", symbol)?;
            cmp.rhs.visit(v, w)
        }
        None => write_bin_call(cmp.op.as_name(), &cmp.lhs, &cmp.rhs, v, w),
    }
}
impl Driver for AnyCmpOp {
    /// Writes the comparison as `(<comparison> and 1 or 0)`, turning the
    /// comparison result into the integer `1` or `0`.
    fn visit(&self, v: &mut Visitor, w: Writer) -> Result<()> {
        write!(w, "(")?;
        write_any_cmp(self, v, w)?;

        // Closes the parenthesis opened above.
        write!(w, "and 1 or 0)")
    }
}
/// Writes `data` in a form usable directly as a Lua condition.
///
/// A comparison is written bare, skipping the boolean-to-integer conversion
/// that its `Driver` implementation would add. Any other expression is
/// compared against zero with `~= 0`.
fn write_as_condition(data: &Expression, v: &mut Visitor, w: Writer) -> Result<()> {
    match data {
        Expression::AnyCmpOp(cmp) => write_any_cmp(cmp, v, w),
        other => {
            other.visit(v, w)?;
            write!(w, "~= 0 ")
        }
    }
}
/// Writes every expression in `list`, separated by `", "`.
fn write_expr_list(list: &[Expression], v: &mut Visitor, w: Writer) -> Result<()> {
    for (position, expr) in list.iter().enumerate() {
        // The separator goes in front of every element except the first.
        if position != 0 {
            write!(w, ", ")?;
        }

        expr.visit(v, w)?;
    }

    Ok(())
}
impl Driver for Expression {
    /// Forwards to the `Driver` implementation of the wrapped node.
    fn visit(&self, v: &mut Visitor, w: Writer) -> Result<()> {
        match self {
            Self::Recall(node) => node.visit(v, w),
            Self::Select(node) => node.visit(v, w),
            Self::GetLocal(node) => node.visit(v, w),
            Self::GetGlobal(node) => node.visit(v, w),
            Self::AnyLoad(node) => node.visit(v, w),
            Self::MemorySize(node) => node.visit(v, w),
            Self::MemoryGrow(node) => node.visit(v, w),
            Self::Value(node) => node.visit(v, w),
            Self::AnyUnOp(node) => node.visit(v, w),
            Self::AnyBinOp(node) => node.visit(v, w),
            Self::AnyCmpOp(node) => node.visit(v, w),
        }
    }
}
impl Driver for Memorize {
    /// Writes the assignment `reg_<var> = <value>`.
    fn visit(&self, v: &mut Visitor, w: Writer) -> Result<()> {
        let register = &self.var;

        write!(w, "reg_{} = ", register)?;
        self.value.visit(v, w)
    }
}
impl Driver for Forward {
    /// Writes the body followed by this block's `continue_at_<label>` label,
    /// so a branch targeting the block lands after its last statement.
    fn visit(&self, v: &mut Visitor, w: Writer) -> Result<()> {
        let label = v.push_label();

        for stat in self.body.iter() {
            stat.visit(v, w)?;
        }

        write!(w, "::continue_at_{}::", label)?;
        v.pop_label();

        Ok(())
    }
}
impl Driver for Backward {
    /// Writes this block's `continue_at_<label>` label followed by a
    /// `while true do ... break end` wrapper around the body, so a branch
    /// targeting the block lands in front of the loop.
    fn visit(&self, v: &mut Visitor, w: Writer) -> Result<()> {
        let label = v.push_label();

        write!(w, "::continue_at_{}::", label)?;
        write!(w, "while true do ")?;

        for stat in self.body.iter() {
            stat.visit(v, w)?;
        }

        // Falling off the end of the body leaves the loop.
        write!(w, "break ")?;
        write!(w, "end ")?;
        v.pop_label();

        Ok(())
    }
}
impl Driver for Else {
    /// Writes `else` followed by every statement of the body.
    fn visit(&self, v: &mut Visitor, w: Writer) -> Result<()> {
        write!(w, "else ")?;

        for stat in self.body.iter() {
            stat.visit(v, w)?;
        }

        Ok(())
    }
}
impl Driver for If {
    /// Writes `if <cond> then <truthy> [<falsey>] ::continue_at_<label>::end`.
    ///
    /// The label sits just before `end`, so a branch targeting this block
    /// from either arm lands at its end.
    fn visit(&self, v: &mut Visitor, w: Writer) -> Result<()> {
        let label = v.push_label();

        write!(w, "if ")?;
        write_as_condition(&self.cond, v, w)?;
        write!(w, "then ")?;

        for stat in self.truthy.iter() {
            stat.visit(v, w)?;
        }

        match &self.falsey {
            Some(otherwise) => otherwise.visit(v, w)?,
            None => {}
        }

        write!(w, "::continue_at_{}::", label)?;
        write!(w, "end ")?;
        v.pop_label();

        Ok(())
    }
}
/// Writes a `goto` to the label of the block `up` levels out from the
/// innermost open block.
fn write_br_at(up: u32, v: &Visitor, w: Writer) -> Result<()> {
    let target = v.get_label(up);

    write!(w, "goto continue_at_{} ", target)
}
impl Driver for Br {
    /// Writes an unconditional jump to the block `self.target` levels out.
    fn visit(&self, v: &mut Visitor, w: Writer) -> Result<()> {
        let depth = self.target;

        write_br_at(depth, v, w)
    }
}
impl Driver for BrIf {
    /// Writes `if <cond> then goto <label> end` for the block `self.target`
    /// levels out.
    fn visit(&self, v: &mut Visitor, w: Writer) -> Result<()> {
        let depth = self.target;

        write!(w, "if ")?;
        write_as_condition(&self.cond, v, w)?;
        write!(w, "then ")?;

        write_br_at(depth, v, w)?;
        write!(w, "end ")
    }
}
impl Driver for BrTable {
    /// Writes a branch table as an `if`/`elseif` chain over the `temp` local.
    ///
    /// The condition is assigned to `temp`. Each run of identical consecutive
    /// targets (see `condense_jump_table`) becomes a single equality or range
    /// test, and the default target becomes the final `else` arm.
    ///
    /// A table without entries opens no `if`, so only the unconditional jump
    /// to the default target is written. Writing the closing `end` in that
    /// case would leave it unmatched in the generated Lua.
    fn visit(&self, v: &mut Visitor, w: Writer) -> Result<()> {
        write!(w, "temp = ")?;
        self.cond.visit(v, w)?;
        write!(w, " ")?;

        let ranges = condense_jump_table(&self.data.table);

        if ranges.is_empty() {
            // The condition is still written above so whatever evaluating it
            // does is kept; every index goes to the default target.
            return write_br_at(self.data.default, v, w);
        }

        for (start, end, dest) in ranges {
            if start == end {
                write!(w, "if temp == {} then ", start)?;
            } else {
                write!(w, "if temp >= {} and temp <= {} then ", start, end)?;
            }

            write_br_at(dest, v, w)?;

            // No trailing space: this fuses with the next `if` into `elseif`,
            // or stands alone as the `else` of the default arm.
            write!(w, "else")?;
        }

        write!(w, " ")?;
        write_br_at(self.data.default, v, w)?;
        write!(w, "end ")
    }
}
impl Driver for Return {
    /// Writes `do return <values> end`, with the values separated by `", "`.
    fn visit(&self, v: &mut Visitor, w: Writer) -> Result<()> {
        write!(w, "do return ")?;

        for (position, value) in self.list.iter().enumerate() {
            if position > 0 {
                write!(w, ", ")?;
            }

            value.visit(v, w)?;
        }

        write!(w, "end ")
    }
}
impl Driver for Call {
    /// Writes the result list produced by `write_result_list`, followed by
    /// the call `FUNC_LIST[<func>](<params>)`.
    fn visit(&self, v: &mut Visitor, w: Writer) -> Result<()> {
        let results = self.result.clone();

        write_result_list(results, w)?;
        write!(w, "FUNC_LIST[{}](", self.func)?;
        write_expr_list(&self.param_list, v, w)?;
        write!(w, ")")
    }
}
impl Driver for CallIndirect {
    /// Writes the result list produced by `write_result_list`, followed by
    /// the call `TABLE_LIST[<table>].data[<index>](<params>)`.
    fn visit(&self, v: &mut Visitor, w: Writer) -> Result<()> {
        let results = self.result.clone();

        write_result_list(results, w)?;

        write!(w, "TABLE_LIST[{}].data[", self.table)?;
        self.index.visit(v, w)?;
        write!(w, "](")?;

        write_expr_list(&self.param_list, v, w)?;
        write!(w, ")")
    }
}
impl Driver for SetLocal {
    /// Writes an assignment of `self.value` to the local or parameter named
    /// by `self.var`.
    fn visit(&self, v: &mut Visitor, w: Writer) -> Result<()> {
        let index = self.var;

        write_variable(index, v, w)?;
        write!(w, "= ")?;
        self.value.visit(v, w)
    }
}
impl Driver for SetGlobal {
    /// Writes the assignment `GLOBAL_LIST[<var>].value = <value>`.
    fn visit(&self, v: &mut Visitor, w: Writer) -> Result<()> {
        let global = &self.var;

        write!(w, "GLOBAL_LIST[{}].value = ", global)?;
        self.value.visit(v, w)
    }
}
impl Driver for AnyStore {
    /// Writes a call `store_<op>(memory_at_0, <pointer> + <offset>, <value>)`.
    fn visit(&self, v: &mut Visitor, w: Writer) -> Result<()> {
        let name = self.op.as_name();

        write!(w, "store_{}(memory_at_0, ", name)?;
        self.pointer.visit(v, w)?;
        write!(w, "+ {}, ", self.offset)?;

        self.value.visit(v, w)?;
        write!(w, ")")
    }
}
impl Driver for Statement {
    /// Forwards to the `Driver` implementation of the wrapped node.
    ///
    /// `Unreachable` has no node of its own and is written as a Lua `error`
    /// call.
    fn visit(&self, v: &mut Visitor, w: Writer) -> Result<()> {
        match self {
            Self::Unreachable => write!(w, "error(\"out of code bounds\")"),
            Self::Memorize(node) => node.visit(v, w),
            Self::Forward(node) => node.visit(v, w),
            Self::Backward(node) => node.visit(v, w),
            Self::If(node) => node.visit(v, w),
            Self::Br(node) => node.visit(v, w),
            Self::BrIf(node) => node.visit(v, w),
            Self::BrTable(node) => node.visit(v, w),
            Self::Return(node) => node.visit(v, w),
            Self::Call(node) => node.visit(v, w),
            Self::CallIndirect(node) => node.visit(v, w),
            Self::SetLocal(node) => node.visit(v, w),
            Self::SetGlobal(node) => node.visit(v, w),
            Self::AnyStore(node) => node.visit(v, w),
        }
    }
}
impl Driver for Function {
    /// Writes a whole function: parameter list, a `memory_at_<n>` local for
    /// each index reported by `memory::visit`, the `temp` local, the variable
    /// list, the body and the closing `end`.
    fn visit(&self, v: &mut Visitor, w: Writer) -> Result<()> {
        write_parameter_list(self, w)?;

        for index in memory::visit(self) {
            write!(w, "local memory_at_{0} = MEMORY_LIST[{0}]", index)?;
        }

        write!(w, "local temp ")?;
        write_variable_list(self, w)?;

        // `write_variable` reads this to tell parameters from locals.
        v.num_param = self.num_param;

        self.body.visit(v, w)?;
        write!(w, "end ")
    }
}
/// Transpiler that writes a WASM module as LuaJIT source code.
pub struct LuaJIT<'a> {
// The module being transpiled.
wasm: &'a Module,
// Arity information built from `wasm` by `Arities::new`.
arity: Arities,
}
impl<'a> LuaJIT<'a> {
/// Writes one assignment per import accepted by `cond`.
///
/// Each assignment has the shape
/// `<UPPER>[<i>] = wasm.<module>.<lower>.<field>`, where `<UPPER>` is `lower`
/// in upper case and `<i>` counts only the accepted imports, starting at
/// zero. Nothing is written when the module has no import section.
fn gen_import_of<T>(&self, w: Writer, lower: &str, cond: T) -> Result<()>
where
    T: Fn(&External) -> bool,
{
    let section = match self.wasm.import_section() {
        None => return Ok(()),
        Some(section) => section,
    };
    let upper = lower.to_uppercase();
    let accepted = section
        .entries()
        .iter()
        .filter(|entry| cond(entry.external()));

    for (position, entry) in accepted.enumerate() {
        let field = entry.field();
        let module = entry.module();

        write!(
            w,
            "{}[{}] = wasm.{}.{}.{} ",
            upper, position, module, lower, field
        )?;
    }

    Ok(())
}
/// Writes the Lua table field `<lower> = { ... },` listing every export
/// accepted by `cond`.
///
/// Each accepted export contributes `<field> = <UPPER>[<index>],`, where
/// `<UPPER>` is `lower` in upper case. Nothing is written when the module has
/// no export section.
fn gen_export_of<T>(&self, w: Writer, lower: &str, cond: T) -> Result<()>
where
    T: Fn(&Internal) -> bool,
{
    let section = match self.wasm.export_section() {
        None => return Ok(()),
        Some(section) => section,
    };
    let upper = lower.to_uppercase();

    write!(w, "{} = {{", lower)?;

    for entry in section.entries() {
        if !cond(entry.internal()) {
            continue;
        }

        let field = entry.field();
        let index = aux_internal_index(*entry.internal());

        write!(w, "{} = {}[{}],", field, upper, index)?;
    }

    write!(w, "}},")
}
/// Writes the import assignments for functions, tables, memories and
/// globals, in that order.
fn gen_import_list(&self, w: Writer) -> Result<()> {
    self.gen_import_of(w, "func_list", |ext| matches!(ext, External::Function(_)))?;
    self.gen_import_of(w, "table_list", |ext| matches!(ext, External::Table(_)))?;
    self.gen_import_of(w, "memory_list", |ext| matches!(ext, External::Memory(_)))?;
    self.gen_import_of(w, "global_list", |ext| matches!(ext, External::Global(_)))?;

    Ok(())
}
/// Writes the export tables for functions, tables, memories and globals, in
/// that order.
fn gen_export_list(&self, w: Writer) -> Result<()> {
    self.gen_export_of(w, "func_list", |int| matches!(int, Internal::Function(_)))?;
    self.gen_export_of(w, "table_list", |int| matches!(int, Internal::Table(_)))?;
    self.gen_export_of(w, "memory_list", |int| matches!(int, Internal::Memory(_)))?;
    self.gen_export_of(w, "global_list", |int| matches!(int, Internal::Global(_)))?;

    Ok(())
}
/// Writes a `TABLE_LIST[<index>] =` initializer for every table defined by
/// the module.
///
/// Indices start after the imported tables. Nothing is written when the
/// module has no table section.
fn gen_table_list(&self, w: Writer) -> Result<()> {
    let section = match self.wasm.table_section() {
        None => return Ok(()),
        Some(section) => section,
    };
    let first = self.wasm.import_count(ImportCountType::Table);

    for (index, table) in (first..).zip(section.entries()) {
        write!(w, "TABLE_LIST[{}] =", index)?;
        write_table_init(table.limits(), w)?;
    }

    Ok(())
}
/// Writes a `MEMORY_LIST[<index>] =` initializer for every memory defined by
/// the module.
///
/// Indices start after the imported memories. Nothing is written when the
/// module has no memory section.
fn gen_memory_list(&self, w: Writer) -> Result<()> {
    let section = match self.wasm.memory_section() {
        None => return Ok(()),
        Some(section) => section,
    };
    let first = self.wasm.import_count(ImportCountType::Memory);

    for (index, memory) in (first..).zip(section.entries()) {
        write!(w, "MEMORY_LIST[{}] =", index)?;
        write_memory_init(memory.limits(), w)?;
    }

    Ok(())
}
/// Writes a `GLOBAL_LIST[<index>] = { value = <init> }` assignment for every
/// global defined by the module.
///
/// Indices start after the imported globals. Nothing is written when the
/// module has no global section.
fn gen_global_list(&self, w: Writer) -> Result<()> {
    let section = match self.wasm.global_section() {
        None => return Ok(()),
        Some(section) => section,
    };
    let first = self.wasm.import_count(ImportCountType::Global);

    for (index, global) in (first..).zip(section.entries()) {
        write!(w, "GLOBAL_LIST[{}] = {{ value =", index)?;
        write_expression(global.init_expr().code(), w)?;
        write!(w, "}}")?;
    }

    Ok(())
}
/// Writes one `do ... end` block per element segment that copies the
/// segment's functions into its table with `table.move`.
///
/// Nothing is written when the module has no element section.
///
/// Panics if a segment has no offset expression.
fn gen_element_list(&self, w: Writer) -> Result<()> {
    let section = match self.wasm.elements_section() {
        None => return Ok(()),
        Some(section) => section,
    };

    for segment in section.entries() {
        write!(w, "do ")?;
        write!(w, "local target = TABLE_LIST[{}].data ", segment.index())?;

        write!(w, "local offset =")?;
        write_expression(segment.offset().as_ref().unwrap().code(), w)?;

        write!(w, "local data = {{")?;
        for member in segment.members() {
            write!(w, "FUNC_LIST[{}],", member)?;
        }
        write!(w, "}}")?;

        write!(w, "table.move(data, 1, #data, offset, target)")?;
        write!(w, "end ")?;
    }

    Ok(())
}
/// Writes one `do ... end` block per data segment that passes the segment's
/// bytes to `rt.memory.init`.
///
/// The bytes are written as a Lua string made of `\xHH` escapes. Nothing is
/// written when the module has no data section.
///
/// Panics if a segment has no offset expression.
fn gen_data_list(&self, w: Writer) -> Result<()> {
    let section = match self.wasm.data_section() {
        None => return Ok(()),
        Some(section) => section,
    };

    for segment in section.entries() {
        write!(w, "do ")?;
        write!(w, "local target = MEMORY_LIST[{}]", segment.index())?;

        write!(w, "local offset =")?;
        write_expression(segment.offset().as_ref().unwrap().code(), w)?;

        write!(w, "local data = \"")?;
        for byte in segment.value() {
            write!(w, "\\x{:02X}", byte)?;
        }
        write!(w, "\"")?;

        write!(w, "rt.memory.init(target, offset, data)")?;
        write!(w, "end ")?;
    }

    Ok(())
}
/// Writes the tail of the generated chunk.
///
/// That is the `run_init_code` function (tables, memories, globals, element
/// segments, data segments), followed by the returned `function(wasm)`. The
/// returned function binds the imports, runs the init code, calls the start
/// function if the module has one, and returns the export table.
fn gen_start_point(&self, w: Writer) -> Result<()> {
    // Module-level initialization, wrapped in its own Lua function.
    write!(w, "local function run_init_code()")?;
    self.gen_table_list(w)?;
    self.gen_memory_list(w)?;
    self.gen_global_list(w)?;
    self.gen_element_list(w)?;
    self.gen_data_list(w)?;
    write!(w, "end ")?;

    // The function handed back to whoever loads the chunk.
    write!(w, "return function(wasm)")?;
    self.gen_import_list(w)?;
    write!(w, "run_init_code()")?;

    match self.wasm.start_section() {
        Some(start) => write!(w, "FUNC_LIST[{}]()", start)?,
        None => {}
    }

    write!(w, "return {{")?;
    self.gen_export_list(w)?;
    write!(w, "}} end ")
}
/// Writes a `local <a>_<b> = rt.<a>.<b>` line for every distinct `(a, b)`
/// pair that `localize::visit` reports across `func_list`, in sorted order.
fn gen_localize(func_list: &[Function], w: Writer) -> Result<()> {
    let mut names = BTreeSet::new();

    func_list
        .iter()
        .for_each(|func| names.extend(localize::visit(func)));

    for (a, b) in names {
        write!(w, "local {0}_{1} = rt.{0}.{1} ", a, b)?;
    }

    Ok(())
}
// FIXME: Make `pub` only for fuzzing.
/// Builds the AST of every function index in `0..self.arity.len_in()`, in
/// index order.
#[must_use]
pub fn build_func_list(&self) -> Vec<Function> {
    let mut list = Vec::new();

    for index in 0..self.arity.len_in() {
        // Each function gets a fresh builder.
        let builder = Builder::new(self.wasm, &self.arity);

        list.push(builder.consume(index));
    }

    list
}
/// Writes the name and the body of every function in `func_list`.
///
/// # Errors
/// Returns `Err` if writing to `Writer` failed.
///
/// # Panics
/// If the number of functions overflows 32 bits.
pub fn gen_func_list(&self, func_list: &[Function], w: Writer) -> Result<()> {
    let offset = self.arity.len_ex();

    for (position, func) in func_list.iter().enumerate() {
        write_func_name(
            self.wasm,
            position.try_into().unwrap(),
            offset.try_into().unwrap(),
            w,
        )?;

        // Every function starts from a clean label and parameter state.
        func.visit(&mut Visitor::default(), w)?;
    }

    Ok(())
}
}
/// Writes `local <name> = table_new(<array>, <hash>)` for a list holding
/// `len` entries.
///
/// An empty list requests `(0, 0)`; otherwise one slot is requested in the
/// hash part and `len - 1` in the array part.
fn write_list(name: &str, len: usize, w: Writer) -> Result<()> {
    let (array, hash) = if len == 0 { (0, 0) } else { (len - 1, 1) };

    write!(w, "local {} = table_new({}, {})", name, array, hash)
}
impl<'a> Transpiler<'a> for LuaJIT<'a> {
    /// Creates a transpiler for `wasm`, computing its arities up front.
    fn new(wasm: &'a Module) -> Self {
        Self {
            wasm,
            arity: Arities::new(wasm),
        }
    }

    /// Writes the complete Lua chunk for the module.
    ///
    /// The chunk consists of the runtime `require`, the localized runtime
    /// functions, the four index-space lists, every function, and finally the
    /// start point.
    fn transpile(&self, w: Writer) -> Result<()> {
        write!(w, "local rt = require(\"luajit\")")?;

        let func_list = self.build_func_list();

        Self::gen_localize(&func_list, w)?;
        write!(w, "local table_new = require(\"table.new\")")?;

        let spaces = [
            ("FUNC_LIST", self.wasm.functions_space()),
            ("TABLE_LIST", self.wasm.table_space()),
            ("MEMORY_LIST", self.wasm.memory_space()),
            ("GLOBAL_LIST", self.wasm.globals_space()),
        ];

        for &(name, len) in spaces.iter() {
            write_list(name, len, w)?;
        }

        self.gen_func_list(&func_list, w)?;
        self.gen_start_point(w)
    }
}