You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
 
 
 

467 lines
16 KiB

//! A filetest-lookalike test suite using Cranelift tooling but built on
//! Wasmtime's code generator.
//!
//! This test will read the `tests/disas/*` directory and interpret all files in
//! that directory as a test. Each test must be in the wasm text format and
//! start with directives that look like:
//!
//! ```wasm
//! ;;! target = "x86_64"
//! ;;! compile = true
//!
//! (module
//! ;; ...
//! )
//! ```
//!
//! Tests must configure a `target` and then can optionally specify a kind of
//! test:
//!
//! * No specifier - the output CLIF from translation is inspected.
//! * `optimize = true` - CLIF is emitted, then optimized, then inspected.
//! * `compile = true` - backends are run to produce machine code and that's inspected.
//!
//! Tests may also have a `flags` directive which are CLI flags to Wasmtime
//! itself:
//!
//! ```wasm
//! ;;! target = "x86_64"
//! ;;! flags = "-O opt-level=s"
//!
//! (module
//! ;; ...
//! )
//! ```
//!
//! Flags are parsed by the `wasmtime_cli_flags` crate to build a `Config`.
//!
//! Configuration of tests is prefixed with `;;!` comments and must be present
//! at the start of the file. These comments are then parsed as TOML and
//! deserialized into `TestConfig` in this crate.
use anyhow::{bail, Context, Result};
use clap::Parser;
use cranelift_codegen::ir::{Function, UserExternalName, UserFuncName};
use cranelift_codegen::isa::{lookup_by_name, TargetIsa};
use cranelift_codegen::settings::{Configurable, Flags, SetError};
use libtest_mimic::{Arguments, Trial};
use serde::de::DeserializeOwned;
use serde_derive::Deserialize;
use similar::TextDiff;
use std::fmt::Write;
use std::path::{Path, PathBuf};
use std::sync::Arc;
use tempfile::TempDir;
use wasmtime::{Engine, OptLevel, Strategy};
use wasmtime_cli_flags::CommonOptions;
fn main() -> Result<()> {
if cfg!(miri) {
return Ok(());
}
let mut tests = Vec::new();
find_tests("./tests/disas".as_ref(), &mut tests)?;
let mut trials = Vec::new();
for test in tests {
trials.push(Trial::test(test.to_str().unwrap().to_string(), move || {
run_test(&test)
.with_context(|| format!("failed to run tests {test:?}"))
.map_err(|e| format!("{e:?}").into())
}))
}
// These tests have some long names so use the "quiet" output by default.
let mut arguments = Arguments::parse();
if arguments.format.is_none() {
arguments.quiet = true;
}
libtest_mimic::run(&arguments, trials).exit()
}
fn find_tests(path: &Path, dst: &mut Vec<PathBuf>) -> Result<()> {
for file in path
.read_dir()
.with_context(|| format!("failed to read {path:?}"))?
{
let file = file.context("failed to read directory entry")?;
let path = file.path();
if file.file_type()?.is_dir() {
find_tests(&path, dst)?;
} else if path.extension().and_then(|s| s.to_str()) == Some("wat") {
dst.push(path);
}
}
Ok(())
}
fn run_test(path: &Path) -> Result<()> {
let mut test = Test::new(path)?;
let output = test.compile()?;
let isa = test.build_target_isa()?;
assert_output(&test.path, &test.contents, &*isa, test.config.test, output)?;
Ok(())
}
#[derive(Debug, Deserialize)]
#[serde(deny_unknown_fields)]
struct TestConfig {
target: String,
#[serde(default)]
test: TestKind,
flags: Option<TestConfigFlags>,
}
#[derive(Debug, Deserialize)]
#[serde(untagged)]
enum TestConfigFlags {
SpaceSeparated(String),
List(Vec<String>),
}
struct Test {
path: PathBuf,
contents: String,
opts: CommonOptions,
config: TestConfig,
}
/// Which kind of test is being performed.
#[derive(Default, Debug, Deserialize)]
#[serde(rename_all = "lowercase")]
enum TestKind {
/// Test the CLIF output, raw from translation.
#[default]
Clif,
/// Compile output to machine code.
Compile,
/// Test the CLIF output, optimized.
Optimize,
/// Alias for "compile" plus `-C compiler=winch`
Winch,
}
impl Test {
/// Parse the contents of `path` looking for directive-based comments
/// starting with `;;!` near the top of the file.
fn new(path: &Path) -> Result<Test> {
let contents =
std::fs::read_to_string(path).with_context(|| format!("failed to read {path:?}"))?;
let config: TestConfig = Test::parse_test_config(&contents)
.context("failed to parse test configuration as TOML")?;
let mut flags = vec!["wasmtime"];
match &config.flags {
Some(TestConfigFlags::SpaceSeparated(s)) => flags.extend(s.split_whitespace()),
Some(TestConfigFlags::List(s)) => flags.extend(s.iter().map(|s| s.as_str())),
None => {}
}
let opts = wasmtime_cli_flags::CommonOptions::try_parse_from(&flags)?;
Ok(Test {
path: path.to_path_buf(),
config,
opts,
contents,
})
}
/// Parse test configuration from the specified test, comments starting with
/// `;;!`.
fn parse_test_config<T>(wat: &str) -> Result<T>
where
T: DeserializeOwned,
{
// The test config source is the leading lines of the WAT file that are
// prefixed with `;;!`.
let config_lines: Vec<_> = wat
.lines()
.take_while(|l| l.starts_with(";;!"))
.map(|l| &l[3..])
.collect();
let config_text = config_lines.join("\n");
toml::from_str(&config_text).context("failed to parse the test configuration")
}
/// Generates CLIF for all the wasm functions in this test.
fn compile(&mut self) -> Result<CompileOutput> {
// Use wasmtime::Config with its `emit_clif` option to get Wasmtime's
// code generator to jettison CLIF out the back.
let tempdir = TempDir::new().context("failed to make a tempdir")?;
let mut config = self.opts.config(Some(&self.config.target), None)?;
match self.config.test {
TestKind::Clif | TestKind::Optimize => {
config.emit_clif(tempdir.path());
}
TestKind::Compile => {}
TestKind::Winch => {
config.strategy(Strategy::Winch);
}
}
let engine = Engine::new(&config).context("failed to create engine")?;
let module = wat::parse_file(&self.path)?;
let elf = engine
.precompile_module(&module)
.context("failed to compile module")?;
match self.config.test {
TestKind::Clif | TestKind::Optimize => {
// Read all `*.clif` files from the clif directory that the
// compilation process just emitted.
let mut clifs = Vec::new();
for entry in tempdir
.path()
.read_dir()
.context("failed to read tempdir")?
{
let entry = entry.context("failed to iterate over tempdir")?;
let path = entry.path();
let clif = std::fs::read_to_string(&path)
.with_context(|| format!("failed to read clif file {path:?}"))?;
clifs.push(clif);
}
// Parse the text format CLIF which is emitted by Wasmtime back
// into in-memory data structures.
let mut functions = clifs
.iter()
.map(|clif| {
let mut funcs = cranelift_reader::parse_functions(clif)?;
if funcs.len() != 1 {
bail!("expected one function per clif");
}
Ok(funcs.remove(0))
})
.collect::<Result<Vec<_>>>()?;
functions.sort_by_key(|f| match f.name {
UserFuncName::User(UserExternalName { namespace, index }) => (namespace, index),
UserFuncName::Testcase(_) => unreachable!(),
});
Ok(CompileOutput::Clif(functions))
}
TestKind::Compile | TestKind::Winch => Ok(CompileOutput::Elf(elf)),
}
}
/// Use the test configuration present with CLI flags to build a
/// `TargetIsa` to compile/optimize the CLIF.
fn build_target_isa(&self) -> Result<Arc<dyn TargetIsa>> {
let mut builder = lookup_by_name(&self.config.target)?;
let mut flags = cranelift_codegen::settings::builder();
let opt_level = match self.opts.opts.opt_level {
None | Some(OptLevel::Speed) => "speed",
Some(OptLevel::SpeedAndSize) => "speed_and_size",
Some(OptLevel::None) => "none",
_ => unreachable!(),
};
flags.set("opt_level", opt_level)?;
for (key, val) in self.opts.codegen.cranelift.iter() {
let key = &key.replace("-", "_");
let target_res = match val {
Some(val) => builder.set(key, val),
None => builder.enable(key),
};
match target_res {
Ok(()) => continue,
Err(SetError::BadName(_)) => {}
Err(e) => bail!(e),
}
match val {
Some(val) => flags.set(key, val)?,
None => flags.enable(key)?,
}
}
let isa = builder.finish(Flags::new(flags))?;
Ok(isa)
}
}
enum CompileOutput {
Clif(Vec<Function>),
Elf(Vec<u8>),
}
/// Assert that `wat` contains the test expectations necessary for `funcs`.
fn assert_output(
path: &Path,
wat: &str,
isa: &dyn TargetIsa,
kind: TestKind,
output: CompileOutput,
) -> Result<()> {
let mut actual = String::new();
match output {
CompileOutput::Clif(funcs) => {
for mut func in funcs {
match kind {
TestKind::Compile | TestKind::Winch => unreachable!(),
TestKind::Optimize => {
let mut ctx = cranelift_codegen::Context::for_function(func.clone());
ctx.optimize(isa, &mut Default::default())
.map_err(|e| codegen_error_to_anyhow_error(&ctx.func, e))?;
ctx.func.dfg.resolve_all_aliases();
writeln!(&mut actual, "{}", ctx.func.display()).unwrap();
}
TestKind::Clif => {
func.dfg.resolve_all_aliases();
writeln!(&mut actual, "{}", func.display()).unwrap();
}
}
}
}
CompileOutput::Elf(bytes) => {
let disas = isa.to_capstone()?;
disas_elf(&disas, &mut actual, &bytes)?;
}
}
let actual = actual.trim();
assert_or_bless_output(path, wat, actual)
}
fn disas_elf(disas: &capstone::Capstone, result: &mut String, elf: &[u8]) -> Result<()> {
use capstone::InsnGroupType::{CS_GRP_JUMP, CS_GRP_RET};
use object::{Endianness, Object, ObjectSection, ObjectSymbol};
let elf = object::read::elf::ElfFile64::<Endianness>::parse(elf)?;
let text = elf.section_by_name(".text").unwrap();
let text = text.data()?;
let mut first = true;
for sym in elf.symbols() {
let name = match sym.name() {
Ok(name) => name,
Err(_) => continue,
};
if !name.contains("wasm") || !name.contains("function") {
continue;
}
let bytes = &text[sym.address() as usize..][..sym.size() as usize];
if first {
first = false;
} else {
result.push_str("\n");
}
writeln!(result, "{name}:")?;
// By default don't write all the offsets of all the instructions. That
// means that small changes in the instruction sequence cause large
// diffs which aren't always the most readable. As a rough balance,
// print offset of instructions-after-jumps and anything-after-ret as
// that's a decent-enough heuristic for jump targets.
let mut prev_jump = false;
let mut write_offsets = false;
for inst in disas.disasm_all(bytes, sym.address())?.iter() {
let detail = disas.insn_detail(&inst).ok();
let detail = detail.as_ref();
let is_jump = detail
.map(|d| {
d.groups()
.iter()
.find(|g| g.0 as u32 == CS_GRP_JUMP)
.is_some()
})
.unwrap_or(false);
if write_offsets || (prev_jump && !is_jump) {
write!(result, "{:>4x}: ", inst.address())?;
} else {
write!(result, " ")?;
}
match (inst.mnemonic(), inst.op_str()) {
(Some(i), Some(o)) => {
if o.is_empty() {
writeln!(result, "{i}")?;
} else {
writeln!(result, "{i:7} {o}")?;
}
}
(Some(i), None) => writeln!(result, "{i}")?,
_ => unreachable!(),
}
prev_jump = is_jump;
// Flip write_offsets to true once we've seen a `ret`, as
// instructions that follow the return are often related to trap
// tables.
write_offsets = write_offsets
|| detail
.map(|d| {
d.groups()
.iter()
.find(|g| g.0 as u32 == CS_GRP_RET)
.is_some()
})
.unwrap_or(false);
}
}
Ok(())
}
fn assert_or_bless_output(path: &Path, wat: &str, actual: &str) -> Result<()> {
log::debug!("=== actual ===\n{actual}");
// The test's expectation is the final comment.
let mut expected_lines: Vec<_> = wat
.lines()
.rev()
.map_while(|l| l.strip_prefix(";;"))
.map(|l| l.strip_prefix(" ").unwrap_or(l))
.collect();
expected_lines.reverse();
let expected = expected_lines.join("\n");
let expected = expected.trim();
log::debug!("=== expected ===\n{expected}");
if actual == expected {
return Ok(());
}
if std::env::var("WASMTIME_TEST_BLESS").unwrap_or_default() == "1" {
let old_expectation_line_count = wat
.lines()
.rev()
.take_while(|l| l.starts_with(";;"))
.count();
let old_wat_line_count = wat.lines().count();
let new_wat_lines: Vec<_> = wat
.lines()
.take(old_wat_line_count - old_expectation_line_count)
.map(|l| l.to_string())
.chain(actual.lines().map(|l| {
if l.is_empty() {
";;".to_string()
} else {
format!(";; {l}")
}
}))
.collect();
let mut new_wat = new_wat_lines.join("\n");
new_wat.push('\n');
std::fs::write(path, new_wat)
.with_context(|| format!("failed to write file: {}", path.display()))?;
return Ok(());
}
bail!(
"Did not get the expected CLIF translation:\n\n\
{}\n\n\
Note: You can re-run with the `WASMTIME_TEST_BLESS=1` environment\n\
variable set to update test expectations.",
TextDiff::from_lines(expected, actual)
.unified_diff()
.header("expected", "actual")
)
}
fn codegen_error_to_anyhow_error(
func: &cranelift_codegen::ir::Function,
err: cranelift_codegen::CodegenError,
) -> anyhow::Error {
let s = cranelift_codegen::print_errors::pretty_error(func, err);
anyhow::anyhow!("{}", s)
}