cranelift/tests/disas.rs


								//! A filetest-lookalike test suite using Cranelift tooling but built on

								//! Wasmtime's code generator.

								//!

								//! This test will read the `tests/disas/*` directory and interpret all files in

								//! that directory as a test. Each test must be in the wasm text format and

								//! start with directives that look like:

								//!

								//! ```wasm

								//! ;;! target = "x86_64"

								//! ;;! compile = true

								//!

								//! (module

								//!     ;; ...

								//! )

								//! ```

								//!

								//! Tests must configure a `target` and then can optionally specify a kind of

								//! test:

								//!

								//! * No specifier - the output CLIF from translation is inspected.

								//! * `optimize = true` - CLIF is emitted, then optimized, then inspected.

								//! * `compile = true` - backends are run to produce machine code and that's inspected.

								//!

								//! Tests may also have a `flags` directive which are CLI flags to Wasmtime

								//! itself:

								//!

								//! ```wasm

								//! ;;! target = "x86_64"

								//! ;;! flags = "-O opt-level=s"

								//!

								//! (module

								//!     ;; ...

								//! )

								//! ```

								//!

								//! Flags are parsed by the `wasmtime_cli_flags` crate to build a `Config`.

								//!

								//! Configuration of tests is prefixed with `;;!` comments and must be present

								//! at the start of the file. These comments are then parsed as TOML and

								//! deserialized into `TestConfig` in this crate.


								use anyhow::{bail, Context, Result};

								use clap::Parser;

								use cranelift_codegen::ir::{Function, UserExternalName, UserFuncName};

								use cranelift_codegen::isa::{lookup_by_name, TargetIsa};

								use cranelift_codegen::settings::{Configurable, Flags, SetError};

								use libtest_mimic::{Arguments, Trial};

								use serde::de::DeserializeOwned;

								use serde_derive::Deserialize;

								use similar::TextDiff;

								use std::fmt::Write;

								use std::path::{Path, PathBuf};

								use std::sync::Arc;

								use tempfile::TempDir;

								use wasmtime::{Engine, OptLevel, Strategy};

								use wasmtime_cli_flags::CommonOptions;


								fn main() -> Result<()> {

								    if cfg!(miri) {

								        return Ok(());

								    }


								    let mut tests = Vec::new();

								    find_tests("./tests/disas".as_ref(), &mut tests)?;


								    let mut trials = Vec::new();

								    for test in tests {

								        trials.push(Trial::test(test.to_str().unwrap().to_string(), move || {

								            run_test(&test)

								                .with_context(|| format!("failed to run tests {test:?}"))

								                .map_err(|e| format!("{e:?}").into())

								        }))

								    }


								    // These tests have some long names so use the "quiet" output by default.

								    let mut arguments = Arguments::parse();

								    if arguments.format.is_none() {

								        arguments.quiet = true;

								    }

								    libtest_mimic::run(&arguments, trials).exit()

								}


								fn find_tests(path: &Path, dst: &mut Vec<PathBuf>) -> Result<()> {

								    for file in path

								        .read_dir()

								        .with_context(|| format!("failed to read {path:?}"))?

								    {

								        let file = file.context("failed to read directory entry")?;

								        let path = file.path();

								        if file.file_type()?.is_dir() {

								            find_tests(&path, dst)?;

								        } else if path.extension().and_then(|s| s.to_str()) == Some("wat") {

								            dst.push(path);

								        }

								    }

								    Ok(())

								}


								fn run_test(path: &Path) -> Result<()> {

								    let mut test = Test::new(path)?;

								    let output = test.compile()?;

								    let isa = test.build_target_isa()?;


								    assert_output(&test.path, &test.contents, &*isa, test.config.test, output)?;


								    Ok(())

								}

								#[derive(Debug, Deserialize)]

								#[serde(deny_unknown_fields)]

								struct TestConfig {

								    target: String,

								    #[serde(default)]

								    test: TestKind,

								    flags: Option<TestConfigFlags>,

								}


								#[derive(Debug, Deserialize)]

								#[serde(untagged)]

								enum TestConfigFlags {

								    SpaceSeparated(String),

								    List(Vec<String>),

								}


								struct Test {

								    path: PathBuf,

								    contents: String,

								    opts: CommonOptions,

								    config: TestConfig,

								}


								/// Which kind of test is being performed.

								#[derive(Default, Debug, Deserialize)]

								#[serde(rename_all = "lowercase")]

								enum TestKind {

								    /// Test the CLIF output, raw from translation.

								    #[default]

								    Clif,

								    /// Compile output to machine code.

								    Compile,

								    /// Test the CLIF output, optimized.

								    Optimize,

								    /// Alias for "compile" plus `-C compiler=winch`

								    Winch,

								}


								impl Test {

								    /// Parse the contents of `path` looking for directive-based comments

								    /// starting with `;;!` near the top of the file.

								    fn new(path: &Path) -> Result<Test> {

								        let contents =

								            std::fs::read_to_string(path).with_context(|| format!("failed to read {path:?}"))?;

								        let config: TestConfig = Test::parse_test_config(&contents)

								            .context("failed to parse test configuration as TOML")?;

								        let mut flags = vec!["wasmtime"];

								        match &config.flags {

								            Some(TestConfigFlags::SpaceSeparated(s)) => flags.extend(s.split_whitespace()),

								            Some(TestConfigFlags::List(s)) => flags.extend(s.iter().map(|s| s.as_str())),

								            None => {}

								        }

								        let opts = wasmtime_cli_flags::CommonOptions::try_parse_from(&flags)?;


								        Ok(Test {

								            path: path.to_path_buf(),

								            config,

								            opts,

								            contents,

								        })

								    }


								    /// Parse test configuration from the specified test, comments starting with

								    /// `;;!`.

								    fn parse_test_config<T>(wat: &str) -> Result<T>

								    where

								        T: DeserializeOwned,

								    {

								        // The test config source is the leading lines of the WAT file that are

								        // prefixed with `;;!`.

								        let config_lines: Vec<_> = wat

								            .lines()

								            .take_while(|l| l.starts_with(";;!"))

								            .map(|l| &l[3..])

								            .collect();

								        let config_text = config_lines.join("\n");


								        toml::from_str(&config_text).context("failed to parse the test configuration")

								    }


								    /// Generates CLIF for all the wasm functions in this test.

								    fn compile(&mut self) -> Result<CompileOutput> {

								        // Use wasmtime::Config with its `emit_clif` option to get Wasmtime's

								        // code generator to jettison CLIF out the back.

								        let tempdir = TempDir::new().context("failed to make a tempdir")?;

								        let mut config = self.opts.config(Some(&self.config.target), None)?;

								        match self.config.test {

								            TestKind::Clif | TestKind::Optimize => {

								                config.emit_clif(tempdir.path());

								            }

								            TestKind::Compile => {}

								            TestKind::Winch => {

								                config.strategy(Strategy::Winch);

								            }

								        }

								        let engine = Engine::new(&config).context("failed to create engine")?;

								        let module = wat::parse_file(&self.path)?;

								        let elf = engine

								            .precompile_module(&module)

								            .context("failed to compile module")?;


								        match self.config.test {

								            TestKind::Clif | TestKind::Optimize => {

								                // Read all `*.clif` files from the clif directory that the

								                // compilation process just emitted.

								                let mut clifs = Vec::new();

								                for entry in tempdir

								                    .path()

								                    .read_dir()

								                    .context("failed to read tempdir")?

								                {

								                    let entry = entry.context("failed to iterate over tempdir")?;

								                    let path = entry.path();

								                    let clif = std::fs::read_to_string(&path)

								                        .with_context(|| format!("failed to read clif file {path:?}"))?;

								                    clifs.push(clif);

								                }


								                // Parse the text format CLIF which is emitted by Wasmtime back

								                // into in-memory data structures.

								                let mut functions = clifs

								                    .iter()

								                    .map(|clif| {

								                        let mut funcs = cranelift_reader::parse_functions(clif)?;

								                        if funcs.len() != 1 {

								                            bail!("expected one function per clif");

								                        }

								                        Ok(funcs.remove(0))

								                    })

								                    .collect::<Result<Vec<_>>>()?;

								                functions.sort_by_key(|f| match f.name {

								                    UserFuncName::User(UserExternalName { namespace, index }) => (namespace, index),

								                    UserFuncName::Testcase(_) => unreachable!(),

								                });

								                Ok(CompileOutput::Clif(functions))

								            }

								            TestKind::Compile | TestKind::Winch => Ok(CompileOutput::Elf(elf)),

								        }

								    }


								    /// Use the test configuration present with CLI flags to build a

								    /// `TargetIsa` to compile/optimize the CLIF.

								    fn build_target_isa(&self) -> Result<Arc<dyn TargetIsa>> {

								        let mut builder = lookup_by_name(&self.config.target)?;

								        let mut flags = cranelift_codegen::settings::builder();

								        let opt_level = match self.opts.opts.opt_level {

								            None | Some(OptLevel::Speed) => "speed",

								            Some(OptLevel::SpeedAndSize) => "speed_and_size",

								            Some(OptLevel::None) => "none",

								            _ => unreachable!(),

								        };

								        flags.set("opt_level", opt_level)?;

								        for (key, val) in self.opts.codegen.cranelift.iter() {

								            let key = &key.replace("-", "_");

								            let target_res = match val {

								                Some(val) => builder.set(key, val),

								                None => builder.enable(key),

								            };

								            match target_res {

								                Ok(()) => continue,

								                Err(SetError::BadName(_)) => {}

								                Err(e) => bail!(e),

								            }

								            match val {

								                Some(val) => flags.set(key, val)?,

								                None => flags.enable(key)?,

								            }

								        }

								        let isa = builder.finish(Flags::new(flags))?;

								        Ok(isa)

								    }

								}


								enum CompileOutput {

								    Clif(Vec<Function>),

								    Elf(Vec<u8>),

								}


								/// Assert that `wat` contains the test expectations necessary for `funcs`.

								fn assert_output(

								    path: &Path,

								    wat: &str,

								    isa: &dyn TargetIsa,

								    kind: TestKind,

								    output: CompileOutput,

								) -> Result<()> {

								    let mut actual = String::new();

								    match output {

								        CompileOutput::Clif(funcs) => {

								            for mut func in funcs {

								                match kind {

								                    TestKind::Compile | TestKind::Winch => unreachable!(),

								                    TestKind::Optimize => {

								                        let mut ctx = cranelift_codegen::Context::for_function(func.clone());

								                        ctx.optimize(isa, &mut Default::default())

								                            .map_err(|e| codegen_error_to_anyhow_error(&ctx.func, e))?;

								                        ctx.func.dfg.resolve_all_aliases();

								                        writeln!(&mut actual, "{}", ctx.func.display()).unwrap();

								                    }

								                    TestKind::Clif => {

								                        func.dfg.resolve_all_aliases();

								                        writeln!(&mut actual, "{}", func.display()).unwrap();

								                    }

								                }

								            }

								        }

								        CompileOutput::Elf(bytes) => {

								            let disas = isa.to_capstone()?;

								            disas_elf(&disas, &mut actual, &bytes)?;

								        }

								    }

								    let actual = actual.trim();

								    assert_or_bless_output(path, wat, actual)

								}


								fn disas_elf(disas: &capstone::Capstone, result: &mut String, elf: &[u8]) -> Result<()> {

								    use capstone::InsnGroupType::{CS_GRP_JUMP, CS_GRP_RET};

								    use object::{Endianness, Object, ObjectSection, ObjectSymbol};


								    let elf = object::read::elf::ElfFile64::<Endianness>::parse(elf)?;

								    let text = elf.section_by_name(".text").unwrap();

								    let text = text.data()?;

								    let mut first = true;

								    for sym in elf.symbols() {

								        let name = match sym.name() {

								            Ok(name) => name,

								            Err(_) => continue,

								        };

								        if !name.contains("wasm") || !name.contains("function") {

								            continue;

								        }


								        let bytes = &text[sym.address() as usize..][..sym.size() as usize];


								        if first {

								            first = false;

								        } else {

								            result.push_str("\n");

								        }

								        writeln!(result, "{name}:")?;


								        // By default don't write all the offsets of all the instructions. That

								        // means that small changes in the instruction sequence cause large

								        // diffs which aren't always the most readable. As a rough balance,

								        // print offset of instructions-after-jumps and anything-after-ret as

								        // that's a decent-enough heuristic for jump targets.

								        let mut prev_jump = false;

								        let mut write_offsets = false;


								        for inst in disas.disasm_all(bytes, sym.address())?.iter() {

								            let detail = disas.insn_detail(&inst).ok();

								            let detail = detail.as_ref();

								            let is_jump = detail

								                .map(|d| {

								                    d.groups()

								                        .iter()

								                        .find(|g| g.0 as u32 == CS_GRP_JUMP)

								                        .is_some()

								                })

								                .unwrap_or(false);


								            if write_offsets || (prev_jump && !is_jump) {

								                write!(result, "{:>4x}: ", inst.address())?;

								            } else {

								                write!(result, "      ")?;

								            }


								            match (inst.mnemonic(), inst.op_str()) {

								                (Some(i), Some(o)) => {

								                    if o.is_empty() {

								                        writeln!(result, "{i}")?;

								                    } else {

								                        writeln!(result, "{i:7} {o}")?;

								                    }

								                }

								                (Some(i), None) => writeln!(result, "{i}")?,

								                _ => unreachable!(),

								            }


								            prev_jump = is_jump;


								            // Flip write_offsets to true once we've seen a `ret`, as

								            // instructions that follow the return are often related to trap

								            // tables.

								            write_offsets = write_offsets

								                || detail

								                    .map(|d| {

								                        d.groups()

								                            .iter()

								                            .find(|g| g.0 as u32 == CS_GRP_RET)

								                            .is_some()

								                    })

								                    .unwrap_or(false);

								        }

								    }

								    Ok(())

								}


								fn assert_or_bless_output(path: &Path, wat: &str, actual: &str) -> Result<()> {

								    log::debug!("=== actual ===\n{actual}");

								    // The test's expectation is the final comment.

								    let mut expected_lines: Vec<_> = wat

								        .lines()

								        .rev()

								        .map_while(|l| l.strip_prefix(";;"))

								        .map(|l| l.strip_prefix(" ").unwrap_or(l))

								        .collect();

								    expected_lines.reverse();

								    let expected = expected_lines.join("\n");

								    let expected = expected.trim();

								    log::debug!("=== expected ===\n{expected}");


								    if actual == expected {

								        return Ok(());

								    }


								    if std::env::var("WASMTIME_TEST_BLESS").unwrap_or_default() == "1" {

								        let old_expectation_line_count = wat

								            .lines()

								            .rev()

								            .take_while(|l| l.starts_with(";;"))

								            .count();

								        let old_wat_line_count = wat.lines().count();

								        let new_wat_lines: Vec<_> = wat

								            .lines()

								            .take(old_wat_line_count - old_expectation_line_count)

								            .map(|l| l.to_string())

								            .chain(actual.lines().map(|l| {

								                if l.is_empty() {

								                    ";;".to_string()

								                } else {

								                    format!(";; {l}")

								                }

								            }))

								            .collect();

								        let mut new_wat = new_wat_lines.join("\n");

								        new_wat.push('\n');

								        std::fs::write(path, new_wat)

								            .with_context(|| format!("failed to write file: {}", path.display()))?;

								        return Ok(());

								    }


								    bail!(

								        "Did not get the expected CLIF translation:\n\n\

								         {}\n\n\

								         Note: You can re-run with the `WASMTIME_TEST_BLESS=1` environment\n\

								         variable set to update test expectations.",

								        TextDiff::from_lines(expected, actual)

								            .unified_diff()

								            .header("expected", "actual")

								    )

								}


								fn codegen_error_to_anyhow_error(

								    func: &cranelift_codegen::ir::Function,

								    err: cranelift_codegen::CodegenError,

								) -> anyhow::Error {

								    let s = cranelift_codegen::print_errors::pretty_error(func, err);

								    anyhow::anyhow!("{}", s)

								}