diff --git a/.github/workflows/main.yml b/.github/workflows/main.yml index e99a2c6b3c..8a0686df8d 100644 --- a/.github/workflows/main.yml +++ b/.github/workflows/main.yml @@ -164,6 +164,59 @@ jobs: | xargs cargo fuzz run differential --release --debug-assertions --features binaryen env: RUST_BACKTRACE: 1 + - run: | + find fuzz/corpus/peepmatic_compile -type f \ + | shuf \ + | head -n 10000 \ + | xargs cargo fuzz run peepmatic_compile --release --debug-assertions --features binaryen + env: + RUST_BACKTRACE: 1 + - run: | + find fuzz/corpus/peepmatic_fst_differential -type f \ + | shuf \ + | head -n 10000 \ + | xargs cargo fuzz run peepmatic_fst_differential --release --debug-assertions --features binaryen + env: + RUST_BACKTRACE: 1 + - run: | + find fuzz/corpus/peepmatic_interp -type f \ + | shuf \ + | head -n 5000 \ + | xargs cargo fuzz run peepmatic_interp --release --debug-assertions --features binaryen + env: + RUST_BACKTRACE: 1 + - run: | + find fuzz/corpus/peepmatic_parser -type f \ + | shuf \ + | head -n 10000 \ + | xargs cargo fuzz run peepmatic_parser --release --debug-assertions --features binaryen + env: + RUST_BACKTRACE: 1 + - run: | + find fuzz/corpus/peepmatic_simple_automata -type f \ + | shuf \ + | head -n 1000 \ + | xargs cargo fuzz run peepmatic_simple_automata --release --debug-assertions --features binaryen + env: + RUST_BACKTRACE: 1 + + rebuild_peephole_optimizers: + name: Rebuild Peephole Optimizers + runs-on: ubuntu-latest + steps: + - uses: actions/checkout@v1 + with: + submodules: true + - name: Rebuild peepmatic peephole optimizers + run: | + cd cranelift/ + cargo build --features 'enable-peepmatic cranelift-codegen/rebuild-peephole-optimizers' + - name: Check that peephole optimizers are up to date + run: git diff --exit-code + - name: Test with peepmatic + run: | + cd cranelift/ + cargo test --features 'enable-peepmatic' # Perform all tests (debug mode) for `wasmtime`. 
This runs stable/beta/nightly # channels of Rust as well as macOS/Linux/Windows. @@ -334,11 +387,29 @@ jobs: # Build `wasmtime` and executables - run: $CENTOS cargo build --release --bin wasmtime shell: bash + # Build `libwasmtime.so` - run: $CENTOS cargo build --release --manifest-path crates/c-api/Cargo.toml shell: bash - # Test what we just built - - run: $CENTOS cargo test --features test-programs/test_programs --release --all --exclude lightbeam + + # Test what we just built. + # + # Ignore some optional dependencies that are used by features that aren't + # enabled by default, are tested in other, dedicated CI jobs, and which + # would increase build times here. + - run: | + $CENTOS cargo test \ + --features test-programs/test_programs \ + --release \ + --all \ + --exclude lightbeam \ + --exclude peepmatic \ + --exclude peepmatic-automata \ + --exclude peepmatic-fuzzing \ + --exclude peepmatic-macro \ + --exclude peepmatic-runtime \ + --exclude peepmatic-test \ + --exclude wasmtime-fuzz shell: bash env: RUST_BACKTRACE: 1 diff --git a/.gitignore b/.gitignore index 4c37c4f83d..f890733b7d 100644 --- a/.gitignore +++ b/.gitignore @@ -14,3 +14,4 @@ docs/book rusty-tags.* tags target +.z3-trace diff --git a/Cargo.lock b/Cargo.lock index c143251096..0a9e38fd62 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -11,9 +11,12 @@ dependencies = [ [[package]] name = "ahash" -version = "0.3.3" +version = "0.3.2" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "35b909d1c126f78ace756fc337133356c499eebeefcce930fa5fb018823f2b2d" +checksum = "0989268a37e128d4d7a8028f1c60099430113fdbc70419010601ce51a228e4fe" +dependencies = [ + "const-random", +] [[package]] name = "aho-corasick" @@ -41,9 +44,9 @@ checksum = "d9a60d744a80c30fcb657dfe2c1b22bcb3e814c1a1e3674f32bf5820b570fbff" [[package]] name = "arbitrary" -version = "0.4.4" +version = "0.4.1" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = 
"c5eb01a9ab8a3369f2f7632b9461c34f5920bd454774bab5b9fc6744f21d6143" +checksum = "75153c95fdedd7db9732dfbfc3702324a1627eec91ba56e37cd0ac78314ab2ed" dependencies = [ "derive_arbitrary", ] @@ -97,9 +100,9 @@ dependencies = [ [[package]] name = "backtrace-sys" -version = "0.1.36" +version = "0.1.35" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "78848718ee1255a2485d1309ad9cdecfc2e7d0362dd11c6829364c6b35ae1bc7" +checksum = "7de8aba10a69c8e8d7622c5710229485ec32e9d55fdad160ea559c086fdcd118" dependencies = [ "cc", "libc", @@ -201,6 +204,12 @@ dependencies = [ "byte-tools", ] +[[package]] +name = "bumpalo" +version = "3.2.1" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "12ae9db68ad7fac5fe51304d20f016c911539251075a214f8e663babefa35187" + [[package]] name = "byte-tools" version = "0.3.1" @@ -233,9 +242,9 @@ dependencies = [ [[package]] name = "cc" -version = "1.0.52" +version = "1.0.50" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "c3d87b23d6a92cd03af510a5ade527033f6aa6fa92161e2d5863a907d4c5e31d" +checksum = "95e28fa049fda1c330bcf9d723be7663a899c4679724b34c81e9f5a326aab8cd" dependencies = [ "jobserver", ] @@ -261,6 +270,18 @@ dependencies = [ "vec_map", ] +[[package]] +name = "clicolors-control" +version = "1.0.1" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "90082ee5dcdd64dc4e9e0d37fbf3ee325419e39c0092191e0393df65518f741e" +dependencies = [ + "atty", + "lazy_static", + "libc", + "winapi", +] + [[package]] name = "cloudabi" version = "0.0.3" @@ -281,19 +302,18 @@ dependencies = [ [[package]] name = "console" -version = "0.11.2" +version = "0.10.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "dea0f3e2e8d7dba335e913b97f9e1992c86c4399d54f8be1d31c8727d0652064" +checksum = "6728a28023f207181b193262711102bfbaf47cc9d13bc71d0736607ef8efe88c" dependencies = [ + "clicolors-control", "encode_unicode", "lazy_static", "libc", 
"regex", - "terminal_size", "termios", "unicode-width", "winapi", - "winapi-util", ] [[package]] @@ -357,8 +377,10 @@ dependencies = [ "cranelift-codegen-shared", "cranelift-entity", "gimli", - "hashbrown 0.7.2", + "hashbrown 0.7.1", "log", + "peepmatic", + "peepmatic-runtime", "regalloc", "serde", "smallvec", @@ -424,7 +446,7 @@ name = "cranelift-frontend" version = "0.63.0" dependencies = [ "cranelift-codegen", - "hashbrown 0.7.2", + "hashbrown 0.7.1", "log", "smallvec", "target-lexicon", @@ -438,7 +460,7 @@ dependencies = [ "cranelift-entity", "cranelift-frontend", "cranelift-reader", - "hashbrown 0.7.2", + "hashbrown 0.7.1", "log", "pretty_env_logger", "thiserror", @@ -566,12 +588,12 @@ dependencies = [ "cranelift-codegen", "cranelift-entity", "cranelift-frontend", - "hashbrown 0.7.2", + "hashbrown 0.7.1", "log", "serde", "target-lexicon", "thiserror", - "wasmparser", + "wasmparser 0.52.2", "wat", ] @@ -642,13 +664,13 @@ dependencies = [ [[package]] name = "derive_arbitrary" -version = "0.4.4" +version = "0.4.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "5cee758ebd1c79a9c6fb95f242dcc30bdbf555c28369ae908d21fdaf81537496" +checksum = "caedd6a71b6d00bdc458ec8ffbfd12689c1ee7ffa69ad9933310aaf2f08f18d8" dependencies = [ "proc-macro2", - "quote", "syn", + "synstructure", ] [[package]] @@ -877,6 +899,12 @@ version = "1.0.6" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "2fad85553e09a6f881f739c29f0b00b0f01357c743266d478b68951ce23285f3" +[[package]] +name = "fst" +version = "0.4.3" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "81f9cac32c1741cdf6b66be7dcf0d9c7f25ccf12f8aa84c16cfa31f9f14513b3" + [[package]] name = "fuchsia-cprng" version = "0.1.1" @@ -952,11 +980,11 @@ dependencies = [ [[package]] name = "hashbrown" -version = "0.7.2" +version = "0.7.1" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = 
"96282e96bfcd3da0d3aa9938bedf1e50df3269b6db08b4876d2da0bb1a0841cf" +checksum = "479e9d9a1a3f8c489868a935b557ab5710e3e223836da2ecd52901d88935cb56" dependencies = [ - "ahash 0.3.3", + "ahash 0.3.2", "autocfg 1.0.0", ] @@ -971,9 +999,9 @@ dependencies = [ [[package]] name = "hermit-abi" -version = "0.1.12" +version = "0.1.10" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "61565ff7aaace3525556587bd2dc31d4a07071957be715e63ce7b1eccf51a8f4" +checksum = "725cf19794cf90aa94e65050cb4191ff5d8fa87a498383774c47b332e3af952e" dependencies = [ "libc", ] @@ -1100,7 +1128,7 @@ dependencies = [ "staticvec", "thiserror", "typemap", - "wasmparser", + "wasmparser 0.52.2", "wat", ] @@ -1170,9 +1198,9 @@ dependencies = [ [[package]] name = "num_cpus" -version = "1.13.0" +version = "1.12.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "05499f3756671c15885fee9034446956fff3f243d6077b91e5767df161f766b3" +checksum = "46203554f085ff89c235cd12f7075f3233af9b11ed7c9e16dfe2560d03313ce6" dependencies = [ "hermit-abi", "libc", @@ -1226,6 +1254,76 @@ dependencies = [ "stable_deref_trait", ] +[[package]] +name = "peepmatic" +version = "0.1.0" +dependencies = [ + "anyhow", + "peepmatic-automata", + "peepmatic-macro", + "peepmatic-runtime", + "wast 15.0.0", + "z3", +] + +[[package]] +name = "peepmatic-automata" +version = "0.1.0" +dependencies = [ + "serde", +] + +[[package]] +name = "peepmatic-fuzzing" +version = "0.1.0" +dependencies = [ + "arbitrary", + "bincode", + "env_logger 0.7.1", + "fst", + "log", + "peepmatic", + "peepmatic-automata", + "peepmatic-runtime", + "peepmatic-test", + "rand 0.7.3", + "serde", + "wast 15.0.0", +] + +[[package]] +name = "peepmatic-macro" +version = "0.1.0" +dependencies = [ + "proc-macro2", + "quote", + "syn", +] + +[[package]] +name = "peepmatic-runtime" +version = "0.1.0" +dependencies = [ + "bincode", + "bumpalo", + "log", + "peepmatic-automata", + "peepmatic-macro", + "serde", + "thiserror", + "wast 
15.0.0", +] + +[[package]] +name = "peepmatic-test" +version = "0.1.0" +dependencies = [ + "env_logger 0.7.1", + "log", + "peepmatic", + "peepmatic-runtime", +] + [[package]] name = "plain" version = "0.2.3" @@ -1291,9 +1389,9 @@ dependencies = [ [[package]] name = "proptest" -version = "0.9.6" +version = "0.9.5" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "01c477819b845fe023d33583ebf10c9f62518c8d79a0960ba5c36d6ac8a55a5b" +checksum = "bf6147d103a7c9d7598f4105cf049b15c99e2ecd93179bf024f0fd349be5ada4" dependencies = [ "bit-set", "bitflags", @@ -1350,7 +1448,7 @@ dependencies = [ "rand_isaac", "rand_jitter", "rand_os", - "rand_pcg", + "rand_pcg 0.1.2", "rand_xorshift", "winapi", ] @@ -1366,6 +1464,7 @@ dependencies = [ "rand_chacha 0.2.2", "rand_core 0.5.1", "rand_hc 0.2.0", + "rand_pcg 0.2.1", ] [[package]] @@ -1474,6 +1573,15 @@ dependencies = [ "rand_core 0.4.2", ] +[[package]] +name = "rand_pcg" +version = "0.2.1" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "16abd0c1b639e9eb4d7c50c0b8100b0d0f849be2349829c740fe8e6eb4816429" +dependencies = [ + "rand_core 0.5.1", +] + [[package]] name = "rand_xorshift" version = "0.1.1" @@ -1557,9 +1665,9 @@ dependencies = [ [[package]] name = "regex" -version = "1.3.7" +version = "1.3.6" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "a6020f034922e3194c711b82a627453881bc4682166cabb07134a10c26ba7692" +checksum = "7f6946991529684867e47d86474e3a6d0c0ab9b82d5821e314b1ede31fa3a4b3" dependencies = [ "aho-corasick", "memchr", @@ -1648,9 +1756,9 @@ dependencies = [ [[package]] name = "ryu" -version = "1.0.4" +version = "1.0.3" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "ed3d612bc64430efeb3f7ee6ef26d590dce0c43249217bddc62112540c7941e1" +checksum = "535622e6be132bccd223f4bb2b8ac8d53cda3c7a6394944d3b2b33fb974f9d76" [[package]] name = "same-file" @@ -1724,9 +1832,9 @@ dependencies = [ [[package]] name = 
"serde_json" -version = "1.0.52" +version = "1.0.51" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "a7894c8ed05b7a3a279aeb79025fdec1d3158080b75b98a08faf2806bb799edd" +checksum = "da07b57ee2623368351e9a0488bb0b261322a15a6e0ae53e243cbdc0f4208da9" dependencies = [ "itoa", "ryu", @@ -1747,9 +1855,9 @@ dependencies = [ [[package]] name = "smallvec" -version = "1.4.0" +version = "1.3.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "c7cb5678e1615754284ec264d9bb5b4c27d2018577fd90ac0ceb578591ed5ee4" +checksum = "05720e22615919e4734f6a99ceae50d00226c3c5aca406e102ebc33298214e0a" [[package]] name = "stable_deref_trait" @@ -1780,9 +1888,9 @@ checksum = "8ea5119cdb4c55b55d432abb513a0429384878c15dde60cc77b1c99de1a95a6a" [[package]] name = "structopt" -version = "0.3.14" +version = "0.3.13" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "863246aaf5ddd0d6928dfeb1a9ca65f505599e4e1b399935ef7e75107516b4ef" +checksum = "ff6da2e8d107dfd7b74df5ef4d205c6aebee0706c647f6bc6a2d5789905c00fb" dependencies = [ "clap", "lazy_static", @@ -1791,9 +1899,9 @@ dependencies = [ [[package]] name = "structopt-derive" -version = "0.4.7" +version = "0.4.6" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "d239ca4b13aee7a2142e6795cbd69e457665ff8037aed33b3effdc430d2f927a" +checksum = "a489c87c08fbaf12e386665109dd13470dcc9c4583ea3e10dd2b4523e5ebd9ac" dependencies = [ "heck", "proc-macro-error", @@ -1804,9 +1912,9 @@ dependencies = [ [[package]] name = "syn" -version = "1.0.18" +version = "1.0.17" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "410a7488c0a728c7ceb4ad59b9567eb4053d02e8cc7f5c0e0eeeb39518369213" +checksum = "0df0eb663f387145cab623dea85b09c2c5b4b0aef44e945d928e682fce71bb03" dependencies = [ "proc-macro2", "quote", @@ -1824,6 +1932,18 @@ dependencies = [ "syn", ] +[[package]] +name = "synstructure" +version = "0.12.3" +source = 
"registry+https://github.com/rust-lang/crates.io-index" +checksum = "67656ea1dc1b41b1451851562ea232ec2e5a80242139f7e679ceccfb5d61f545" +dependencies = [ + "proc-macro2", + "quote", + "syn", + "unicode-xid", +] + [[package]] name = "target-lexicon" version = "0.10.0" @@ -1863,16 +1983,6 @@ dependencies = [ "winapi-util", ] -[[package]] -name = "terminal_size" -version = "0.1.12" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "8038f95fc7a6f351163f4b964af631bd26c9e828f7db085f2a84aca56f70d13b" -dependencies = [ - "libc", - "winapi", -] - [[package]] name = "termios" version = "0.3.2" @@ -1909,18 +2019,18 @@ dependencies = [ [[package]] name = "thiserror" -version = "1.0.16" +version = "1.0.15" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "d12a1dae4add0f0d568eebc7bf142f145ba1aa2544cafb195c76f0f409091b60" +checksum = "54b3d3d2ff68104100ab257bb6bb0cb26c901abe4bd4ba15961f3bf867924012" dependencies = [ "thiserror-impl", ] [[package]] name = "thiserror-impl" -version = "1.0.16" +version = "1.0.15" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "3f34e0c1caaa462fd840ec6b768946ea1e7842620d94fe29d5b847138f521269" +checksum = "ca972988113b7715266f91250ddb98070d033c62a011fa0fcc57434a649310dd" dependencies = [ "proc-macro2", "quote", @@ -1962,9 +2072,9 @@ dependencies = [ [[package]] name = "typenum" -version = "1.12.0" +version = "1.11.2" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "373c8a200f9e67a0c95e62a4f52fbf80c23b4381c05a17845531982fa99e6b33" +checksum = "6d2783fe2d6b8c1101136184eb41be8b1ad379e4657050b8aaff0c79ee7575f9" [[package]] name = "unicode-segmentation" @@ -2051,6 +2161,12 @@ dependencies = [ "yanix", ] +[[package]] +name = "wasmparser" +version = "0.51.4" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "aeb1956b19469d1c5e63e459d29e7b5aa0f558d9f16fcef09736f8a265e6c10a" + [[package]] name = "wasmparser" version = 
"0.52.2" @@ -2059,12 +2175,12 @@ checksum = "733954023c0b39602439e60a65126fd31b003196d3a1e8e4531b055165a79b31" [[package]] name = "wasmprinter" -version = "0.2.4" +version = "0.2.3" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "21c3ac16b1f882bf1e1ce007e4f194559d2e3332013367863ddfbc828d1f044f" +checksum = "8bd423d45b95fcee11775472bfdce66c63c45ada23c1b338e0a63d623a6c475b" dependencies = [ "anyhow", - "wasmparser", + "wasmparser 0.51.4", ] [[package]] @@ -2080,7 +2196,7 @@ dependencies = [ "rustc-demangle", "target-lexicon", "tempfile", - "wasmparser", + "wasmparser 0.52.2", "wasmtime-environ", "wasmtime-jit", "wasmtime-profiling", @@ -2150,7 +2266,7 @@ dependencies = [ "more-asserts", "target-lexicon", "thiserror", - "wasmparser", + "wasmparser 0.52.2", "wasmtime-environ", ] @@ -2181,7 +2297,7 @@ dependencies = [ "tempfile", "thiserror", "toml", - "wasmparser", + "wasmparser 0.52.2", "winapi", "zstd", ] @@ -2194,6 +2310,7 @@ dependencies = [ "cranelift-reader", "cranelift-wasm", "libfuzzer-sys", + "peepmatic-fuzzing", "target-lexicon", "wasmtime", "wasmtime-fuzzing", @@ -2209,7 +2326,7 @@ dependencies = [ "env_logger 0.7.1", "log", "rayon", - "wasmparser", + "wasmparser 0.52.2", "wasmprinter", "wasmtime", "wasmtime-wast", @@ -2233,7 +2350,7 @@ dependencies = [ "region", "target-lexicon", "thiserror", - "wasmparser", + "wasmparser 0.52.2", "wasmtime-debug", "wasmtime-environ", "wasmtime-profiling", @@ -2424,9 +2541,9 @@ checksum = "ac3b87c63620426dd9b991e5ce0329eff545bccbbb34f3be09ff6fb6ab51b7b6" [[package]] name = "winapi-util" -version = "0.1.5" +version = "0.1.4" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "70ec6ce85bb158151cae5e5c87f95a8e97d2c0c4b001223f33a334e3ce5de178" +checksum = "fa515c5163a99cc82bab70fd3bfdd36d827be85de63737b40fcef2ce084a436e" dependencies = [ "winapi", ] @@ -2470,6 +2587,26 @@ dependencies = [ "log", ] +[[package]] +name = "z3" +version = "0.5.1" +source = 
"registry+https://github.com/rust-lang/crates.io-index" +checksum = "ded00cd90f8e3a7ea3155bddd72573f2b099ea201877542d924e47b58dd04e72" +dependencies = [ + "lazy_static", + "log", + "z3-sys", +] + +[[package]] +name = "z3-sys" +version = "0.6.1" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "4002d8a1facb54d02dbfb86151281e5450618ab330936bc2f3acaab31eae11ae" +dependencies = [ + "cmake", +] + [[package]] name = "zstd" version = "0.5.1+zstd.1.4.4" diff --git a/cranelift/Cargo.toml b/cranelift/Cargo.toml index f2e4ea9607..335a69c808 100644 --- a/cranelift/Cargo.toml +++ b/cranelift/Cargo.toml @@ -47,4 +47,5 @@ walkdir = "2.2" [features] default = ["disas", "wasm", "cranelift-codegen/all-arch"] disas = ["capstone"] +enable-peepmatic = ["cranelift-codegen/enable-peepmatic", "cranelift-filetests/enable-peepmatic"] wasm = ["wat", "cranelift-wasm"] diff --git a/cranelift/codegen/Cargo.toml b/cranelift/codegen/Cargo.toml index 692c85bdd4..0bc1c32006 100644 --- a/cranelift/codegen/Cargo.toml +++ b/cranelift/codegen/Cargo.toml @@ -24,6 +24,7 @@ gimli = { version = "0.20.0", default-features = false, features = ["write"], op smallvec = { version = "1.0.0" } thiserror = "1.0.4" byteorder = { version = "1.3.2", default-features = false } +peepmatic-runtime = { path = "../peepmatic/crates/runtime", optional = true } regalloc = "0.0.23" # It is a goal of the cranelift-codegen crate to have minimal external dependencies. 
# Please don't add any unless they are essential to the task of creating binary @@ -32,6 +33,7 @@ regalloc = "0.0.23" [build-dependencies] cranelift-codegen-meta = { path = "meta", version = "0.63.0" } +peepmatic = { path = "../peepmatic", optional = true } [features] default = ["std", "unwind"] @@ -72,5 +74,12 @@ all-arch = [ # For dependent crates that want to serialize some parts of cranelift enable-serde = ["serde"] +# Recompile our optimizations that are written in the `peepmatic` DSL into a +# compact finite-state transducer automaton. +rebuild-peephole-optimizers = ["peepmatic"] + +# Enable the use of `peepmatic`-generated peephole optimizers. +enable-peepmatic = ["peepmatic-runtime"] + [badges] maintenance = { status = "experimental" } diff --git a/cranelift/codegen/build.rs b/cranelift/codegen/build.rs index bb14364050..b7352f37c3 100644 --- a/cranelift/codegen/build.rs +++ b/cranelift/codegen/build.rs @@ -71,4 +71,22 @@ fn main() { ); println!("cargo:warning=Generated files are in {}", out_dir); } + + #[cfg(feature = "rebuild-peephole-optimizers")] + rebuild_peephole_optimizers(); +} + +#[cfg(feature = "rebuild-peephole-optimizers")] +fn rebuild_peephole_optimizers() { + use std::path::Path; + + let source_path = Path::new("src").join("preopt.peepmatic"); + println!("cargo:rerun-if-changed={}", source_path.display()); + + let preopt = + peepmatic::compile_file(&source_path).expect("failed to compile `src/preopt.peepmatic`"); + + preopt + .serialize_to_file(&Path::new("src").join("preopt.serialized")) + .expect("failed to serialize peephole optimizer to `src/preopt.serialized`"); } diff --git a/cranelift/codegen/src/ir/dfg.rs b/cranelift/codegen/src/ir/dfg.rs index 787f519de9..58d101aace 100644 --- a/cranelift/codegen/src/ir/dfg.rs +++ b/cranelift/codegen/src/ir/dfg.rs @@ -234,11 +234,7 @@ impl DataFlowGraph { /// Get the type of a value. pub fn value_type(&self, v: Value) -> Type { - match self.values[v] { - ValueData::Inst { ty, .. 
} - | ValueData::Param { ty, .. } - | ValueData::Alias { ty, .. } => ty, - } + self.values[v].ty() } /// Get the definition of a value. @@ -383,9 +379,14 @@ pub enum ValueDef { impl ValueDef { /// Unwrap the instruction where the value was defined, or panic. pub fn unwrap_inst(&self) -> Inst { + self.inst().expect("Value is not an instruction result") + } + + /// Get the instruction where the value was defined, if any. + pub fn inst(&self) -> Option { match *self { - Self::Result(inst, _) => inst, - _ => panic!("Value is not an instruction result"), + Self::Result(inst, _) => Some(inst), + _ => None, } } @@ -428,6 +429,16 @@ enum ValueData { Alias { ty: Type, original: Value }, } +impl ValueData { + fn ty(&self) -> Type { + match *self { + ValueData::Inst { ty, .. } + | ValueData::Param { ty, .. } + | ValueData::Alias { ty, .. } => ty, + } + } +} + /// Instructions. /// impl DataFlowGraph { diff --git a/cranelift/codegen/src/ir/function.rs b/cranelift/codegen/src/ir/function.rs index 892af400af..f425eb669f 100644 --- a/cranelift/codegen/src/ir/function.rs +++ b/cranelift/codegen/src/ir/function.rs @@ -308,6 +308,30 @@ impl Function { // function, assume it is not a leaf. self.dfg.signatures.is_empty() } + + /// Replace the `dst` instruction's data with the `src` instruction's data + /// and then remove `src`. + /// + /// `src` and its result values should not be used at all, as any uses would + /// be left dangling after calling this method. + /// + /// `src` and `dst` must have the same number of resulting values, and + /// `src`'s i^th value must have the same type as `dst`'s i^th value. 
+ pub fn transplant_inst(&mut self, dst: Inst, src: Inst) { + debug_assert_eq!( + self.dfg.inst_results(dst).len(), + self.dfg.inst_results(src).len() + ); + debug_assert!(self + .dfg + .inst_results(dst) + .iter() + .zip(self.dfg.inst_results(src)) + .all(|(a, b)| self.dfg.value_type(*a) == self.dfg.value_type(*b))); + + self.dfg[dst] = self.dfg[src].clone(); + self.layout.remove_inst(src); + } } /// Additional annotations for function display. diff --git a/cranelift/codegen/src/ir/instructions.rs b/cranelift/codegen/src/ir/instructions.rs index deb79130d4..1ada09fd71 100644 --- a/cranelift/codegen/src/ir/instructions.rs +++ b/cranelift/codegen/src/ir/instructions.rs @@ -11,9 +11,7 @@ use core::fmt::{self, Display, Formatter}; use core::ops::{Deref, DerefMut}; use core::str::FromStr; -use crate::ir; -use crate::ir::types; -use crate::ir::{Block, FuncRef, JumpTable, SigRef, Type, Value}; +use crate::ir::{self, trapcode::TrapCode, types, Block, FuncRef, JumpTable, SigRef, Type, Value}; use crate::isa; use crate::bitset::BitSet; @@ -257,6 +255,30 @@ impl InstructionData { } } + /// If this is a trapping instruction, get its trap code. Otherwise, return + /// `None`. + pub fn trap_code(&self) -> Option { + match *self { + Self::CondTrap { code, .. } + | Self::FloatCondTrap { code, .. } + | Self::IntCondTrap { code, .. } + | Self::Trap { code, .. } => Some(code), + _ => None, + } + } + + /// If this is a trapping instruction, get an exclusive reference to its + /// trap code. Otherwise, return `None`. + pub fn trap_code_mut(&mut self) -> Option<&mut TrapCode> { + match self { + Self::CondTrap { code, .. } + | Self::FloatCondTrap { code, .. } + | Self::IntCondTrap { code, .. } + | Self::Trap { code, .. } => Some(code), + _ => None, + } + } + /// Return information about a call instruction. /// /// Any instruction that can call another function reveals its call signature here. 
diff --git a/cranelift/codegen/src/lib.rs b/cranelift/codegen/src/lib.rs index efe0ea00c6..3483219fea 100644 --- a/cranelift/codegen/src/lib.rs +++ b/cranelift/codegen/src/lib.rs @@ -115,6 +115,9 @@ mod topo_order; mod unreachable_code; mod value_label; +#[cfg(feature = "enable-peepmatic")] +mod peepmatic; + pub use crate::result::{CodegenError, CodegenResult}; /// Version number of this crate. diff --git a/cranelift/codegen/src/peepmatic.rs b/cranelift/codegen/src/peepmatic.rs new file mode 100644 index 0000000000..1ea2031bfa --- /dev/null +++ b/cranelift/codegen/src/peepmatic.rs @@ -0,0 +1,887 @@ +//! Glue for working with `peepmatic`-generated peephole optimizers. + +use crate::cursor::{Cursor, FuncCursor}; +use crate::ir::{ + dfg::DataFlowGraph, + entities::{Inst, Value}, + immediates::{Imm64, Uimm64}, + instructions::{InstructionData, Opcode}, + types, InstBuilder, +}; +use crate::isa::TargetIsa; +use cranelift_codegen_shared::condcodes::IntCC; +use peepmatic_runtime::{ + cc::ConditionCode, + instruction_set::InstructionSet, + operator::Operator, + part::{Constant, Part}, + paths::Path, + r#type::{BitWidth, Kind, Type}, + PeepholeOptimizations, PeepholeOptimizer, +}; +use std::boxed::Box; +use std::convert::{TryFrom, TryInto}; +use std::ptr; +use std::sync::atomic::{AtomicPtr, Ordering}; + +/// Get the `preopt.peepmatic` peephole optimizer. +pub(crate) fn preopt<'a, 'b>( + isa: &'b dyn TargetIsa, +) -> PeepholeOptimizer<'static, 'a, &'b dyn TargetIsa> { + static SERIALIZED: &[u8] = include_bytes!("preopt.serialized"); + + // Once initialized, this must never be re-assigned. The initialized value + // is semantically "static data" and is intentionally leaked for the whole + // program's lifetime. + static DESERIALIZED: AtomicPtr = AtomicPtr::new(ptr::null_mut()); + + // If `DESERIALIZED` has already been initialized, then just use it. 
+ let ptr = DESERIALIZED.load(Ordering::SeqCst); + if let Some(peep_opts) = unsafe { ptr.as_ref() } { + return peep_opts.optimizer(isa); + } + + // Otherwise, if `DESERIALIZED` hasn't been initialized, then we need to + // deserialize the peephole optimizations and initialize it. However, + // another thread could be doing the same thing concurrently, so there is a + // race to see who initializes `DESERIALIZED` first, and we need to be + // prepared to both win or lose that race. + let peep_opts = PeepholeOptimizations::deserialize(SERIALIZED) + .expect("should always be able to deserialize `preopt.serialized`"); + let peep_opts = Box::into_raw(Box::new(peep_opts)); + + // Only update `DESERIALIZE` if it is still null, attempting to perform the + // one-time transition from null -> non-null. + if DESERIALIZED + .compare_and_swap(ptr::null_mut(), peep_opts, Ordering::SeqCst) + .is_null() + { + // We won the race to initialize `DESERIALIZED`. + debug_assert_eq!(DESERIALIZED.load(Ordering::SeqCst), peep_opts); + let peep_opts = unsafe { &*peep_opts }; + return peep_opts.optimizer(isa); + } + + // We lost the race to initialize `DESERIALIZED`. Drop our no-longer-needed + // instance of `peep_opts` and get the pointer to the instance that won the + // race. + let _ = unsafe { Box::from_raw(peep_opts) }; + let peep_opts = DESERIALIZED.load(Ordering::SeqCst); + let peep_opts = unsafe { peep_opts.as_ref().unwrap() }; + peep_opts.optimizer(isa) +} + +/// Either a `Value` or an `Inst`. +#[derive(Clone, Copy, Debug, Eq, PartialEq)] +pub enum ValueOrInst { + Value(Value), + Inst(Inst), +} + +impl ValueOrInst { + /// Get the underlying `Value` if any. + pub fn value(&self) -> Option { + match *self { + Self::Value(v) => Some(v), + Self::Inst(_) => None, + } + } + + /// Get the underlying `Inst` if any. 
+ pub fn inst(&self) -> Option { + match *self { + Self::Inst(i) => Some(i), + Self::Value(_) => None, + } + } + + /// Unwrap the underlying `Value`, panicking if it is not a `Value. + pub fn unwrap_value(&self) -> Value { + self.value().unwrap() + } + + /// Unwrap the underlying `Inst`, panicking if it is not a `Inst. + pub fn unwrap_inst(&self) -> Inst { + self.inst().unwrap() + } + + /// Is this a `Value`? + pub fn is_value(&self) -> bool { + self.value().is_some() + } + + /// Is this an `Inst`? + pub fn is_inst(&self) -> bool { + self.inst().is_some() + } + + fn resolve_inst(&self, dfg: &DataFlowGraph) -> Option { + match *self { + ValueOrInst::Inst(i) => Some(i), + ValueOrInst::Value(v) => dfg.value_def(v).inst(), + } + } + + fn result_bit_width(&self, dfg: &DataFlowGraph) -> u8 { + match *self { + ValueOrInst::Value(v) => dfg.value_type(v).bits().try_into().unwrap(), + ValueOrInst::Inst(inst) => { + let result = dfg.first_result(inst); + dfg.value_type(result).bits().try_into().unwrap() + } + } + } + + fn to_constant(&self, pos: &mut FuncCursor) -> Option { + let inst = self.resolve_inst(&pos.func.dfg)?; + match pos.func.dfg[inst] { + InstructionData::UnaryImm { + opcode: Opcode::Iconst, + imm, + } => { + let width = self.result_bit_width(&pos.func.dfg).try_into().unwrap(); + let x: i64 = imm.into(); + Some(Constant::Int(x as u64, width)) + } + InstructionData::UnaryBool { + opcode: Opcode::Bconst, + imm, + } => { + let width = self.result_bit_width(&pos.func.dfg).try_into().unwrap(); + Some(Constant::Bool(imm, width)) + } + _ => None, + } + } +} + +impl From for ValueOrInst { + fn from(v: Value) -> ValueOrInst { + ValueOrInst::Value(v) + } +} + +impl From for ValueOrInst { + fn from(i: Inst) -> ValueOrInst { + ValueOrInst::Inst(i) + } +} + +/// Get the fixed bit width of `bit_width`, or if it is polymorphic, the bit +/// width of `root`. 
+fn bit_width(dfg: &DataFlowGraph, bit_width: BitWidth, root: Inst) -> u8 { + bit_width.fixed_width().unwrap_or_else(|| { + let tyvar = dfg.ctrl_typevar(root); + let ty = dfg.compute_result_type(root, 0, tyvar).unwrap(); + u8::try_from(ty.bits()).unwrap() + }) +} + +/// Convert the constant `c` into an instruction. +fn const_to_value<'a>(builder: impl InstBuilder<'a>, c: Constant, root: Inst) -> Value { + match c { + Constant::Bool(b, width) => { + let width = bit_width(builder.data_flow_graph(), width, root); + let ty = match width { + 1 => types::B1, + 8 => types::B8, + 16 => types::B16, + 32 => types::B32, + 64 => types::B64, + 128 => types::B128, + _ => unreachable!(), + }; + builder.bconst(ty, b) + } + Constant::Int(x, width) => { + let width = bit_width(builder.data_flow_graph(), width, root); + let ty = match width { + 8 => types::I8, + 16 => types::I16, + 32 => types::I32, + 64 => types::I64, + 128 => types::I128, + _ => unreachable!(), + }; + builder.iconst(ty, x as i64) + } + } +} + +fn part_to_value(pos: &mut FuncCursor, root: Inst, part: Part) -> Option { + match part { + Part::Instruction(ValueOrInst::Inst(inst)) => { + pos.func.dfg.inst_results(inst).first().copied() + } + Part::Instruction(ValueOrInst::Value(v)) => Some(v), + Part::Constant(c) => Some(const_to_value(pos.ins(), c, root)), + Part::ConditionCode(_) => None, + } +} + +impl Opcode { + fn to_peepmatic_operator(&self) -> Option { + macro_rules! 
convert { + ( $( $op:ident $(,)* )* ) => { + match self { + $( Self::$op => Some(Operator::$op), )* + _ => None, + } + } + } + + convert!( + AdjustSpDown, + AdjustSpDownImm, + Band, + BandImm, + Bconst, + Bint, + Bor, + BorImm, + Brnz, + Brz, + Bxor, + BxorImm, + Iadd, + IaddImm, + Icmp, + IcmpImm, + Iconst, + Ifcmp, + IfcmpImm, + Imul, + ImulImm, + Ireduce, + IrsubImm, + Ishl, + IshlImm, + Isub, + Rotl, + RotlImm, + Rotr, + RotrImm, + Sdiv, + SdivImm, + Select, + Sextend, + Srem, + SremImm, + Sshr, + SshrImm, + Trapnz, + Trapz, + Udiv, + UdivImm, + Uextend, + Urem, + UremImm, + Ushr, + UshrImm, + ) + } +} + +impl TryFrom for Imm64 { + type Error = &'static str; + + fn try_from(c: Constant) -> Result { + match c { + Constant::Int(x, _) => Ok(Imm64::from(x as i64)), + Constant::Bool(..) => Err("cannot create Imm64 from Constant::Bool"), + } + } +} + +impl Into for Imm64 { + #[inline] + fn into(self) -> Constant { + let x: i64 = self.into(); + Constant::Int(x as _, BitWidth::SixtyFour) + } +} + +impl Into> for Imm64 { + #[inline] + fn into(self) -> Part { + let c: Constant = self.into(); + c.into() + } +} + +fn part_to_imm64(pos: &mut FuncCursor, part: Part) -> Imm64 { + return match part { + Part::Instruction(x) => match x.to_constant(pos).unwrap_or_else(|| cannot_convert()) { + Constant::Int(x, _) => (x as i64).into(), + Constant::Bool(..) => cannot_convert(), + }, + Part::Constant(Constant::Int(x, _)) => (x as i64).into(), + Part::ConditionCode(_) | Part::Constant(Constant::Bool(..)) => cannot_convert(), + }; + + #[inline(never)] + #[cold] + fn cannot_convert() -> ! 
{
+        panic!("cannot convert part into `Imm64`")
+    }
+}
+
+impl Into<Constant> for Uimm64 {
+    #[inline]
+    fn into(self) -> Constant {
+        let x: u64 = self.into();
+        Constant::Int(x, BitWidth::SixtyFour)
+    }
+}
+
+impl Into<Part<ValueOrInst>> for Uimm64 {
+    #[inline]
+    fn into(self) -> Part<ValueOrInst> {
+        let c: Constant = self.into();
+        c.into()
+    }
+}
+
+/// Convert a peepmatic condition code into its Cranelift `IntCC` equivalent.
+///
+/// NB: each arm must map to the condition with the *same* semantics
+/// (e.g. `Sle` is signed less-than-or-equal), and this table must stay the
+/// exact inverse of `intcc_to_peepmatic` below.
+fn peepmatic_to_intcc(cc: ConditionCode) -> IntCC {
+    match cc {
+        ConditionCode::Eq => IntCC::Equal,
+        ConditionCode::Ne => IntCC::NotEqual,
+        ConditionCode::Slt => IntCC::SignedLessThan,
+        ConditionCode::Sle => IntCC::SignedLessThanOrEqual,
+        ConditionCode::Sgt => IntCC::SignedGreaterThan,
+        ConditionCode::Sge => IntCC::SignedGreaterThanOrEqual,
+        ConditionCode::Ult => IntCC::UnsignedLessThan,
+        ConditionCode::Uge => IntCC::UnsignedGreaterThanOrEqual,
+        ConditionCode::Ugt => IntCC::UnsignedGreaterThan,
+        ConditionCode::Ule => IntCC::UnsignedLessThanOrEqual,
+        ConditionCode::Of => IntCC::Overflow,
+        ConditionCode::Nof => IntCC::NotOverflow,
+    }
+}
+
+/// Convert a Cranelift `IntCC` into its peepmatic condition-code equivalent.
+///
+/// Exact inverse of `peepmatic_to_intcc` above.
+fn intcc_to_peepmatic(cc: IntCC) -> ConditionCode {
+    match cc {
+        IntCC::Equal => ConditionCode::Eq,
+        IntCC::NotEqual => ConditionCode::Ne,
+        IntCC::SignedLessThan => ConditionCode::Slt,
+        IntCC::SignedLessThanOrEqual => ConditionCode::Sle,
+        IntCC::SignedGreaterThan => ConditionCode::Sgt,
+        IntCC::SignedGreaterThanOrEqual => ConditionCode::Sge,
+        IntCC::UnsignedLessThan => ConditionCode::Ult,
+        IntCC::UnsignedGreaterThanOrEqual => ConditionCode::Uge,
+        IntCC::UnsignedGreaterThan => ConditionCode::Ugt,
+        IntCC::UnsignedLessThanOrEqual => ConditionCode::Ule,
+        IntCC::Overflow => ConditionCode::Of,
+        IntCC::NotOverflow => ConditionCode::Nof,
+    }
+}
+
+fn get_immediate(dfg: &DataFlowGraph, inst: Inst, i: usize) -> Part<ValueOrInst> {
+    return match dfg[inst] {
+        InstructionData::BinaryImm { imm, .. } if i == 0 => imm.into(),
+        InstructionData::BranchIcmp { cond, .. } if i == 0 => intcc_to_peepmatic(cond).into(),
+        InstructionData::BranchInt { cond, ..
} if i == 0 => intcc_to_peepmatic(cond).into(), + InstructionData::IntCompare { cond, .. } if i == 0 => intcc_to_peepmatic(cond).into(), + InstructionData::IntCompareImm { cond, .. } if i == 0 => intcc_to_peepmatic(cond).into(), + InstructionData::IntCompareImm { imm, .. } if i == 1 => imm.into(), + InstructionData::IntCond { cond, .. } if i == 0 => intcc_to_peepmatic(cond).into(), + InstructionData::IntCondTrap { cond, .. } if i == 0 => intcc_to_peepmatic(cond).into(), + InstructionData::IntSelect { cond, .. } if i == 0 => intcc_to_peepmatic(cond).into(), + InstructionData::UnaryBool { imm, .. } if i == 0 => { + Constant::Bool(imm, BitWidth::Polymorphic).into() + } + InstructionData::UnaryImm { imm, .. } if i == 0 => imm.into(), + ref otherwise => unsupported(otherwise), + }; + + #[inline(never)] + #[cold] + fn unsupported(data: &InstructionData) -> ! { + panic!("unsupported instruction data: {:?}", data) + } +} + +fn get_argument(dfg: &DataFlowGraph, inst: Inst, i: usize) -> Option { + dfg.inst_args(inst).get(i).copied() +} + +fn peepmatic_ty_to_ir_ty(ty: Type, dfg: &DataFlowGraph, root: Inst) -> types::Type { + match (ty.kind, bit_width(dfg, ty.bit_width, root)) { + (Kind::Int, 8) => types::I8, + (Kind::Int, 16) => types::I16, + (Kind::Int, 32) => types::I32, + (Kind::Int, 64) => types::I64, + (Kind::Int, 128) => types::I128, + (Kind::Bool, 1) => types::B1, + (Kind::Bool, 8) => types::I8, + (Kind::Bool, 16) => types::I16, + (Kind::Bool, 32) => types::I32, + (Kind::Bool, 64) => types::I64, + (Kind::Bool, 128) => types::I128, + _ => unreachable!(), + } +} + +// NB: the unsafe contract we must uphold here is that our implementation of +// `instruction_result_bit_width` must always return a valid, non-zero bit +// width. 
+unsafe impl<'a, 'b> InstructionSet<'b> for &'a dyn TargetIsa { + type Context = FuncCursor<'b>; + + type Instruction = ValueOrInst; + + fn replace_instruction( + &self, + pos: &mut FuncCursor<'b>, + old: ValueOrInst, + new: Part, + ) -> ValueOrInst { + log::trace!("replace {:?} with {:?}", old, new); + let old_inst = old.resolve_inst(&pos.func.dfg).unwrap(); + + // Try to convert `new` to an instruction, because we prefer replacing + // an old instruction with a new one wholesale. However, if the + // replacement cannot be converted to an instruction (e.g. the + // right-hand side is a block/function parameter value) then we change + // the old instruction's result to an alias of the new value. + let new_inst = match new { + Part::Instruction(ValueOrInst::Inst(inst)) => Some(inst), + Part::Instruction(ValueOrInst::Value(_)) => { + // Do not try and follow the value definition. If we transplant + // this value's instruction, and there are other uses of this + // value, then we could mess up ordering between instructions. + None + } + Part::Constant(c) => { + let v = const_to_value(pos.ins(), c, old_inst); + let inst = pos.func.dfg.value_def(v).unwrap_inst(); + Some(inst) + } + Part::ConditionCode(_) => None, + }; + + match new_inst { + Some(new_inst) => { + pos.func.transplant_inst(old_inst, new_inst); + debug_assert_eq!(pos.current_inst(), Some(old_inst)); + old_inst.into() + } + None => { + let new_value = part_to_value(pos, old_inst, new).unwrap(); + + let old_results = pos.func.dfg.detach_results(old_inst); + let old_results = old_results.as_slice(&pos.func.dfg.value_lists); + assert_eq!(old_results.len(), 1); + let old_value = old_results[0]; + + pos.func.dfg.change_to_alias(old_value, new_value); + pos.func.dfg.replace(old_inst).nop(); + + new_value.into() + } + } + } + + fn get_part_at_path( + &self, + pos: &mut FuncCursor<'b>, + root: ValueOrInst, + path: Path, + ) -> Option> { + // The root is path [0]. 
+ debug_assert!(!path.0.is_empty()); + debug_assert_eq!(path.0[0], 0); + + let mut part = Part::Instruction(root); + for p in path.0[1..].iter().copied() { + let inst = part.as_instruction()?.resolve_inst(&pos.func.dfg)?; + let operator = pos.func.dfg[inst].opcode().to_peepmatic_operator()?; + + if p < operator.immediates_arity() { + part = get_immediate(&pos.func.dfg, inst, p as usize); + continue; + } + + let arg = p - operator.immediates_arity(); + let arg = arg as usize; + let value = get_argument(&pos.func.dfg, inst, arg)?; + part = Part::Instruction(value.into()); + } + + log::trace!("get_part_at_path({:?}) = {:?}", path, part); + Some(part) + } + + fn operator(&self, pos: &mut FuncCursor<'b>, value_or_inst: ValueOrInst) -> Option { + let inst = value_or_inst.resolve_inst(&pos.func.dfg)?; + pos.func.dfg[inst].opcode().to_peepmatic_operator() + } + + fn make_inst_1( + &self, + pos: &mut FuncCursor<'b>, + root: ValueOrInst, + operator: Operator, + r#type: Type, + a: Part, + ) -> ValueOrInst { + log::trace!("make_inst_1: {:?}({:?})", operator, a); + + let root = root.resolve_inst(&pos.func.dfg).unwrap(); + match operator { + Operator::AdjustSpDown => { + let a = part_to_value(pos, root, a).unwrap(); + pos.ins().adjust_sp_down(a).into() + } + Operator::AdjustSpDownImm => { + let c = a.unwrap_constant(); + let imm = Imm64::try_from(c).unwrap(); + pos.ins().adjust_sp_down_imm(imm).into() + } + Operator::Bconst => { + let c = a.unwrap_constant(); + let val = const_to_value(pos.ins(), c, root); + pos.func.dfg.value_def(val).unwrap_inst().into() + } + Operator::Bint => { + let a = part_to_value(pos, root, a).unwrap(); + let ty = peepmatic_ty_to_ir_ty(r#type, &pos.func.dfg, root); + let val = pos.ins().bint(ty, a); + pos.func.dfg.value_def(val).unwrap_inst().into() + } + Operator::Brnz => { + let a = part_to_value(pos, root, a).unwrap(); + + // NB: branching instructions must be the root of an + // optimization's right-hand side, so we get the destination + // block 
and arguments from the left-hand side's root. Peepmatic
+                // doesn't currently represent labels or varargs.
+                let block = pos.func.dfg[root].branch_destination().unwrap();
+                let args = pos.func.dfg.inst_args(root)[1..].to_vec();
+
+                pos.ins().brnz(a, block, &args).into()
+            }
+            Operator::Brz => {
+                let a = part_to_value(pos, root, a).unwrap();
+
+                // See the comment in the `Operator::Brnz` match arm.
+                let block = pos.func.dfg[root].branch_destination().unwrap();
+                let args = pos.func.dfg.inst_args(root)[1..].to_vec();
+
+                pos.ins().brz(a, block, &args).into()
+            }
+            Operator::Iconst => {
+                let a = a.unwrap_constant();
+                let val = const_to_value(pos.ins(), a, root);
+                pos.func.dfg.value_def(val).unwrap_inst().into()
+            }
+            Operator::Ireduce => {
+                let a = part_to_value(pos, root, a).unwrap();
+                let ty = peepmatic_ty_to_ir_ty(r#type, &pos.func.dfg, root);
+                let val = pos.ins().ireduce(ty, a);
+                pos.func.dfg.value_def(val).unwrap_inst().into()
+            }
+            Operator::Sextend => {
+                let a = part_to_value(pos, root, a).unwrap();
+                let ty = peepmatic_ty_to_ir_ty(r#type, &pos.func.dfg, root);
+                let val = pos.ins().sextend(ty, a);
+                pos.func.dfg.value_def(val).unwrap_inst().into()
+            }
+            Operator::Trapnz => {
+                let a = part_to_value(pos, root, a).unwrap();
+
+                // NB: similar to branching instructions (see comment in the
+                // `Operator::Brnz` match arm) trapping instructions must be the
+                // root of an optimization's right-hand side, and we get the
+                // trap code from the root of the left-hand side. Peepmatic
+                // doesn't currently represent trap codes.
+                let code = pos.func.dfg[root].trap_code().unwrap();
+
+                pos.ins().trapnz(a, code).into()
+            }
+            Operator::Trapz => {
+                let a = part_to_value(pos, root, a).unwrap();
+                // See comment in the `Operator::Trapnz` match arm.
+ let code = pos.func.dfg[root].trap_code().unwrap(); + pos.ins().trapz(a, code).into() + } + Operator::Uextend => { + let a = part_to_value(pos, root, a).unwrap(); + let ty = peepmatic_ty_to_ir_ty(r#type, &pos.func.dfg, root); + let val = pos.ins().uextend(ty, a); + pos.func.dfg.value_def(val).unwrap_inst().into() + } + _ => unreachable!(), + } + } + + fn make_inst_2( + &self, + pos: &mut FuncCursor<'b>, + root: ValueOrInst, + operator: Operator, + _: Type, + a: Part, + b: Part, + ) -> ValueOrInst { + log::trace!("make_inst_2: {:?}({:?}, {:?})", operator, a, b); + + let root = root.resolve_inst(&pos.func.dfg).unwrap(); + match operator { + Operator::Band => { + let a = part_to_value(pos, root, a).unwrap(); + let b = part_to_value(pos, root, b).unwrap(); + let val = pos.ins().band(a, b); + pos.func.dfg.value_def(val).unwrap_inst().into() + } + Operator::BandImm => { + let a = part_to_imm64(pos, a); + let b = part_to_value(pos, root, b).unwrap(); + let val = pos.ins().band_imm(b, a); + pos.func.dfg.value_def(val).unwrap_inst().into() + } + Operator::Bor => { + let a = part_to_value(pos, root, a).unwrap(); + let b = part_to_value(pos, root, b).unwrap(); + let val = pos.ins().bor(a, b); + pos.func.dfg.value_def(val).unwrap_inst().into() + } + Operator::BorImm => { + let a = part_to_imm64(pos, a); + let b = part_to_value(pos, root, b).unwrap(); + let val = pos.ins().bor_imm(b, a); + pos.func.dfg.value_def(val).unwrap_inst().into() + } + Operator::Bxor => { + let a = part_to_value(pos, root, a).unwrap(); + let b = part_to_value(pos, root, b).unwrap(); + let val = pos.ins().bxor(a, b); + pos.func.dfg.value_def(val).unwrap_inst().into() + } + Operator::BxorImm => { + let a = part_to_imm64(pos, a); + let b = part_to_value(pos, root, b).unwrap(); + let val = pos.ins().bxor_imm(b, a); + pos.func.dfg.value_def(val).unwrap_inst().into() + } + Operator::Iadd => { + let a = part_to_value(pos, root, a).unwrap(); + let b = part_to_value(pos, root, b).unwrap(); + let val = 
pos.ins().iadd(a, b); + pos.func.dfg.value_def(val).unwrap_inst().into() + } + Operator::IaddImm => { + let a = part_to_imm64(pos, a); + let b = part_to_value(pos, root, b).unwrap(); + let val = pos.ins().iadd_imm(b, a); + pos.func.dfg.value_def(val).unwrap_inst().into() + } + Operator::Ifcmp => { + let a = part_to_value(pos, root, a).unwrap(); + let b = part_to_value(pos, root, b).unwrap(); + let val = pos.ins().ifcmp(a, b); + pos.func.dfg.value_def(val).unwrap_inst().into() + } + Operator::IfcmpImm => { + let a = part_to_imm64(pos, a); + let b = part_to_value(pos, root, b).unwrap(); + let val = pos.ins().ifcmp_imm(b, a); + pos.func.dfg.value_def(val).unwrap_inst().into() + } + Operator::Imul => { + let a = part_to_value(pos, root, a).unwrap(); + let b = part_to_value(pos, root, b).unwrap(); + let val = pos.ins().imul(a, b); + pos.func.dfg.value_def(val).unwrap_inst().into() + } + Operator::ImulImm => { + let a = part_to_imm64(pos, a); + let b = part_to_value(pos, root, b).unwrap(); + let val = pos.ins().imul_imm(b, a); + pos.func.dfg.value_def(val).unwrap_inst().into() + } + Operator::IrsubImm => { + let a = part_to_imm64(pos, a); + let b = part_to_value(pos, root, b).unwrap(); + let val = pos.ins().irsub_imm(b, a); + pos.func.dfg.value_def(val).unwrap_inst().into() + } + Operator::Ishl => { + let a = part_to_value(pos, root, a).unwrap(); + let b = part_to_value(pos, root, b).unwrap(); + let val = pos.ins().ishl(a, b); + pos.func.dfg.value_def(val).unwrap_inst().into() + } + Operator::IshlImm => { + let a = part_to_imm64(pos, a); + let b = part_to_value(pos, root, b).unwrap(); + let val = pos.ins().ishl_imm(b, a); + pos.func.dfg.value_def(val).unwrap_inst().into() + } + Operator::Isub => { + let a = part_to_value(pos, root, a).unwrap(); + let b = part_to_value(pos, root, b).unwrap(); + let val = pos.ins().isub(a, b); + pos.func.dfg.value_def(val).unwrap_inst().into() + } + Operator::Rotl => { + let a = part_to_value(pos, root, a).unwrap(); + let b = 
part_to_value(pos, root, b).unwrap(); + let val = pos.ins().rotl(a, b); + pos.func.dfg.value_def(val).unwrap_inst().into() + } + Operator::RotlImm => { + let a = part_to_imm64(pos, a); + let b = part_to_value(pos, root, b).unwrap(); + let val = pos.ins().rotl_imm(b, a); + pos.func.dfg.value_def(val).unwrap_inst().into() + } + Operator::Rotr => { + let a = part_to_value(pos, root, a).unwrap(); + let b = part_to_value(pos, root, b).unwrap(); + let val = pos.ins().rotr(a, b); + pos.func.dfg.value_def(val).unwrap_inst().into() + } + Operator::RotrImm => { + let a = part_to_imm64(pos, a); + let b = part_to_value(pos, root, b).unwrap(); + let val = pos.ins().rotr_imm(b, a); + pos.func.dfg.value_def(val).unwrap_inst().into() + } + Operator::Sdiv => { + let a = part_to_value(pos, root, a).unwrap(); + let b = part_to_value(pos, root, b).unwrap(); + let val = pos.ins().sdiv(a, b); + pos.func.dfg.value_def(val).unwrap_inst().into() + } + Operator::SdivImm => { + let a = part_to_imm64(pos, a); + let b = part_to_value(pos, root, b).unwrap(); + let val = pos.ins().sdiv_imm(b, a); + pos.func.dfg.value_def(val).unwrap_inst().into() + } + Operator::Srem => { + let a = part_to_value(pos, root, a).unwrap(); + let b = part_to_value(pos, root, b).unwrap(); + let val = pos.ins().srem(a, b); + pos.func.dfg.value_def(val).unwrap_inst().into() + } + Operator::SremImm => { + let a = part_to_imm64(pos, a); + let b = part_to_value(pos, root, b).unwrap(); + let val = pos.ins().srem_imm(b, a); + pos.func.dfg.value_def(val).unwrap_inst().into() + } + Operator::Sshr => { + let a = part_to_value(pos, root, a).unwrap(); + let b = part_to_value(pos, root, b).unwrap(); + let val = pos.ins().sshr(a, b); + pos.func.dfg.value_def(val).unwrap_inst().into() + } + Operator::SshrImm => { + let a = part_to_imm64(pos, a); + let b = part_to_value(pos, root, b).unwrap(); + let val = pos.ins().sshr_imm(b, a); + pos.func.dfg.value_def(val).unwrap_inst().into() + } + Operator::Udiv => { + let a = 
part_to_value(pos, root, a).unwrap(); + let b = part_to_value(pos, root, b).unwrap(); + let val = pos.ins().udiv(a, b); + pos.func.dfg.value_def(val).unwrap_inst().into() + } + Operator::UdivImm => { + let a = part_to_imm64(pos, a); + let b = part_to_value(pos, root, b).unwrap(); + let val = pos.ins().udiv_imm(b, a); + pos.func.dfg.value_def(val).unwrap_inst().into() + } + Operator::Urem => { + let a = part_to_value(pos, root, a).unwrap(); + let b = part_to_value(pos, root, b).unwrap(); + let val = pos.ins().urem(a, b); + pos.func.dfg.value_def(val).unwrap_inst().into() + } + Operator::UremImm => { + let a = part_to_imm64(pos, a); + let b = part_to_value(pos, root, b).unwrap(); + let val = pos.ins().urem_imm(b, a); + pos.func.dfg.value_def(val).unwrap_inst().into() + } + Operator::Ushr => { + let a = part_to_value(pos, root, a).unwrap(); + let b = part_to_value(pos, root, b).unwrap(); + let val = pos.ins().ushr(a, b); + pos.func.dfg.value_def(val).unwrap_inst().into() + } + Operator::UshrImm => { + let a = part_to_imm64(pos, a); + let b = part_to_value(pos, root, b).unwrap(); + let val = pos.ins().ushr_imm(b, a); + pos.func.dfg.value_def(val).unwrap_inst().into() + } + _ => unreachable!(), + } + } + + fn make_inst_3( + &self, + pos: &mut FuncCursor<'b>, + root: ValueOrInst, + operator: Operator, + _: Type, + a: Part, + b: Part, + c: Part, + ) -> ValueOrInst { + log::trace!("make_inst_3: {:?}({:?}, {:?}, {:?})", operator, a, b, c); + + let root = root.resolve_inst(&pos.func.dfg).unwrap(); + match operator { + Operator::Icmp => { + let cond = a.unwrap_condition_code(); + let cond = peepmatic_to_intcc(cond); + let b = part_to_value(pos, root, b).unwrap(); + let c = part_to_value(pos, root, c).unwrap(); + let val = pos.ins().icmp(cond, b, c); + pos.func.dfg.value_def(val).unwrap_inst().into() + } + Operator::IcmpImm => { + let cond = a.unwrap_condition_code(); + let cond = peepmatic_to_intcc(cond); + let imm = part_to_imm64(pos, b); + let c = part_to_value(pos, root, 
c).unwrap(); + let val = pos.ins().icmp_imm(cond, c, imm); + pos.func.dfg.value_def(val).unwrap_inst().into() + } + Operator::Select => { + let a = part_to_value(pos, root, a).unwrap(); + let b = part_to_value(pos, root, b).unwrap(); + let c = part_to_value(pos, root, c).unwrap(); + let val = pos.ins().select(a, b, c); + pos.func.dfg.value_def(val).unwrap_inst().into() + } + _ => unreachable!(), + } + } + + fn instruction_to_constant( + &self, + pos: &mut FuncCursor<'b>, + value_or_inst: ValueOrInst, + ) -> Option { + value_or_inst.to_constant(pos) + } + + fn instruction_result_bit_width( + &self, + pos: &mut FuncCursor<'b>, + value_or_inst: ValueOrInst, + ) -> u8 { + value_or_inst.result_bit_width(&pos.func.dfg) + } + + fn native_word_size_in_bits(&self, _pos: &mut FuncCursor<'b>) -> u8 { + self.pointer_bits() + } +} diff --git a/cranelift/codegen/src/preopt.peepmatic b/cranelift/codegen/src/preopt.peepmatic new file mode 100644 index 0000000000..604460dd57 --- /dev/null +++ b/cranelift/codegen/src/preopt.peepmatic @@ -0,0 +1,193 @@ +;; Apply basic simplifications. +;; +;; This folds constants with arithmetic to form `_imm` instructions, and other +;; minor simplifications. +;; +;; Doesn't apply some simplifications if the native word width (in bytes) is +;; smaller than the controlling type's width of the instruction. This would +;; result in an illegal instruction that would likely be expanded back into an +;; instruction on smaller types with the same initial opcode, creating +;; unnecessary churn. + +;; Binary instructions whose second argument is constant. 
+(=> (when (iadd $x $C) + (fits-in-native-word $C)) + (iadd_imm $C $x)) +(=> (when (imul $x $C) + (fits-in-native-word $C)) + (imul_imm $C $x)) +(=> (when (sdiv $x $C) + (fits-in-native-word $C)) + (sdiv_imm $C $x)) +(=> (when (udiv $x $C) + (fits-in-native-word $C)) + (udiv_imm $C $x)) +(=> (when (srem $x $C) + (fits-in-native-word $C)) + (srem_imm $C $x)) +(=> (when (urem $x $C) + (fits-in-native-word $C)) + (urem_imm $C $x)) +(=> (when (band $x $C) + (fits-in-native-word $C)) + (band_imm $C $x)) +(=> (when (bor $x $C) + (fits-in-native-word $C)) + (bor_imm $C $x)) +(=> (when (bxor $x $C) + (fits-in-native-word $C)) + (bxor_imm $C $x)) +(=> (when (rotl $x $C) + (fits-in-native-word $C)) + (rotl_imm $C $x)) +(=> (when (rotr $x $C) + (fits-in-native-word $C)) + (rotr_imm $C $x)) +(=> (when (ishl $x $C) + (fits-in-native-word $C)) + (ishl_imm $C $x)) +(=> (when (ushr $x $C) + (fits-in-native-word $C)) + (ushr_imm $C $x)) +(=> (when (sshr $x $C) + (fits-in-native-word $C)) + (sshr_imm $C $x)) +(=> (when (isub $x $C) + (fits-in-native-word $C)) + (iadd_imm $(neg $C) $x)) +(=> (when (ifcmp $x $C) + (fits-in-native-word $C)) + (ifcmp_imm $C $x)) +(=> (when (icmp $cond $x $C) + (fits-in-native-word $C)) + (icmp_imm $cond $C $x)) + +;; Binary instructions whose first operand is constant. +(=> (when (iadd $C $x) + (fits-in-native-word $C)) + (iadd_imm $C $x)) +(=> (when (imul $C $x) + (fits-in-native-word $C)) + (imul_imm $C $x)) +(=> (when (band $C $x) + (fits-in-native-word $C)) + (band_imm $C $x)) +(=> (when (bor $C $x) + (fits-in-native-word $C)) + (bor_imm $C $x)) +(=> (when (bxor $C $x) + (fits-in-native-word $C)) + (bxor_imm $C $x)) +(=> (when (isub $C $x) + (fits-in-native-word $C)) + (irsub_imm $C $x)) + +;; Unary instructions whose operand is constant. +(=> (adjust_sp_down $C) (adjust_sp_down_imm $C)) + +;; Fold `(binop_imm $C1 (binop_imm $C2 $x))` into `(binop_imm $(binop $C2 $C1) $x)`. 
+(=> (iadd_imm $C1 (iadd_imm $C2 $x)) (iadd_imm $(iadd $C1 $C2) $x)) +(=> (imul_imm $C1 (imul_imm $C2 $x)) (imul_imm $(imul $C1 $C2) $x)) +(=> (bor_imm $C1 (bor_imm $C2 $x)) (bor_imm $(bor $C1 $C2) $x)) +(=> (band_imm $C1 (band_imm $C2 $x)) (band_imm $(band $C1 $C2) $x)) +(=> (bxor_imm $C1 (bxor_imm $C2 $x)) (bxor_imm $(bxor $C1 $C2) $x)) + +;; Remove operations that are no-ops. +(=> (iadd_imm 0 $x) $x) +(=> (imul_imm 1 $x) $x) +(=> (sdiv_imm 1 $x) $x) +(=> (udiv_imm 1 $x) $x) +(=> (bor_imm 0 $x) $x) +(=> (band_imm -1 $x) $x) +(=> (bxor_imm 0 $x) $x) +(=> (rotl_imm 0 $x) $x) +(=> (rotr_imm 0 $x) $x) +(=> (ishl_imm 0 $x) $x) +(=> (ushr_imm 0 $x) $x) +(=> (sshr_imm 0 $x) $x) + +;; Replace with zero. +(=> (imul_imm 0 $x) 0) +(=> (band_imm 0 $x) 0) + +;; Replace with negative 1. +(=> (bor_imm -1 $x) -1) + +;; Transform `[(x << N) >> N]` into a (un)signed-extending move. +;; +;; i16 -> i8 -> i16 +(=> (when (ushr_imm 8 (ishl_imm 8 $x)) + (bit-width $x 16)) + (uextend{i16} (ireduce{i8} $x))) +(=> (when (sshr_imm 8 (ishl_imm 8 $x)) + (bit-width $x 16)) + (sextend{i16} (ireduce{i8} $x))) +;; i32 -> i8 -> i32 +(=> (when (ushr_imm 24 (ishl_imm 24 $x)) + (bit-width $x 32)) + (uextend{i32} (ireduce{i8} $x))) +(=> (when (sshr_imm 24 (ishl_imm 24 $x)) + (bit-width $x 32)) + (sextend{i32} (ireduce{i8} $x))) +;; i32 -> i16 -> i32 +(=> (when (ushr_imm 16 (ishl_imm 16 $x)) + (bit-width $x 32)) + (uextend{i32} (ireduce{i16} $x))) +(=> (when (sshr_imm 16 (ishl_imm 16 $x)) + (bit-width $x 32)) + (sextend{i32} (ireduce{i16} $x))) +;; i64 -> i8 -> i64 +(=> (when (ushr_imm 56 (ishl_imm 56 $x)) + (bit-width $x 64)) + (uextend{i64} (ireduce{i8} $x))) +(=> (when (sshr_imm 56 (ishl_imm 56 $x)) + (bit-width $x 64)) + (sextend{i64} (ireduce{i8} $x))) +;; i64 -> i16 -> i64 +(=> (when (ushr_imm 48 (ishl_imm 48 $x)) + (bit-width $x 64)) + (uextend{i64} (ireduce{i16} $x))) +(=> (when (sshr_imm 48 (ishl_imm 48 $x)) + (bit-width $x 64)) + (sextend{i64} (ireduce{i16} $x))) +;; i64 -> i32 -> i64 +(=> 
(when (ushr_imm 32 (ishl_imm 32 $x)) + (bit-width $x 64)) + (uextend{i64} (ireduce{i32} $x))) +(=> (when (sshr_imm 32 (ishl_imm 32 $x)) + (bit-width $x 64)) + (sextend{i64} (ireduce{i32} $x))) + +;; Fold away redundant `bint` instructions that accept both integer and boolean +;; arguments. +(=> (select (bint $x) $y $z) (select $x $y $z)) +(=> (brz (bint $x)) (brz $x)) +(=> (brnz (bint $x)) (brnz $x)) +(=> (trapz (bint $x)) (trapz $x)) +(=> (trapnz (bint $x)) (trapnz $x)) + +;; Fold comparisons into branch operations when possible. +;; +;; This matches against operations which compare against zero, then use the +;; result in a `brz` or `brnz` branch. It folds those two operations into a +;; single `brz` or `brnz`. +(=> (brnz (icmp_imm ne 0 $x)) (brnz $x)) +(=> (brz (icmp_imm ne 0 $x)) (brz $x)) +(=> (brnz (icmp_imm eq 0 $x)) (brz $x)) +(=> (brz (icmp_imm eq 0 $x)) (brnz $x)) + +;; Division and remainder by constants. +;; +;; TODO: this section is incomplete, and a bunch of related optimizations are +;; still hand-coded in `simple_preopt.rs`. + +;; (Division by one is handled above.) + +;; Remainder by one is zero. +(=> (urem_imm 1 $x) 0) +(=> (srem_imm 1 $x) 0) + +;; Division by a power of two -> shift right. 
+(=> (when (udiv_imm $C $x) + (is-power-of-two $C)) + (ushr_imm $(log2 $C) $x)) diff --git a/cranelift/codegen/src/preopt.serialized b/cranelift/codegen/src/preopt.serialized new file mode 100644 index 0000000000..f016c6d32d Binary files /dev/null and b/cranelift/codegen/src/preopt.serialized differ diff --git a/cranelift/codegen/src/simple_preopt.rs b/cranelift/codegen/src/simple_preopt.rs index 5090246cf1..2f47c7d91b 100644 --- a/cranelift/codegen/src/simple_preopt.rs +++ b/cranelift/codegen/src/simple_preopt.rs @@ -10,10 +10,8 @@ use crate::divconst_magic_numbers::{MS32, MS64, MU32, MU64}; use crate::flowgraph::ControlFlowGraph; use crate::ir::{ condcodes::{CondCode, IntCC}, - dfg::ValueDef, - immediates, - instructions::{Opcode, ValueList}, - types::{I16, I32, I64, I8}, + instructions::Opcode, + types::{I32, I64}, Block, DataFlowGraph, Function, Inst, InstBuilder, InstructionData, Type, Value, }; use crate::isa::TargetIsa; @@ -468,340 +466,6 @@ fn do_divrem_transformation(divrem_info: &DivRemByConstInfo, pos: &mut FuncCurso } } -#[inline] -fn resolve_imm64_value(dfg: &DataFlowGraph, value: Value) -> Option { - if let ValueDef::Result(candidate_inst, _) = dfg.value_def(value) { - if let InstructionData::UnaryImm { - opcode: Opcode::Iconst, - imm, - } = dfg[candidate_inst] - { - return Some(imm); - } - } - None -} - -/// Try to transform [(x << N) >> N] into a (un)signed-extending move. -/// Returns true if the final instruction has been converted to such a move. 
-fn try_fold_extended_move( - pos: &mut FuncCursor, - inst: Inst, - opcode: Opcode, - arg: Value, - imm: immediates::Imm64, -) -> bool { - if let ValueDef::Result(arg_inst, _) = pos.func.dfg.value_def(arg) { - if let InstructionData::BinaryImm { - opcode: Opcode::IshlImm, - arg: prev_arg, - imm: prev_imm, - } = &pos.func.dfg[arg_inst] - { - if imm != *prev_imm { - return false; - } - - let dest_ty = pos.func.dfg.ctrl_typevar(inst); - if dest_ty != pos.func.dfg.ctrl_typevar(arg_inst) || !dest_ty.is_int() { - return false; - } - - let imm_bits: i64 = imm.into(); - let ireduce_ty = match (dest_ty.lane_bits() as i64).wrapping_sub(imm_bits) { - 8 => I8, - 16 => I16, - 32 => I32, - _ => return false, - }; - let ireduce_ty = ireduce_ty.by(dest_ty.lane_count()).unwrap(); - - // This becomes a no-op, since ireduce_ty has a smaller lane width than - // the argument type (also the destination type). - let arg = *prev_arg; - let narrower_arg = pos.ins().ireduce(ireduce_ty, arg); - - if opcode == Opcode::UshrImm { - pos.func.dfg.replace(inst).uextend(dest_ty, narrower_arg); - } else { - pos.func.dfg.replace(inst).sextend(dest_ty, narrower_arg); - } - return true; - } - } - false -} - -/// Apply basic simplifications. -/// -/// This folds constants with arithmetic to form `_imm` instructions, and other minor -/// simplifications. -/// -/// Doesn't apply some simplifications if the native word width (in bytes) is smaller than the -/// controlling type's width of the instruction. This would result in an illegal instruction that -/// would likely be expanded back into an instruction on smaller types with the same initial -/// opcode, creating unnecessary churn. 
-fn simplify(pos: &mut FuncCursor, inst: Inst, native_word_width: u32) { - match pos.func.dfg[inst] { - InstructionData::Binary { opcode, args } => { - if let Some(mut imm) = resolve_imm64_value(&pos.func.dfg, args[1]) { - let new_opcode = match opcode { - Opcode::Iadd => Opcode::IaddImm, - Opcode::Imul => Opcode::ImulImm, - Opcode::Sdiv => Opcode::SdivImm, - Opcode::Udiv => Opcode::UdivImm, - Opcode::Srem => Opcode::SremImm, - Opcode::Urem => Opcode::UremImm, - Opcode::Band => Opcode::BandImm, - Opcode::Bor => Opcode::BorImm, - Opcode::Bxor => Opcode::BxorImm, - Opcode::Rotl => Opcode::RotlImm, - Opcode::Rotr => Opcode::RotrImm, - Opcode::Ishl => Opcode::IshlImm, - Opcode::Ushr => Opcode::UshrImm, - Opcode::Sshr => Opcode::SshrImm, - Opcode::Isub => { - imm = imm.wrapping_neg(); - Opcode::IaddImm - } - Opcode::Ifcmp => Opcode::IfcmpImm, - _ => return, - }; - let ty = pos.func.dfg.ctrl_typevar(inst); - if ty.bytes() <= native_word_width { - pos.func - .dfg - .replace(inst) - .BinaryImm(new_opcode, ty, imm, args[0]); - - // Repeat for BinaryImm simplification. - simplify(pos, inst, native_word_width); - } - } else if let Some(imm) = resolve_imm64_value(&pos.func.dfg, args[0]) { - let new_opcode = match opcode { - Opcode::Iadd => Opcode::IaddImm, - Opcode::Imul => Opcode::ImulImm, - Opcode::Band => Opcode::BandImm, - Opcode::Bor => Opcode::BorImm, - Opcode::Bxor => Opcode::BxorImm, - Opcode::Isub => Opcode::IrsubImm, - _ => return, - }; - let ty = pos.func.dfg.ctrl_typevar(inst); - if ty.bytes() <= native_word_width { - pos.func - .dfg - .replace(inst) - .BinaryImm(new_opcode, ty, imm, args[1]); - } - } - } - - InstructionData::Unary { opcode, arg } => { - if let Opcode::AdjustSpDown = opcode { - if let Some(imm) = resolve_imm64_value(&pos.func.dfg, arg) { - // Note this works for both positive and negative immediate values. 
- pos.func.dfg.replace(inst).adjust_sp_down_imm(imm); - } - } - } - - InstructionData::BinaryImm { opcode, arg, imm } => { - let ty = pos.func.dfg.ctrl_typevar(inst); - - let mut arg = arg; - let mut imm = imm; - match opcode { - Opcode::IaddImm - | Opcode::ImulImm - | Opcode::BorImm - | Opcode::BandImm - | Opcode::BxorImm => { - // Fold binary_op(C2, binary_op(C1, x)) into binary_op(binary_op(C1, C2), x) - if let ValueDef::Result(arg_inst, _) = pos.func.dfg.value_def(arg) { - if let InstructionData::BinaryImm { - opcode: prev_opcode, - arg: prev_arg, - imm: prev_imm, - } = &pos.func.dfg[arg_inst] - { - if opcode == *prev_opcode && ty == pos.func.dfg.ctrl_typevar(arg_inst) { - let lhs: i64 = imm.into(); - let rhs: i64 = (*prev_imm).into(); - let new_imm = match opcode { - Opcode::BorImm => lhs | rhs, - Opcode::BandImm => lhs & rhs, - Opcode::BxorImm => lhs ^ rhs, - Opcode::IaddImm => lhs.wrapping_add(rhs), - Opcode::ImulImm => lhs.wrapping_mul(rhs), - _ => panic!("can't happen"), - }; - let new_imm = immediates::Imm64::from(new_imm); - let new_arg = *prev_arg; - pos.func - .dfg - .replace(inst) - .BinaryImm(opcode, ty, new_imm, new_arg); - imm = new_imm; - arg = new_arg; - } - } - } - } - - Opcode::UshrImm | Opcode::SshrImm => { - if pos.func.dfg.ctrl_typevar(inst).bytes() <= native_word_width - && try_fold_extended_move(pos, inst, opcode, arg, imm) - { - return; - } - } - - _ => {} - }; - - // Replace operations that are no-ops. - match (opcode, imm.into()) { - (Opcode::IaddImm, 0) - | (Opcode::ImulImm, 1) - | (Opcode::SdivImm, 1) - | (Opcode::UdivImm, 1) - | (Opcode::BorImm, 0) - | (Opcode::BandImm, -1) - | (Opcode::BxorImm, 0) - | (Opcode::RotlImm, 0) - | (Opcode::RotrImm, 0) - | (Opcode::IshlImm, 0) - | (Opcode::UshrImm, 0) - | (Opcode::SshrImm, 0) => { - // Alias the result value with the original argument. - replace_single_result_with_alias(&mut pos.func.dfg, inst, arg); - } - (Opcode::ImulImm, 0) | (Opcode::BandImm, 0) => { - // Replace by zero. 
- pos.func.dfg.replace(inst).iconst(ty, 0); - } - (Opcode::BorImm, -1) => { - // Replace by minus one. - pos.func.dfg.replace(inst).iconst(ty, -1); - } - _ => {} - } - } - - InstructionData::IntCompare { opcode, cond, args } => { - debug_assert_eq!(opcode, Opcode::Icmp); - if let Some(imm) = resolve_imm64_value(&pos.func.dfg, args[1]) { - if pos.func.dfg.ctrl_typevar(inst).bytes() <= native_word_width { - pos.func.dfg.replace(inst).icmp_imm(cond, args[0], imm); - } - } - } - - InstructionData::CondTrap { .. } - | InstructionData::Branch { .. } - | InstructionData::Ternary { - opcode: Opcode::Select, - .. - } => { - // Fold away a redundant `bint`. - let condition_def = { - let args = pos.func.dfg.inst_args(inst); - pos.func.dfg.value_def(args[0]) - }; - if let ValueDef::Result(def_inst, _) = condition_def { - if let InstructionData::Unary { - opcode: Opcode::Bint, - arg: bool_val, - } = pos.func.dfg[def_inst] - { - let args = pos.func.dfg.inst_args_mut(inst); - args[0] = bool_val; - } - } - } - - _ => {} - } -} - -struct BranchOptInfo { - br_inst: Inst, - cmp_arg: Value, - args: ValueList, - new_opcode: Opcode, -} - -/// Fold comparisons into branch operations when possible. -/// -/// This matches against operations which compare against zero, then use the -/// result in a `brz` or `brnz` branch. It folds those two operations into a -/// single `brz` or `brnz`. -fn branch_opt(pos: &mut FuncCursor, inst: Inst) { - let mut info = if let InstructionData::Branch { - opcode: br_opcode, - args: ref br_args, - .. 
- } = pos.func.dfg[inst] - { - let first_arg = { - let args = pos.func.dfg.inst_args(inst); - args[0] - }; - - let icmp_inst = if let ValueDef::Result(icmp_inst, _) = pos.func.dfg.value_def(first_arg) { - icmp_inst - } else { - return; - }; - - if let InstructionData::IntCompareImm { - opcode: Opcode::IcmpImm, - arg: cmp_arg, - cond: cmp_cond, - imm: cmp_imm, - } = pos.func.dfg[icmp_inst] - { - let cmp_imm: i64 = cmp_imm.into(); - if cmp_imm != 0 { - return; - } - - // icmp_imm returns non-zero when the comparison is true. So, if - // we're branching on zero, we need to invert the condition. - let cond = match br_opcode { - Opcode::Brz => cmp_cond.inverse(), - Opcode::Brnz => cmp_cond, - _ => return, - }; - - let new_opcode = match cond { - IntCC::Equal => Opcode::Brz, - IntCC::NotEqual => Opcode::Brnz, - _ => return, - }; - - BranchOptInfo { - br_inst: inst, - cmp_arg, - args: br_args.clone(), - new_opcode, - } - } else { - return; - } - } else { - return; - }; - - info.args.as_mut_slice(&mut pos.func.dfg.value_lists)[0] = info.cmp_arg; - if let InstructionData::Branch { ref mut opcode, .. 
} = pos.func.dfg[info.br_inst] { - *opcode = info.new_opcode; - } else { - panic!(); - } -} - enum BranchOrderKind { BrzToBrnz(Value), BrnzToBrz(Value), @@ -944,15 +608,427 @@ fn branch_order(pos: &mut FuncCursor, cfg: &mut ControlFlowGraph, block: Block, cfg.recompute_block(pos.func, block); } +#[cfg(feature = "enable-peepmatic")] +mod simplify { + use super::*; + use crate::peepmatic::ValueOrInst; + + pub type PeepholeOptimizer<'a, 'b> = + peepmatic_runtime::optimizer::PeepholeOptimizer<'static, 'a, &'b dyn TargetIsa>; + + pub fn peephole_optimizer<'a, 'b>(isa: &'b dyn TargetIsa) -> PeepholeOptimizer<'a, 'b> { + crate::peepmatic::preopt(isa) + } + + pub fn apply_all<'a, 'b>( + optimizer: &mut PeepholeOptimizer<'a, 'b>, + pos: &mut FuncCursor<'a>, + inst: Inst, + _native_word_width: u32, + ) { + // After we apply one optimization, that might make another + // optimization applicable. Keep running the peephole optimizer + // until either: + // + // * No optimization applied, and therefore it doesn't make sense to + // try again, because no optimization will apply again. + // + // * Or when we replaced an instruction with an alias to an existing + // value, because we already ran the peephole optimizer over the + // aliased value's instruction in an early part of the traversal + // over the function. + while let Some(ValueOrInst::Inst(new_inst)) = + optimizer.apply_one(pos, ValueOrInst::Inst(inst)) + { + // We transplanted a new instruction into the current + // instruction, so the "new" instruction is actually the same + // one, just with different data. 
+ debug_assert_eq!(new_inst, inst); + } + debug_assert_eq!(pos.current_inst(), Some(inst)); + } +} + +#[cfg(not(feature = "enable-peepmatic"))] +mod simplify { + use super::*; + use crate::ir::{ + dfg::ValueDef, + immediates, + instructions::{Opcode, ValueList}, + types::{I16, I32, I8}, + }; + use std::marker::PhantomData; + + pub struct PeepholeOptimizer<'a, 'b> { + phantom: PhantomData<(&'a (), &'b ())>, + } + + pub fn peephole_optimizer<'a, 'b>(_: &dyn TargetIsa) -> PeepholeOptimizer<'a, 'b> { + PeepholeOptimizer { + phantom: PhantomData, + } + } + + pub fn apply_all<'a, 'b>( + _optimizer: &mut PeepholeOptimizer<'a, 'b>, + pos: &mut FuncCursor<'a>, + inst: Inst, + native_word_width: u32, + ) { + simplify(pos, inst, native_word_width); + branch_opt(pos, inst); + } + + #[inline] + fn resolve_imm64_value(dfg: &DataFlowGraph, value: Value) -> Option { + if let ValueDef::Result(candidate_inst, _) = dfg.value_def(value) { + if let InstructionData::UnaryImm { + opcode: Opcode::Iconst, + imm, + } = dfg[candidate_inst] + { + return Some(imm); + } + } + None + } + + /// Try to transform [(x << N) >> N] into a (un)signed-extending move. + /// Returns true if the final instruction has been converted to such a move. 
+ fn try_fold_extended_move( + pos: &mut FuncCursor, + inst: Inst, + opcode: Opcode, + arg: Value, + imm: immediates::Imm64, + ) -> bool { + if let ValueDef::Result(arg_inst, _) = pos.func.dfg.value_def(arg) { + if let InstructionData::BinaryImm { + opcode: Opcode::IshlImm, + arg: prev_arg, + imm: prev_imm, + } = &pos.func.dfg[arg_inst] + { + if imm != *prev_imm { + return false; + } + + let dest_ty = pos.func.dfg.ctrl_typevar(inst); + if dest_ty != pos.func.dfg.ctrl_typevar(arg_inst) || !dest_ty.is_int() { + return false; + } + + let imm_bits: i64 = imm.into(); + let ireduce_ty = match (dest_ty.lane_bits() as i64).wrapping_sub(imm_bits) { + 8 => I8, + 16 => I16, + 32 => I32, + _ => return false, + }; + let ireduce_ty = ireduce_ty.by(dest_ty.lane_count()).unwrap(); + + // This becomes a no-op, since ireduce_ty has a smaller lane width than + // the argument type (also the destination type). + let arg = *prev_arg; + let narrower_arg = pos.ins().ireduce(ireduce_ty, arg); + + if opcode == Opcode::UshrImm { + pos.func.dfg.replace(inst).uextend(dest_ty, narrower_arg); + } else { + pos.func.dfg.replace(inst).sextend(dest_ty, narrower_arg); + } + return true; + } + } + false + } + + /// Apply basic simplifications. + /// + /// This folds constants with arithmetic to form `_imm` instructions, and other minor + /// simplifications. + /// + /// Doesn't apply some simplifications if the native word width (in bytes) is smaller than the + /// controlling type's width of the instruction. This would result in an illegal instruction that + /// would likely be expanded back into an instruction on smaller types with the same initial + /// opcode, creating unnecessary churn. 
+ fn simplify(pos: &mut FuncCursor, inst: Inst, native_word_width: u32) { + match pos.func.dfg[inst] { + InstructionData::Binary { opcode, args } => { + if let Some(mut imm) = resolve_imm64_value(&pos.func.dfg, args[1]) { + let new_opcode = match opcode { + Opcode::Iadd => Opcode::IaddImm, + Opcode::Imul => Opcode::ImulImm, + Opcode::Sdiv => Opcode::SdivImm, + Opcode::Udiv => Opcode::UdivImm, + Opcode::Srem => Opcode::SremImm, + Opcode::Urem => Opcode::UremImm, + Opcode::Band => Opcode::BandImm, + Opcode::Bor => Opcode::BorImm, + Opcode::Bxor => Opcode::BxorImm, + Opcode::Rotl => Opcode::RotlImm, + Opcode::Rotr => Opcode::RotrImm, + Opcode::Ishl => Opcode::IshlImm, + Opcode::Ushr => Opcode::UshrImm, + Opcode::Sshr => Opcode::SshrImm, + Opcode::Isub => { + imm = imm.wrapping_neg(); + Opcode::IaddImm + } + Opcode::Ifcmp => Opcode::IfcmpImm, + _ => return, + }; + let ty = pos.func.dfg.ctrl_typevar(inst); + if ty.bytes() <= native_word_width { + pos.func + .dfg + .replace(inst) + .BinaryImm(new_opcode, ty, imm, args[0]); + + // Repeat for BinaryImm simplification. + simplify(pos, inst, native_word_width); + } + } else if let Some(imm) = resolve_imm64_value(&pos.func.dfg, args[0]) { + let new_opcode = match opcode { + Opcode::Iadd => Opcode::IaddImm, + Opcode::Imul => Opcode::ImulImm, + Opcode::Band => Opcode::BandImm, + Opcode::Bor => Opcode::BorImm, + Opcode::Bxor => Opcode::BxorImm, + Opcode::Isub => Opcode::IrsubImm, + _ => return, + }; + let ty = pos.func.dfg.ctrl_typevar(inst); + if ty.bytes() <= native_word_width { + pos.func + .dfg + .replace(inst) + .BinaryImm(new_opcode, ty, imm, args[1]); + } + } + } + + InstructionData::Unary { opcode, arg } => { + if let Opcode::AdjustSpDown = opcode { + if let Some(imm) = resolve_imm64_value(&pos.func.dfg, arg) { + // Note this works for both positive and negative immediate values. 
+ pos.func.dfg.replace(inst).adjust_sp_down_imm(imm); + } + } + } + + InstructionData::BinaryImm { opcode, arg, imm } => { + let ty = pos.func.dfg.ctrl_typevar(inst); + + let mut arg = arg; + let mut imm = imm; + match opcode { + Opcode::IaddImm + | Opcode::ImulImm + | Opcode::BorImm + | Opcode::BandImm + | Opcode::BxorImm => { + // Fold binary_op(C2, binary_op(C1, x)) into binary_op(binary_op(C1, C2), x) + if let ValueDef::Result(arg_inst, _) = pos.func.dfg.value_def(arg) { + if let InstructionData::BinaryImm { + opcode: prev_opcode, + arg: prev_arg, + imm: prev_imm, + } = &pos.func.dfg[arg_inst] + { + if opcode == *prev_opcode + && ty == pos.func.dfg.ctrl_typevar(arg_inst) + { + let lhs: i64 = imm.into(); + let rhs: i64 = (*prev_imm).into(); + let new_imm = match opcode { + Opcode::BorImm => lhs | rhs, + Opcode::BandImm => lhs & rhs, + Opcode::BxorImm => lhs ^ rhs, + Opcode::IaddImm => lhs.wrapping_add(rhs), + Opcode::ImulImm => lhs.wrapping_mul(rhs), + _ => panic!("can't happen"), + }; + let new_imm = immediates::Imm64::from(new_imm); + let new_arg = *prev_arg; + pos.func + .dfg + .replace(inst) + .BinaryImm(opcode, ty, new_imm, new_arg); + imm = new_imm; + arg = new_arg; + } + } + } + } + + Opcode::UshrImm | Opcode::SshrImm => { + if pos.func.dfg.ctrl_typevar(inst).bytes() <= native_word_width + && try_fold_extended_move(pos, inst, opcode, arg, imm) + { + return; + } + } + + _ => {} + }; + + // Replace operations that are no-ops. + match (opcode, imm.into()) { + (Opcode::IaddImm, 0) + | (Opcode::ImulImm, 1) + | (Opcode::SdivImm, 1) + | (Opcode::UdivImm, 1) + | (Opcode::BorImm, 0) + | (Opcode::BandImm, -1) + | (Opcode::BxorImm, 0) + | (Opcode::RotlImm, 0) + | (Opcode::RotrImm, 0) + | (Opcode::IshlImm, 0) + | (Opcode::UshrImm, 0) + | (Opcode::SshrImm, 0) => { + // Alias the result value with the original argument. + replace_single_result_with_alias(&mut pos.func.dfg, inst, arg); + } + (Opcode::ImulImm, 0) | (Opcode::BandImm, 0) => { + // Replace by zero. 
+ pos.func.dfg.replace(inst).iconst(ty, 0); + } + (Opcode::BorImm, -1) => { + // Replace by minus one. + pos.func.dfg.replace(inst).iconst(ty, -1); + } + _ => {} + } + } + + InstructionData::IntCompare { opcode, cond, args } => { + debug_assert_eq!(opcode, Opcode::Icmp); + if let Some(imm) = resolve_imm64_value(&pos.func.dfg, args[1]) { + if pos.func.dfg.ctrl_typevar(inst).bytes() <= native_word_width { + pos.func.dfg.replace(inst).icmp_imm(cond, args[0], imm); + } + } + } + + InstructionData::CondTrap { .. } + | InstructionData::Branch { .. } + | InstructionData::Ternary { + opcode: Opcode::Select, + .. + } => { + // Fold away a redundant `bint`. + let condition_def = { + let args = pos.func.dfg.inst_args(inst); + pos.func.dfg.value_def(args[0]) + }; + if let ValueDef::Result(def_inst, _) = condition_def { + if let InstructionData::Unary { + opcode: Opcode::Bint, + arg: bool_val, + } = pos.func.dfg[def_inst] + { + let args = pos.func.dfg.inst_args_mut(inst); + args[0] = bool_val; + } + } + } + + _ => {} + } + } + + struct BranchOptInfo { + br_inst: Inst, + cmp_arg: Value, + args: ValueList, + new_opcode: Opcode, + } + + /// Fold comparisons into branch operations when possible. + /// + /// This matches against operations which compare against zero, then use the + /// result in a `brz` or `brnz` branch. It folds those two operations into a + /// single `brz` or `brnz`. + fn branch_opt(pos: &mut FuncCursor, inst: Inst) { + let mut info = if let InstructionData::Branch { + opcode: br_opcode, + args: ref br_args, + .. 
+ } = pos.func.dfg[inst] + { + let first_arg = { + let args = pos.func.dfg.inst_args(inst); + args[0] + }; + + let icmp_inst = + if let ValueDef::Result(icmp_inst, _) = pos.func.dfg.value_def(first_arg) { + icmp_inst + } else { + return; + }; + + if let InstructionData::IntCompareImm { + opcode: Opcode::IcmpImm, + arg: cmp_arg, + cond: cmp_cond, + imm: cmp_imm, + } = pos.func.dfg[icmp_inst] + { + let cmp_imm: i64 = cmp_imm.into(); + if cmp_imm != 0 { + return; + } + + // icmp_imm returns non-zero when the comparison is true. So, if + // we're branching on zero, we need to invert the condition. + let cond = match br_opcode { + Opcode::Brz => cmp_cond.inverse(), + Opcode::Brnz => cmp_cond, + _ => return, + }; + + let new_opcode = match cond { + IntCC::Equal => Opcode::Brz, + IntCC::NotEqual => Opcode::Brnz, + _ => return, + }; + + BranchOptInfo { + br_inst: inst, + cmp_arg, + args: br_args.clone(), + new_opcode, + } + } else { + return; + } + } else { + return; + }; + + info.args.as_mut_slice(&mut pos.func.dfg.value_lists)[0] = info.cmp_arg; + if let InstructionData::Branch { ref mut opcode, .. } = pos.func.dfg[info.br_inst] { + *opcode = info.new_opcode; + } else { + panic!(); + } + } +} + /// The main pre-opt pass. pub fn do_preopt(func: &mut Function, cfg: &mut ControlFlowGraph, isa: &dyn TargetIsa) { let _tt = timing::preopt(); + let mut pos = FuncCursor::new(func); - let native_word_width = isa.pointer_bytes(); + let native_word_width = isa.pointer_bytes() as u32; + let mut optimizer = simplify::peephole_optimizer(isa); + while let Some(block) = pos.next_block() { while let Some(inst) = pos.next_inst() { - // Apply basic simplifications. - simplify(&mut pos, inst, native_word_width as u32); + simplify::apply_all(&mut optimizer, &mut pos, inst, native_word_width); // Try to transform divide-by-constant into simpler operations. 
if let Some(divrem_info) = get_div_info(inst, &pos.func.dfg) { @@ -960,7 +1036,6 @@ pub fn do_preopt(func: &mut Function, cfg: &mut ControlFlowGraph, isa: &dyn Targ continue; } - branch_opt(&mut pos, inst); branch_order(&mut pos, cfg, block, inst); } } diff --git a/cranelift/filetests/Cargo.toml b/cranelift/filetests/Cargo.toml index 481401cf8a..705c31fc61 100644 --- a/cranelift/filetests/Cargo.toml +++ b/cranelift/filetests/Cargo.toml @@ -26,3 +26,6 @@ num_cpus = "1.8.0" region = "2.1.2" target-lexicon = "0.10" thiserror = "1.0.15" + +[features] +enable-peepmatic = [] diff --git a/cranelift/filetests/filetests/isa/x86/isub_imm-i8.clif b/cranelift/filetests/filetests/isa/x86/isub_imm-i8.clif index 018ac95fbc..dcf6c77e9a 100644 --- a/cranelift/filetests/filetests/isa/x86/isub_imm-i8.clif +++ b/cranelift/filetests/filetests/isa/x86/isub_imm-i8.clif @@ -6,9 +6,9 @@ function u0:0(i8) -> i8 fast { block0(v0: i8): v1 = iconst.i8 0 v2 = isub v1, v0 - ; check: v3 = uextend.i32 v0 - ; nextln: v5 = iconst.i32 0 - ; nextln = isub v5, v3 - ; nextln = ireduce.i8 v4 + ; check: uextend.i32 + ; nextln: iconst.i32 + ; nextln: isub + ; nextln: ireduce.i8 return v2 } diff --git a/cranelift/filetests/filetests/peepmatic/branch.clif b/cranelift/filetests/filetests/peepmatic/branch.clif new file mode 100644 index 0000000000..0f68bbe9cb --- /dev/null +++ b/cranelift/filetests/filetests/peepmatic/branch.clif @@ -0,0 +1,81 @@ +test peepmatic +target x86_64 + +function %icmp_to_brz_fold(i32) -> i32 { +block0(v0: i32): + v1 = icmp_imm eq v0, 0 + brnz v1, block1 + jump block2 +block1: + v3 = iconst.i32 1 + return v3 +block2: + v4 = iconst.i32 2 + return v4 +} +; sameln: function %icmp_to_brz_fold +; nextln: block0(v0: i32): +; nextln: v1 = icmp_imm eq v0, 0 +; nextln: brnz v0, block2 +; nextln: jump block1 +; nextln: +; nextln: block1: +; nextln: v3 = iconst.i32 1 +; nextln: return v3 +; nextln: +; nextln: block2: +; nextln: v4 = iconst.i32 2 +; nextln: return v4 +; nextln: } + +function 
%icmp_to_brz_inverted_fold(i32) -> i32 { +block0(v0: i32): + v1 = icmp_imm ne v0, 0 + brz v1, block1 + jump block2 +block1: + v3 = iconst.i32 1 + return v3 +block2: + v4 = iconst.i32 2 + return v4 +} +; sameln: function %icmp_to_brz_inve +; nextln: block0(v0: i32): +; nextln: v1 = icmp_imm ne v0, 0 +; nextln: brnz v0, block2 +; nextln: jump block1 +; nextln: +; nextln: block1: +; nextln: v3 = iconst.i32 1 +; nextln: return v3 +; nextln: +; nextln: block2: +; nextln: v4 = iconst.i32 2 +; nextln: return v4 +; nextln: } + +function %br_icmp_inversion(i32, i32) -> i32 { +block0(v0: i32, v1: i32): + br_icmp ugt v0, v1, block1 + jump block2 +block1: + v2 = iconst.i32 1 + return v2 +block2: + v3 = iconst.i32 2 + return v3 +} +; sameln: function %br_icmp_inversio +; nextln: block0(v0: i32, v1: i32): +; nextln: br_icmp ule v0, v1, block2 +; nextln: jump block1 +; nextln: +; nextln: block1: +; nextln: v2 = iconst.i32 1 +; nextln: return v2 +; nextln: +; nextln: block2: +; nextln: v3 = iconst.i32 2 +; nextln: return v3 +; nextln: } diff --git a/cranelift/filetests/filetests/peepmatic/div_by_const_indirect.clif b/cranelift/filetests/filetests/peepmatic/div_by_const_indirect.clif new file mode 100644 index 0000000000..ba65b2418c --- /dev/null +++ b/cranelift/filetests/filetests/peepmatic/div_by_const_indirect.clif @@ -0,0 +1,55 @@ +test peepmatic +target x86_64 baseline + +; Cases where the denominator is created by an iconst + +function %indir_udiv32(i32) -> i32 { +block0(v0: i32): + v1 = iconst.i32 7 + v2 = udiv v0, v1 + ; check: v4 = iconst.i32 0x2492_4925 + ; nextln: v5 = umulhi v0, v4 + ; nextln: v6 = isub v0, v5 + ; nextln: v7 = ushr_imm v6, 1 + ; nextln: v8 = iadd v7, v5 + ; nextln: v9 = ushr_imm v8, 2 + ; nextln: v2 -> v9 + return v2 +} + +function %indir_sdiv32(i32) -> i32 { +block0(v0: i32): + v1 = iconst.i32 -17 + v2 = sdiv v0, v1 + ; check: v4 = iconst.i32 0xffff_ffff_8787_8787 + ; nextln: v5 = smulhi v0, v4 + ; nextln: v6 = sshr_imm v5, 3 + ; nextln: v7 = ushr_imm 
v6, 31 + ; nextln: v8 = iadd v6, v7 + ; nextln: v2 -> v8 + return v2 +} + +function %indir_udiv64(i64) -> i64 { +block0(v0: i64): + v1 = iconst.i64 1337 + v2 = udiv v0, v1 + ; check: v4 = iconst.i64 0xc411_9d95_2866_a139 + ; nextln: v5 = umulhi v0, v4 + ; nextln: v6 = ushr_imm v5, 10 + ; nextln: v2 -> v6 + return v2 +} + +function %indir_sdiv64(i64) -> i64 { +block0(v0: i64): + v1 = iconst.i64 -90210 + v2 = sdiv v0, v1 + ; check: v4 = iconst.i64 0xd181_4ee8_939c_b8bb + ; nextln: v5 = smulhi v0, v4 + ; nextln: v6 = sshr_imm v5, 14 + ; nextln: v7 = ushr_imm v6, 63 + ; nextln: v8 = iadd v6, v7 + ; nextln: v2 -> v8 + return v2 +} diff --git a/cranelift/filetests/filetests/peepmatic/div_by_const_non_power_of_2.clif b/cranelift/filetests/filetests/peepmatic/div_by_const_non_power_of_2.clif new file mode 100644 index 0000000000..0759f92ca9 --- /dev/null +++ b/cranelift/filetests/filetests/peepmatic/div_by_const_non_power_of_2.clif @@ -0,0 +1,266 @@ +test peepmatic +target i686 baseline + +; -------- U32 -------- + +; complex case (mul, sub, shift, add, shift) +function %t_udiv32_p7(i32) -> i32 { +block0(v0: i32): + v1 = udiv_imm v0, 7 + ; check: iconst.i32 0x2492_4925 + ; check: umulhi v0, v2 + ; check: isub v0, v3 + ; check: ushr_imm v4, 1 + ; check: iadd v5, v3 + ; check: v7 = ushr_imm v6, 2 + ; check: v1 -> v7 + return v1 +} + +; simple case (mul, shift) +function %t_udiv32_p125(i32) -> i32 { +block0(v0: i32): + v1 = udiv_imm v0, 125 + ; check: iconst.i32 0x1062_4dd3 + ; check: umulhi v0, v2 + ; check: v4 = ushr_imm v3, 3 + ; check: v1 -> v4 + return v1 +} + +; simple case w/ shift by zero (mul) +function %t_udiv32_p641(i32) -> i32 { +block0(v0: i32): + v1 = udiv_imm v0, 641 + ; check: iconst.i32 0x0066_3d81 + ; check: v3 = umulhi v0, v2 + ; check: v1 -> v3 + return v1 +} + + +; -------- S32 -------- + +; simple case w/ shift by zero (mul, add-sign-bit) +function %t_sdiv32_n6(i32) -> i32 { +block0(v0: i32): + v1 = sdiv_imm v0, -6 + ; check: iconst.i32 
0xffff_ffff_d555_5555
+ ; check: smulhi v0, v2
+ ; check: ushr_imm v3, 31
+ ; check: v5 = iadd v3, v4
+ ; check: v1 -> v5
+ return v1
+}
+
+; simple case (mul, shift, add-sign-bit)
+function %t_sdiv32_n5(i32) -> i32 {
+block0(v0: i32):
+ v1 = sdiv_imm v0, -5
+ ; check: iconst.i32 0xffff_ffff_9999_9999
+ ; check: smulhi v0, v2
+ ; check: sshr_imm v3, 1
+ ; check: ushr_imm v4, 31
+ ; check: v6 = iadd v4, v5
+ ; check: v1 -> v6
+ return v1
+}
+
+; case d < 0 && M > 0 (mul, sub, shift, add-sign-bit)
+function %t_sdiv32_n3(i32) -> i32 {
+block0(v0: i32):
+ v1 = sdiv_imm v0, -3
+ ; check: iconst.i32 0x5555_5555
+ ; check: smulhi v0, v2
+ ; check: isub v3, v0
+ ; check: sshr_imm v4, 1
+ ; check: ushr_imm v5, 31
+ ; check: v7 = iadd v5, v6
+ ; check: v1 -> v7
+ return v1
+}
+
+; simple case w/ shift by zero (mul, add-sign-bit)
+function %t_sdiv32_p6(i32) -> i32 {
+block0(v0: i32):
+ v1 = sdiv_imm v0, 6
+ ; check: iconst.i32 0x2aaa_aaab
+ ; check: smulhi v0, v2
+ ; check: ushr_imm v3, 31
+ ; check: v5 = iadd v3, v4
+ ; check: v1 -> v5
+ return v1
+}
+
+; case d > 0 && M < 0 (mul, add, shift, add-sign-bit)
+function %t_sdiv32_p7(i32) -> i32 {
+block0(v0: i32):
+ v1 = sdiv_imm v0, 7
+ ; check: iconst.i32 0xffff_ffff_9249_2493
+ ; check: smulhi v0, v2
+ ; check: iadd v3, v0
+ ; check: sshr_imm v4, 2
+ ; check: ushr_imm v5, 31
+ ; check: v7 = iadd v5, v6
+ ; check: v1 -> v7
+ return v1
+}
+
+; simple case (mul, shift, add-sign-bit)
+function %t_sdiv32_p625(i32) -> i32 {
+block0(v0: i32):
+ v1 = sdiv_imm v0, 625
+ ; check: iconst.i32 0x68db_8bad
+ ; check: smulhi v0, v2
+ ; check: sshr_imm v3, 8
+ ; check: ushr_imm v4, 31
+ ; check: v6 = iadd v4, v5
+ ; check: v1 -> v6
+ return v1
+}
+
+
+; -------- U64 --------
+
+; complex case (mul, sub, shift, add, shift)
+function %t_udiv64_p7(i64) -> i64 {
+block0(v0: i64):
+ v1 = udiv_imm v0, 7
+ ; check: iconst.i64 0x2492_4924_9249_2493
+ ; check: umulhi v0, v2
+ ; check: isub v0, v3
+ ; check: ushr_imm v4, 1
+ ; check: iadd v5, v3
+ ; 
check: v7 = ushr_imm v6, 2 + ; check: v1 -> v7 + return v1 +} + +; simple case (mul, shift) +function %t_udiv64_p9(i64) -> i64 { +block0(v0: i64): + v1 = udiv_imm v0, 9 + ; check: iconst.i64 0xe38e_38e3_8e38_e38f + ; check: umulhi v0, v2 + ; check: v4 = ushr_imm v3, 3 + ; check: v1 -> v4 + return v1 +} + +; complex case (mul, sub, shift, add, shift) +function %t_udiv64_p125(i64) -> i64 { +block0(v0: i64): + v1 = udiv_imm v0, 125 + ; check: iconst.i64 0x0624_dd2f_1a9f_be77 + ; check: umulhi v0, v2 + ; check: isub v0, v3 + ; check: ushr_imm v4, 1 + ; check: iadd v5, v3 + ; check: v7 = ushr_imm v6, 6 + ; check: v1 -> v7 + return v1 +} + +; simple case w/ shift by zero (mul) +function %t_udiv64_p274177(i64) -> i64 { +block0(v0: i64): + v1 = udiv_imm v0, 274177 + ; check: iconst.i64 0x3d30_f19c_d101 + ; check: v3 = umulhi v0, v2 + ; check: v1 -> v3 + return v1 +} + + +; -------- S64 -------- + +; simple case (mul, shift, add-sign-bit) +function %t_sdiv64_n625(i64) -> i64 { +block0(v0: i64): + v1 = sdiv_imm v0, -625 + ; check: iconst.i64 0xcb92_3a29_c779_a6b5 + ; check: smulhi v0, v2 + ; check: sshr_imm v3, 7 + ; check: ushr_imm v4, 63 + ; check: v6 = iadd v4, v5 + ; check: v1 -> v6 + return v1 +} + +; simple case w/ zero shift (mul, add-sign-bit) +function %t_sdiv64_n6(i64) -> i64 { +block0(v0: i64): + v1 = sdiv_imm v0, -6 + ; check: iconst.i64 0xd555_5555_5555_5555 + ; check: smulhi v0, v2 + ; check: ushr_imm v3, 63 + ; check: v5 = iadd v3, v4 + ; check: v1 -> v5 + return v1 +} + +; simple case w/ zero shift (mul, add-sign-bit) +function %t_sdiv64_n5(i64) -> i64 { +block0(v0: i64): + v1 = sdiv_imm v0, -5 + ; check: iconst.i64 0x9999_9999_9999_9999 + ; check: smulhi v0, v2 + ; check: sshr_imm v3, 1 + ; check: ushr_imm v4, 63 + ; check: v6 = iadd v4, v5 + ; check: v1 -> v6 + return v1 +} + +; case d < 0 && M > 0 (mul, sub, shift, add-sign-bit) +function %t_sdiv64_n3(i64) -> i64 { +block0(v0: i64): + v1 = sdiv_imm v0, -3 + ; check: iconst.i64 0x5555_5555_5555_5555 + ; 
check: smulhi v0, v2 + ; check: isub v3, v0 + ; check: sshr_imm v4, 1 + ; check: ushr_imm v5, 63 + ; check: v7 = iadd v5, v6 + ; check: v1 -> v7 + return v1 +} + +; simple case w/ zero shift (mul, add-sign-bit) +function %t_sdiv64_p6(i64) -> i64 { +block0(v0: i64): + v1 = sdiv_imm v0, 6 + ; check: iconst.i64 0x2aaa_aaaa_aaaa_aaab + ; check: smulhi v0, v2 + ; check: ushr_imm v3, 63 + ; check: v5 = iadd v3, v4 + ; check: v1 -> v5 + return v1 +} + +; case d > 0 && M < 0 (mul, add, shift, add-sign-bit) +function %t_sdiv64_p15(i64) -> i64 { +block0(v0: i64): + v1 = sdiv_imm v0, 15 + ; check: iconst.i64 0x8888_8888_8888_8889 + ; check: smulhi v0, v2 + ; check: iadd v3, v0 + ; check: sshr_imm v4, 3 + ; check: ushr_imm v5, 63 + ; check: v7 = iadd v5, v6 + ; check: v1 -> v7 + return v1 +} + +; simple case (mul, shift, add-sign-bit) +function %t_sdiv64_p625(i64) -> i64 { +block0(v0: i64): + v1 = sdiv_imm v0, 625 + ; check: iconst.i64 0x346d_c5d6_3886_594b + ; check: smulhi v0, v2 + ; check: sshr_imm v3, 7 + ; check: ushr_imm v4, 63 + ; check: v6 = iadd v4, v5 + ; check: v1 -> v6 + return v1 +} diff --git a/cranelift/filetests/filetests/peepmatic/div_by_const_power_of_2.clif b/cranelift/filetests/filetests/peepmatic/div_by_const_power_of_2.clif new file mode 100644 index 0000000000..a2110a5a75 --- /dev/null +++ b/cranelift/filetests/filetests/peepmatic/div_by_const_power_of_2.clif @@ -0,0 +1,292 @@ +test peepmatic +target i686 baseline + +; -------- U32 -------- + +; ignored +function %t_udiv32_p0(i32) -> i32 { +block0(v0: i32): + v1 = udiv_imm v0, 0 + ; check: udiv_imm v0, 0 + return v1 +} + +; converted to a nop +function %t_udiv32_p1(i32) -> i32 { +block0(v0: i32): + v1 = udiv_imm v0, 1 + ; check: nop + return v1 +} + +; shift +function %t_udiv32_p2(i32) -> i32 { +block0(v0: i32): + v1 = udiv_imm v0, 2 + ; check: ushr_imm v0, 1 + return v1 +} + +; shift +function %t_udiv32_p2p31(i32) -> i32 { +block0(v0: i32): + v1 = udiv_imm v0, 0x8000_0000 + ; check: ushr_imm v0, 31 + 
return v1 +} + + +; -------- U64 -------- + +; ignored +function %t_udiv64_p0(i64) -> i64 { +block0(v0: i64): + v1 = udiv_imm v0, 0 + ; check: udiv_imm v0, 0 + return v1 +} + +; converted to a nop +function %t_udiv64_p1(i64) -> i64 { +block0(v0: i64): + v1 = udiv_imm v0, 1 + ; check: nop + return v1 +} + +; shift +function %t_udiv64_p2(i64) -> i64 { +block0(v0: i64): + v1 = udiv_imm v0, 2 + ; check: ushr_imm v0, 1 + return v1 +} + +; shift +function %t_udiv64_p2p63(i64) -> i64 { +block0(v0: i64): + v1 = udiv_imm v0, 0x8000_0000_0000_0000 + ; check: ushr_imm v0, 63 + return v1 +} + + +; -------- S32 -------- + +; ignored +function %t_sdiv32_p0(i32) -> i32 { +block0(v0: i32): + v1 = sdiv_imm v0, 0 + ; check: sdiv_imm v0, 0 + return v1 +} + +; converted to a nop +function %t_sdiv32_p1(i32) -> i32 { +block0(v0: i32): + v1 = sdiv_imm v0, 1 + ; check: nop + return v1 +} + +; ignored +function %t_sdiv32_n1(i32) -> i32 { +block0(v0: i32): + v1 = sdiv_imm v0, -1 + ; check: sdiv_imm v0, -1 + return v1 +} + +; shift +function %t_sdiv32_p2(i32) -> i32 { +block0(v0: i32): + v1 = sdiv_imm v0, 2 + ; check: ushr_imm v0, 31 + ; check: iadd v0, v2 + ; check: sshr_imm v3, 1 + ; check: v1 -> v4 + return v1 +} + +; shift +function %t_sdiv32_n2(i32) -> i32 { +block0(v0: i32): + v1 = sdiv_imm v0, -2 + ; check: ushr_imm v0, 31 + ; check: iadd v0, v2 + ; check: sshr_imm v3, 1 + ; check: irsub_imm v4, 0 + return v1 +} + +; shift +function %t_sdiv32_p4(i32) -> i32 { +block0(v0: i32): + v1 = sdiv_imm v0, 4 + ; check: v2 = sshr_imm v0, 1 + ; check: ushr_imm v2, 30 + ; check: iadd v0, v3 + ; check: v5 = sshr_imm v4, 2 + ; check: v1 -> v5 + + return v1 +} + +; shift +function %t_sdiv32_n4(i32) -> i32 { +block0(v0: i32): + v1 = sdiv_imm v0, -4 + ; check: sshr_imm v0, 1 + ; check: ushr_imm v2, 30 + ; check: iadd v0, v3 + ; check: sshr_imm v4, 2 + ; check: irsub_imm v5, 0 + return v1 +} + +; shift +function %t_sdiv32_p2p30(i32) -> i32 { +block0(v0: i32): + v1 = sdiv_imm v0, 0x4000_0000 + ; check: 
sshr_imm v0, 29 + ; check: ushr_imm v2, 2 + ; check: iadd v0, v3 + ; check: v5 = sshr_imm v4, 30 + ; check: v1 -> v5 + return v1 +} + +; shift +function %t_sdiv32_n2p30(i32) -> i32 { +block0(v0: i32): + v1 = sdiv_imm v0, -0x4000_0000 + ; check: sshr_imm v0, 29 + ; check: ushr_imm v2, 2 + ; check: iadd v0, v3 + ; check: sshr_imm v4, 30 + ; check: irsub_imm v5, 0 + return v1 +} + +; there's no positive version of this, since -(-0x8000_0000) isn't +; representable. +function %t_sdiv32_n2p31(i32) -> i32 { +block0(v0: i32): + v1 = sdiv_imm v0, -0x8000_0000 + ; check: sshr_imm v0, 30 + ; check: ushr_imm v2, 1 + ; check: iadd v0, v3 + ; check: sshr_imm v4, 31 + ; check: irsub_imm v5, 0 + return v1 +} + + +; -------- S64 -------- + +; ignored +function %t_sdiv64_p0(i64) -> i64 { +block0(v0: i64): + v1 = sdiv_imm v0, 0 + ; check: sdiv_imm v0, 0 + return v1 +} + +; converted to a nop +function %t_sdiv64_p1(i64) -> i64 { +block0(v0: i64): + v1 = sdiv_imm v0, 1 + ; check: nop + return v1 +} + +; ignored +function %t_sdiv64_n1(i64) -> i64 { +block0(v0: i64): + v1 = sdiv_imm v0, -1 + ; check: sdiv_imm v0, -1 + return v1 +} + +; shift +function %t_sdiv64_p2(i64) -> i64 { +block0(v0: i64): + v1 = sdiv_imm v0, 2 + ; check: ushr_imm v0, 63 + ; check: iadd v0, v2 + ; check: v4 = sshr_imm v3, 1 + ; check: v1 -> v4 + return v1 +} + +; shift +function %t_sdiv64_n2(i64) -> i64 { +block0(v0: i64): + v1 = sdiv_imm v0, -2 + ; check: ushr_imm v0, 63 + ; check: iadd v0, v2 + ; check: sshr_imm v3, 1 + ; check: irsub_imm v4, 0 + return v1 +} + +; shift +function %t_sdiv64_p4(i64) -> i64 { +block0(v0: i64): + v1 = sdiv_imm v0, 4 + ; check: sshr_imm v0, 1 + ; check: ushr_imm v2, 62 + ; check: iadd v0, v3 + ; check: v5 = sshr_imm v4, 2 + ; check: v1 -> v5 + return v1 +} + +; shift +function %t_sdiv64_n4(i64) -> i64 { +block0(v0: i64): + v1 = sdiv_imm v0, -4 + ; check: sshr_imm v0, 1 + ; check: ushr_imm v2, 62 + ; check: iadd v0, v3 + ; check: sshr_imm v4, 2 + ; check: irsub_imm v5, 0 + return v1 
+} + +; shift +function %t_sdiv64_p2p62(i64) -> i64 { +block0(v0: i64): + v1 = sdiv_imm v0, 0x4000_0000_0000_0000 + ; check: sshr_imm v0, 61 + ; check: ushr_imm v2, 2 + ; check: iadd v0, v3 + ; check: v5 = sshr_imm v4, 62 + ; check: v1 -> v5 + return v1 +} + +; shift +function %t_sdiv64_n2p62(i64) -> i64 { +block0(v0: i64): + v1 = sdiv_imm v0, -0x4000_0000_0000_0000 + ; check: sshr_imm v0, 61 + ; check: ushr_imm v2, 2 + ; check: iadd v0, v3 + ; check: sshr_imm v4, 62 + ; check: irsub_imm v5, 0 + return v1 +} + +; there's no positive version of this, since -(-0x8000_0000_0000_0000) isn't +; representable. +function %t_sdiv64_n2p63(i64) -> i64 { +block0(v0: i64): + v1 = sdiv_imm v0, -0x8000_0000_0000_0000 + ; check: sshr_imm v0, 62 + ; check: ushr_imm v2, 1 + ; check: iadd v0, v3 + ; check: sshr_imm v4, 63 + ; check: irsub_imm v5, 0 + return v1 +} diff --git a/cranelift/filetests/filetests/peepmatic/do_not_keep_applying_optimizations_after_replacing_with_an_alias.clif b/cranelift/filetests/filetests/peepmatic/do_not_keep_applying_optimizations_after_replacing_with_an_alias.clif new file mode 100644 index 0000000000..cc24167267 --- /dev/null +++ b/cranelift/filetests/filetests/peepmatic/do_not_keep_applying_optimizations_after_replacing_with_an_alias.clif @@ -0,0 +1,14 @@ +test peepmatic +target x86_64 + +;; This file used to trigger assertions where we would keep trying to +;; unnecessarily apply optimizations after replacing an instruction with an +;; alias of another value that we had already optimized. 
+ +function %foo() { +block0: + v0 = iconst.i32 3 + v1 = srem_imm v0, 2 + v2 = sdiv_imm v1, 1 + trap unreachable +} diff --git a/cranelift/filetests/filetests/peepmatic/do_not_reorder_instructions_when_transplanting.clif b/cranelift/filetests/filetests/peepmatic/do_not_reorder_instructions_when_transplanting.clif new file mode 100644 index 0000000000..7fc95f0fdb --- /dev/null +++ b/cranelift/filetests/filetests/peepmatic/do_not_reorder_instructions_when_transplanting.clif @@ -0,0 +1,22 @@ +test peepmatic +target x86_64 + +;; Test that although v5 can be replaced with v1, we don't transplant `load.i32 +;; v0` on top of `iadd v3, v4`, because that would move the load past other uses +;; of its result. + +function %foo(i64) -> i32 { +block0(v0: i64): + v1 = load.i32 v0 + v2 = iconst.i32 16 + v3 = iadd_imm v1, -16 + v4 = iconst.i32 16 + v5 = iadd v3, v4 + ; check: v1 = load.i32 v0 + ; nextln: v5 -> v1 + ; nextln: v2 = iconst.i32 16 + ; nextln: v3 = iadd_imm v1, -16 + ; nextln: v4 = iconst.i32 16 + ; nextln: nop + return v5 +} diff --git a/cranelift/filetests/filetests/peepmatic/fold-extended-move-wraparound.clif b/cranelift/filetests/filetests/peepmatic/fold-extended-move-wraparound.clif new file mode 100644 index 0000000000..e48b91a4b1 --- /dev/null +++ b/cranelift/filetests/filetests/peepmatic/fold-extended-move-wraparound.clif @@ -0,0 +1,14 @@ +test peepmatic +target x86_64 + +function %wraparound(i64 vmctx) -> f32 system_v { + gv0 = vmctx + gv1 = iadd_imm.i64 gv0, 48 + +block35(v0: i64): + v88 = iconst.i64 0 + v89 = iconst.i64 0x8000_0000_0000_0000 + v90 = ishl_imm v88, 0x8000_0000_0000_0000 + v91 = sshr v90, v89; check: sshr_imm v90, 0x8000_0000_0000_0000 + trap user0 +} diff --git a/cranelift/filetests/filetests/peepmatic/rem_by_const_non_power_of_2.clif b/cranelift/filetests/filetests/peepmatic/rem_by_const_non_power_of_2.clif new file mode 100644 index 0000000000..7df5baf4e3 --- /dev/null +++ 
b/cranelift/filetests/filetests/peepmatic/rem_by_const_non_power_of_2.clif @@ -0,0 +1,285 @@ +test peepmatic +target i686 baseline + +; -------- U32 -------- + +; complex case (mul, sub, shift, add, shift) +function %t_urem32_p7(i32) -> i32 { +block0(v0: i32): + v1 = urem_imm v0, 7 + ; check: iconst.i32 0x2492_4925 + ; check: umulhi v0, v2 + ; check: isub v0, v3 + ; check: ushr_imm v4, 1 + ; check: iadd v5, v3 + ; check: ushr_imm v6, 2 + ; check: imul_imm v7, 7 + ; check: isub v0, v8 + return v1 +} + +; simple case (mul, shift) +function %t_urem32_p125(i32) -> i32 { +block0(v0: i32): + v1 = urem_imm v0, 125 + ; check: iconst.i32 0x1062_4dd3 + ; check: umulhi v0, v2 + ; check: ushr_imm v3, 3 + ; check: imul_imm v4, 125 + ; check: isub v0, v5 + return v1 +} + +; simple case w/ shift by zero (mul) +function %t_urem32_p641(i32) -> i32 { +block0(v0: i32): + v1 = urem_imm v0, 641 + ; check: iconst.i32 0x0066_3d81 + ; check: umulhi v0, v2 + ; check: imul_imm v3, 641 + ; check: isub v0, v4 + return v1 +} + + +; -------- S32 -------- + +; simple case w/ shift by zero (mul, add-sign-bit) +function %t_srem32_n6(i32) -> i32 { +block0(v0: i32): + v1 = srem_imm v0, -6 + ; check: iconst.i32 0xffff_ffff_d555_5555 + ; check: smulhi v0, v2 + ; check: ushr_imm v3, 31 + ; check: iadd v3, v4 + ; check: imul_imm v5, -6 + ; check: isub v0, v6 + return v1 +} + +; simple case (mul, shift, add-sign-bit) +function %t_srem32_n5(i32) -> i32 { +block0(v0: i32): + v1 = srem_imm v0, -5 + ; check: iconst.i32 0xffff_ffff_9999_9999 + ; check: smulhi v0, v2 + ; check: sshr_imm v3, 1 + ; check: ushr_imm v4, 31 + ; check: iadd v4, v5 + ; check: imul_imm v6, -5 + ; check: isub v0, v7 + return v1 +} + +; case d < 0 && M > 0 (mul, sub, shift, add-sign-bit) +function %t_srem32_n3(i32) -> i32 { +block0(v0: i32): + v1 = srem_imm v0, -3 + ; check: iconst.i32 0x5555_5555 + ; check: smulhi v0, v2 + ; check: isub v3, v0 + ; check: sshr_imm v4, 1 + ; check: ushr_imm v5, 31 + ; check: iadd v5, v6 + ; check: 
imul_imm v7, -3 + ; check: isub v0, v8 + return v1 +} + +; simple case w/ shift by zero (mul, add-sign-bit) +function %t_srem32_p6(i32) -> i32 { +block0(v0: i32): + v1 = srem_imm v0, 6 + ; check: iconst.i32 0x2aaa_aaab + ; check: smulhi v0, v2 + ; check: ushr_imm v3, 31 + ; check: iadd v3, v4 + ; check: imul_imm v5, 6 + ; check: isub v0, v6 + return v1 +} + +; case d > 0 && M < 0 (mull, add, shift, add-sign-bit) +function %t_srem32_p7(i32) -> i32 { +block0(v0: i32): + v1 = srem_imm v0, 7 + ; check: iconst.i32 0xffff_ffff_9249_2493 + ; check: smulhi v0, v2 + ; check: iadd v3, v0 + ; check: sshr_imm v4, 2 + ; check: ushr_imm v5, 31 + ; check: iadd v5, v6 + ; check: imul_imm v7, 7 + ; check: isub v0, v8 + return v1 +} + +; simple case (mul, shift, add-sign-bit) +function %t_srem32_p625(i32) -> i32 { +block0(v0: i32): + v1 = srem_imm v0, 625 + ; check: iconst.i32 0x68db_8bad + ; check: smulhi v0, v2 + ; check: sshr_imm v3, 8 + ; check: ushr_imm v4, 31 + ; check: iadd v4, v5 + ; check: imul_imm v6, 625 + ; check: isub v0, v7 + return v1 +} + + +; -------- U64 -------- + +; complex case (mul, sub, shift, add, shift) +function %t_urem64_p7(i64) -> i64 { +block0(v0: i64): + v1 = urem_imm v0, 7 + ; check: umulhi v0, v2 + ; check: isub v0, v3 + ; check: ushr_imm v4, 1 + ; check: iadd v5, v3 + ; check: ushr_imm v6, 2 + ; check: imul_imm v7, 7 + ; check: isub v0, v8 + return v1 +} + +; simple case (mul, shift) +function %t_urem64_p9(i64) -> i64 { +block0(v0: i64): + v1 = urem_imm v0, 9 + ; check: iconst.i64 0xe38e_38e3_8e38_e38f + ; check: umulhi v0, v2 + ; check: ushr_imm v3, 3 + ; check: imul_imm v4, 9 + ; check: isub v0, v5 + return v1 +} + +; complex case (mul, sub, shift, add, shift) +function %t_urem64_p125(i64) -> i64 { +block0(v0: i64): + v1 = urem_imm v0, 125 + ; check: iconst.i64 0x0624_dd2f_1a9f_be77 + ; check: umulhi v0, v2 + ; check: isub v0, v3 + ; check: ushr_imm v4, 1 + ; check: iadd v5, v3 + ; check: ushr_imm v6, 6 + ; check: imul_imm v7, 125 + ; check: isub 
v0, v8 + return v1 +} + +; simple case w/ shift by zero (mul) +function %t_urem64_p274177(i64) -> i64 { +block0(v0: i64): + v1 = urem_imm v0, 274177 + ; check: iconst.i64 0x3d30_f19c_d101 + ; check: umulhi v0, v2 + ; check: imul_imm v3, 0x0004_2f01 + ; check: isub v0, v4 + return v1 +} + + +; -------- S64 -------- + +; simple case (mul, shift, add-sign-bit) +function %t_srem64_n625(i64) -> i64 { +block0(v0: i64): + v1 = srem_imm v0, -625 + ; check: iconst.i64 0xcb92_3a29_c779_a6b5 + ; check: smulhi v0, v2 + ; check: sshr_imm v3, 7 + ; check: ushr_imm v4, 63 + ; check: iadd v4, v5 + ; check: imul_imm v6, -625 + ; check: isub v0, v7 + return v1 +} + +; simple case w/ zero shift (mul, add-sign-bit) +function %t_srem64_n6(i64) -> i64 { +block0(v0: i64): + v1 = srem_imm v0, -6 + ; check: iconst.i64 0xd555_5555_5555_5555 + ; check: smulhi v0, v2 + ; check: ushr_imm v3, 63 + ; check: iadd v3, v4 + ; check: imul_imm v5, -6 + ; check: isub v0, v6 + return v1 +} + +; simple case w/ zero shift (mul, add-sign-bit) +function %t_srem64_n5(i64) -> i64 { +block0(v0: i64): + v1 = srem_imm v0, -5 + ; check: iconst.i64 0x9999_9999_9999_9999 + ; check: smulhi v0, v2 + ; check: sshr_imm v3, 1 + ; check: ushr_imm v4, 63 + ; check: iadd v4, v5 + ; check: imul_imm v6, -5 + ; check: isub v0, v7 + return v1 +} + +; case d < 0 && M > 0 (mul, sub, shift, add-sign-bit) +function %t_srem64_n3(i64) -> i64 { +block0(v0: i64): + v1 = srem_imm v0, -3 + ; check: iconst.i64 0x5555_5555_5555_5555 + ; check: smulhi v0, v2 + ; check: isub v3, v0 + ; check: sshr_imm v4, 1 + ; check: ushr_imm v5, 63 + ; check: iadd v5, v6 + ; check: imul_imm v7, -3 + ; check: isub v0, v8 + return v1 +} + +; simple case w/ zero shift (mul, add-sign-bit) +function %t_srem64_p6(i64) -> i64 { +block0(v0: i64): + v1 = srem_imm v0, 6 + ; check: iconst.i64 0x2aaa_aaaa_aaaa_aaab + ; check: smulhi v0, v2 + ; check: ushr_imm v3, 63 + ; check: iadd v3, v4 + ; check: imul_imm v5, 6 + ; check: isub v0, v6 + return v1 +} + +; case d > 
0 && M < 0 (mul, add, shift, add-sign-bit) +function %t_srem64_p15(i64) -> i64 { +block0(v0: i64): + v1 = srem_imm v0, 15 + ; check: iconst.i64 0x8888_8888_8888_8889 + ; check: smulhi v0, v2 + ; check: iadd v3, v0 + ; check: sshr_imm v4, 3 + ; check: ushr_imm v5, 63 + ; check: iadd v5, v6 + ; check: imul_imm v7, 15 + ; check: isub v0, v8 + return v1 +} + +; simple case (mul, shift, add-sign-bit) +function %t_srem64_p625(i64) -> i64 { +block0(v0: i64): + v1 = srem_imm v0, 625 + ; check: iconst.i64 0x346d_c5d6_3886_594b + ; check: smulhi v0, v2 + ; check: sshr_imm v3, 7 + ; check: ushr_imm v4, 63 + ; check: iadd v4, v5 + ; check: imul_imm v6, 625 + ; check: isub v0, v7 + return v1 +} diff --git a/cranelift/filetests/filetests/peepmatic/rem_by_const_power_of_2.clif b/cranelift/filetests/filetests/peepmatic/rem_by_const_power_of_2.clif new file mode 100644 index 0000000000..c795b73c19 --- /dev/null +++ b/cranelift/filetests/filetests/peepmatic/rem_by_const_power_of_2.clif @@ -0,0 +1,291 @@ +test peepmatic +target i686 baseline + +; -------- U32 -------- + +; ignored +function %t_urem32_p0(i32) -> i32 { +block0(v0: i32): + v1 = urem_imm v0, 0 + ; check: urem_imm v0, 0 + return v1 +} + +; converted to constant zero +function %t_urem32_p1(i32) -> i32 { +block0(v0: i32): + v1 = urem_imm v0, 1 + ; check: iconst.i32 0 + return v1 +} + +; shift +function %t_urem32_p2(i32) -> i32 { +block0(v0: i32): + v1 = urem_imm v0, 2 + ; check: band_imm v0, 1 + return v1 +} + +; shift +function %t_urem32_p2p31(i32) -> i32 { +block0(v0: i32): + v1 = urem_imm v0, 0x8000_0000 + ; check: band_imm v0, 0x7fff_ffff + return v1 +} + + +; -------- U64 -------- + +; ignored +function %t_urem64_p0(i64) -> i64 { +block0(v0: i64): + v1 = urem_imm v0, 0 + ; check: urem_imm v0, 0 + return v1 +} + +; converted to constant zero +function %t_urem64_p1(i64) -> i64 { +block0(v0: i64): + v1 = urem_imm v0, 1 + ; check: iconst.i64 0 + return v1 +} + +; shift +function %t_urem64_p2(i64) -> i64 { +block0(v0: i64): 
+ v1 = urem_imm v0, 2 + ; check: band_imm v0, 1 + return v1 +} + +; shift +function %t_urem64_p2p63(i64) -> i64 { +block0(v0: i64): + v1 = urem_imm v0, 0x8000_0000_0000_0000 + ; check: band_imm v0, 0x7fff_ffff_ffff_ffff + return v1 +} + + +; -------- S32 -------- + +; ignored +function %t_srem32_n1(i32) -> i32 { +block0(v0: i32): + v1 = srem_imm v0, -1 + ; check: srem_imm v0, -1 + return v1 +} + +; ignored +function %t_srem32_p0(i32) -> i32 { +block0(v0: i32): + v1 = srem_imm v0, 0 + ; check: srem_imm v0, 0 + return v1 +} + +; converted to constant zero +function %t_srem32_p1(i32) -> i32 { +block0(v0: i32): + v1 = srem_imm v0, 1 + ; check: iconst.i32 0 + return v1 +} + +; shift +function %t_srem32_p2(i32) -> i32 { +block0(v0: i32): + v1 = srem_imm v0, 2 + ; check: ushr_imm v0, 31 + ; check: iadd v0, v2 + ; check: band_imm v3, -2 + ; check: isub v0, v4 + return v1 +} + +; shift +function %t_srem32_n2(i32) -> i32 { +block0(v0: i32): + v1 = srem_imm v0, -2 + ; check: ushr_imm v0, 31 + ; check: iadd v0, v2 + ; check: band_imm v3, -2 + ; check: isub v0, v4 + return v1 +} + +; shift +function %t_srem32_p4(i32) -> i32 { +block0(v0: i32): + v1 = srem_imm v0, 4 + ; check: sshr_imm v0, 1 + ; check: ushr_imm v2, 30 + ; check: iadd v0, v3 + ; check: band_imm v4, -4 + ; check: isub v0, v5 + return v1 +} + +; shift +function %t_srem32_n4(i32) -> i32 { +block0(v0: i32): + v1 = srem_imm v0, -4 + ; check: sshr_imm v0, 1 + ; check: ushr_imm v2, 30 + ; check: iadd v0, v3 + ; check: band_imm v4, -4 + ; check: isub v0, v5 + return v1 +} + +; shift +function %t_srem32_p2p30(i32) -> i32 { +block0(v0: i32): + v1 = srem_imm v0, 0x4000_0000 + ; check: sshr_imm v0, 29 + ; check: ushr_imm v2, 2 + ; check: iadd v0, v3 + ; check: band_imm v4, 0xffff_ffff_c000_0000 + ; check: isub v0, v5 + return v1 +} + +; shift +function %t_srem32_n2p30(i32) -> i32 { +block0(v0: i32): + v1 = srem_imm v0, -0x4000_0000 + ; check: sshr_imm v0, 29 + ; check: ushr_imm v2, 2 + ; check: iadd v0, v3 + ; check: 
band_imm v4, 0xffff_ffff_c000_0000 + ; check: isub v0, v5 + return v1 +} + +; there's no positive version of this, since -(-0x8000_0000) isn't +; representable. +function %t_srem32_n2p31(i32) -> i32 { +block0(v0: i32): + v1 = srem_imm v0, -0x8000_0000 + ; check: sshr_imm v0, 30 + ; check: ushr_imm v2, 1 + ; check: iadd v0, v3 + ; check: band_imm v4, 0xffff_ffff_8000_0000 + ; check: isub v0, v5 + return v1 +} + + +; -------- S64 -------- + +; ignored +function %t_srem64_n1(i64) -> i64 { +block0(v0: i64): + v1 = srem_imm v0, -1 + ; check: srem_imm v0, -1 + return v1 +} + +; ignored +function %t_srem64_p0(i64) -> i64 { +block0(v0: i64): + v1 = srem_imm v0, 0 + ; check: srem_imm v0, 0 + return v1 +} + +; converted to constant zero +function %t_srem64_p1(i64) -> i64 { +block0(v0: i64): + v1 = srem_imm v0, 1 + ; check: iconst.i64 0 + return v1 +} + +; shift +function %t_srem64_p2(i64) -> i64 { +block0(v0: i64): + v1 = srem_imm v0, 2 + ; check: ushr_imm v0, 63 + ; check: iadd v0, v2 + ; check: band_imm v3, -2 + ; check: isub v0, v4 + return v1 +} + +; shift +function %t_srem64_n2(i64) -> i64 { +block0(v0: i64): + v1 = srem_imm v0, -2 + ; check: ushr_imm v0, 63 + ; check: iadd v0, v2 + ; check: band_imm v3, -2 + ; check: isub v0, v4 + return v1 +} + +; shift +function %t_srem64_p4(i64) -> i64 { +block0(v0: i64): + v1 = srem_imm v0, 4 + ; check: sshr_imm v0, 1 + ; check: ushr_imm v2, 62 + ; check: iadd v0, v3 + ; check: band_imm v4, -4 + ; check: isub v0, v5 + return v1 +} + +; shift +function %t_srem64_n4(i64) -> i64 { +block0(v0: i64): + v1 = srem_imm v0, -4 + ; check: sshr_imm v0, 1 + ; check: ushr_imm v2, 62 + ; check: iadd v0, v3 + ; check: band_imm v4, -4 + ; check: isub v0, v5 + return v1 +} + +; shift +function %t_srem64_p2p62(i64) -> i64 { +block0(v0: i64): + v1 = srem_imm v0, 0x4000_0000_0000_0000 + ; check: sshr_imm v0, 61 + ; check: ushr_imm v2, 2 + ; check: iadd v0, v3 + ; check: band_imm v4, 0xc000_0000_0000_0000 + ; check: isub v0, v5 + return v1 +} + +; 
shift +function %t_srem64_n2p62(i64) -> i64 { +block0(v0: i64): + v1 = srem_imm v0, -0x4000_0000_0000_0000 + ; check: sshr_imm v0, 61 + ; check: ushr_imm v2, 2 + ; check: iadd v0, v3 + ; check: band_imm v4, 0xc000_0000_0000_0000 + ; check: isub v0, v5 + return v1 +} + +; there's no positive version of this, since -(-0x8000_0000_0000_0000) isn't +; representable. +function %t_srem64_n2p63(i64) -> i64 { +block0(v0: i64): + v1 = srem_imm v0, -0x8000_0000_0000_0000 + ; check: sshr_imm v0, 62 + ; check: ushr_imm v2, 1 + ; check: iadd v0, v3 + ; check: band_imm v4, 0x8000_0000_0000_0000 + ; check: isub v0, v5 + return v1 +} diff --git a/cranelift/filetests/filetests/peepmatic/replace_branching_instructions_and_cfg_predecessors.clif b/cranelift/filetests/filetests/peepmatic/replace_branching_instructions_and_cfg_predecessors.clif new file mode 100644 index 0000000000..17ca472b7e --- /dev/null +++ b/cranelift/filetests/filetests/peepmatic/replace_branching_instructions_and_cfg_predecessors.clif @@ -0,0 +1,22 @@ +test peepmatic +target x86_64 + +function u0:2(i64 , i64) { + gv1 = load.i64 notrap aligned gv0 + heap0 = static gv1 + block0(v0: i64, v1: i64): + v16 = iconst.i32 6 + v17 = heap_addr.i64 heap0, v16, 1 + v18 = load.i32 v17 + v19 = iconst.i32 4 + v20 = icmp ne v18, v19 + v21 = bint.i32 v20 + brnz v21, block2 + jump block4 + block4: + jump block1 + block2: + jump block1 + block1: + return +} diff --git a/cranelift/filetests/filetests/peepmatic/simplify32.clif b/cranelift/filetests/filetests/peepmatic/simplify32.clif new file mode 100644 index 0000000000..b1c6786a05 --- /dev/null +++ b/cranelift/filetests/filetests/peepmatic/simplify32.clif @@ -0,0 +1,60 @@ +test peepmatic +target i686 + +;; 32-bits platforms. 
+ +function %iadd_imm(i32) -> i32 { +block0(v0: i32): + v1 = iconst.i32 2 + v2 = iadd v0, v1 + return v2 +} +; sameln: function %iadd_imm +; nextln: block0(v0: i32): +; nextln: v1 = iconst.i32 2 +; nextln: v2 = iadd_imm v0, 2 +; nextln: return v2 +; nextln: } + +function %isub_imm(i32) -> i32 { +block0(v0: i32): + v1 = iconst.i32 2 + v2 = isub v0, v1 + return v2 +} +; sameln: function %isub_imm +; nextln: block0(v0: i32): +; nextln: v1 = iconst.i32 2 +; nextln: v2 = iadd_imm v0, -2 +; nextln: return v2 +; nextln: } + +function %icmp_imm(i32) -> i32 { +block0(v0: i32): + v1 = iconst.i32 2 + v2 = icmp slt v0, v1 + v3 = bint.i32 v2 + return v3 +} +; sameln: function %icmp_imm +; nextln: block0(v0: i32): +; nextln: v1 = iconst.i32 2 +; nextln: v2 = icmp_imm slt v0, 2 +; nextln: v3 = bint.i32 v2 +; nextln: return v3 +; nextln: } + +;; Don't simplify operations that would get illegal because of lack of native +;; support. +function %iadd_imm(i64) -> i64 { +block0(v0: i64): + v1 = iconst.i64 2 + v2 = iadd v0, v1 + return v2 +} +; sameln: function %iadd_imm +; nextln: block0(v0: i64): +; nextln: v1 = iconst.i64 2 +; nextln: v2 = iadd v0, v1 +; nextln: return v2 +; nextln: } diff --git a/cranelift/filetests/filetests/peepmatic/simplify64.clif b/cranelift/filetests/filetests/peepmatic/simplify64.clif new file mode 100644 index 0000000000..93c289ccdd --- /dev/null +++ b/cranelift/filetests/filetests/peepmatic/simplify64.clif @@ -0,0 +1,326 @@ +test peepmatic +target x86_64 + +;; 64-bits platforms. 
+ +function %iadd_imm(i32) -> i32 { +block0(v0: i32): + v1 = iconst.i32 2 + v2 = iadd v0, v1 + return v2 +} +; sameln: function %iadd_imm +; nextln: block0(v0: i32): +; nextln: v1 = iconst.i32 2 +; nextln: v2 = iadd_imm v0, 2 +; nextln: return v2 +; nextln: } + +function %isub_imm(i32) -> i32 { +block0(v0: i32): + v1 = iconst.i32 2 + v2 = isub v0, v1 + return v2 +} +; sameln: function %isub_imm +; nextln: block0(v0: i32): +; nextln: v1 = iconst.i32 2 +; nextln: v2 = iadd_imm v0, -2 +; nextln: return v2 +; nextln: } + +function %icmp_imm(i32) -> i32 { +block0(v0: i32): + v1 = iconst.i32 2 + v2 = icmp slt v0, v1 + v3 = bint.i32 v2 + return v3 +} +; sameln: function %icmp_imm +; nextln: block0(v0: i32): +; nextln: v1 = iconst.i32 2 +; nextln: v2 = icmp_imm slt v0, 2 +; nextln: v3 = bint.i32 v2 +; nextln: return v3 +; nextln: } + +function %ifcmp_imm(i32) -> i32 { +block0(v0: i32): + v1 = iconst.i32 2 + v2 = ifcmp v0, v1 + brif eq v2, block1 + jump block2 + +block1: + v3 = iconst.i32 1 + return v3 + +block2: + v4 = iconst.i32 2 + return v4 +} +; sameln: function %ifcmp_imm +; nextln: block0(v0: i32): +; nextln: v1 = iconst.i32 2 +; nextln: v2 = ifcmp_imm v0, 2 +; nextln: brif eq v2, block1 +; nextln: jump block2 +; nextln: +; nextln: block1: +; nextln: v3 = iconst.i32 1 +; nextln: return v3 +; nextln: +; nextln: block2: +; nextln: v4 = iconst.i32 2 +; nextln: return v4 +; nextln: } + +function %brz_bint(i32) { +block0(v0: i32): + v3 = icmp_imm slt v0, 0 + v1 = bint.i32 v3 + v2 = select v1, v1, v1 + trapz v1, user0 + brz v1, block1 + jump block2 + +block1: + return + +block2: + return +} +; sameln: function %brz_bint +; nextln: (v0: i32): +; nextln: v3 = icmp_imm slt v0, 0 +; nextln: v1 = bint.i32 v3 +; nextln: v2 = select v3, v1, v1 +; nextln: trapz v3, user0 +; nextln: brnz v3, block2 +; nextln: jump block1 + +function %irsub_imm(i32) -> i32 { +block0(v0: i32): + v1 = iconst.i32 2 + v2 = isub v1, v0 + return v2 +} +; sameln: function %irsub_imm +; nextln: block0(v0: 
i32): +; nextln: v1 = iconst.i32 2 +; nextln: v2 = irsub_imm v0, 2 +; nextln: return v2 +; nextln: } + +;; Sign-extensions. + +;; 8 -> 16 +function %uextend_8_16() -> i16 { +block0: + v0 = iconst.i16 37 + v1 = ishl_imm v0, 8 + v2 = ushr_imm v1, 8 + return v2 +} +; sameln: function %uextend_8_16 +; nextln: block0: +; nextln: v0 = iconst.i16 37 +; nextln: v1 = ishl_imm v0, 8 +; nextln: v3 = ireduce.i8 v0 +; nextln: v2 = uextend.i16 v3 +; nextln: return v2 +; nextln: } + +function %sextend_8_16() -> i16 { +block0: + v0 = iconst.i16 37 + v1 = ishl_imm v0, 8 + v2 = sshr_imm v1, 8 + return v2 +} +; sameln: function %sextend_8_16 +; nextln: block0: +; nextln: v0 = iconst.i16 37 +; nextln: v1 = ishl_imm v0, 8 +; nextln: v3 = ireduce.i8 v0 +; nextln: v2 = sextend.i16 v3 +; nextln: return v2 +; nextln: } + +;; 8 -> 32 +function %uextend_8_32() -> i32 { +block0: + v0 = iconst.i32 37 + v1 = ishl_imm v0, 24 + v2 = ushr_imm v1, 24 + return v2 +} +; sameln: function %uextend_8_32 +; nextln: block0: +; nextln: v0 = iconst.i32 37 +; nextln: v1 = ishl_imm v0, 24 +; nextln: v3 = ireduce.i8 v0 +; nextln: v2 = uextend.i32 v3 +; nextln: return v2 +; nextln: } + +function %sextend_8_32() -> i32 { +block0: + v0 = iconst.i32 37 + v1 = ishl_imm v0, 24 + v2 = sshr_imm v1, 24 + return v2 +} +; sameln: function %sextend_8_32 +; nextln: block0: +; nextln: v0 = iconst.i32 37 +; nextln: v1 = ishl_imm v0, 24 +; nextln: v3 = ireduce.i8 v0 +; nextln: v2 = sextend.i32 v3 +; nextln: return v2 +; nextln: } + +;; 16 -> 32 +function %uextend_16_32() -> i32 { +block0: + v0 = iconst.i32 37 + v1 = ishl_imm v0, 16 + v2 = ushr_imm v1, 16 + return v2 +} +; sameln: function %uextend_16_32 +; nextln: block0: +; nextln: v0 = iconst.i32 37 +; nextln: v1 = ishl_imm v0, 16 +; nextln: v3 = ireduce.i16 v0 +; nextln: v2 = uextend.i32 v3 +; nextln: return v2 +; nextln: } + +function %sextend_16_32() -> i32 { +block0: + v0 = iconst.i32 37 + v1 = ishl_imm v0, 16 + v2 = sshr_imm v1, 16 + return v2 +} +; sameln: function 
%sextend_16_32 +; nextln: block0: +; nextln: v0 = iconst.i32 37 +; nextln: v1 = ishl_imm v0, 16 +; nextln: v3 = ireduce.i16 v0 +; nextln: v2 = sextend.i32 v3 +; nextln: return v2 +; nextln: } + +;; 8 -> 64 +function %uextend_8_64() -> i64 { +block0: + v0 = iconst.i64 37 + v1 = ishl_imm v0, 56 + v2 = ushr_imm v1, 56 + return v2 +} +; sameln: function %uextend_8_64 +; nextln: block0: +; nextln: v0 = iconst.i64 37 +; nextln: v1 = ishl_imm v0, 56 +; nextln: v3 = ireduce.i8 v0 +; nextln: v2 = uextend.i64 v3 +; nextln: return v2 +; nextln: } + +function %sextend_8_64() -> i64 { +block0: + v0 = iconst.i64 37 + v1 = ishl_imm v0, 56 + v2 = sshr_imm v1, 56 + return v2 +} +; sameln: function %sextend_8_64 +; nextln: block0: +; nextln: v0 = iconst.i64 37 +; nextln: v1 = ishl_imm v0, 56 +; nextln: v3 = ireduce.i8 v0 +; nextln: v2 = sextend.i64 v3 +; nextln: return v2 +; nextln: } + +;; 16 -> 64 +function %uextend_16_64() -> i64 { +block0: + v0 = iconst.i64 37 + v1 = ishl_imm v0, 48 + v2 = ushr_imm v1, 48 + return v2 +} +; sameln: function %uextend_16_64 +; nextln: block0: +; nextln: v0 = iconst.i64 37 +; nextln: v1 = ishl_imm v0, 48 +; nextln: v3 = ireduce.i16 v0 +; nextln: v2 = uextend.i64 v3 +; nextln: return v2 +; nextln: } + +function %sextend_16_64() -> i64 { +block0: + v0 = iconst.i64 37 + v1 = ishl_imm v0, 48 + v2 = sshr_imm v1, 48 + return v2 +} +; sameln: function %sextend_16_64 +; nextln: block0: +; nextln: v0 = iconst.i64 37 +; nextln: v1 = ishl_imm v0, 48 +; nextln: v3 = ireduce.i16 v0 +; nextln: v2 = sextend.i64 v3 +; nextln: return v2 +; nextln: } + +;; 32 -> 64 +function %uextend_32_64() -> i64 { +block0: + v0 = iconst.i64 37 + v1 = ishl_imm v0, 32 + v2 = ushr_imm v1, 32 + return v2 +} +; sameln: function %uextend_32_64 +; nextln: block0: +; nextln: v0 = iconst.i64 37 +; nextln: v1 = ishl_imm v0, 32 +; nextln: v3 = ireduce.i32 v0 +; nextln: v2 = uextend.i64 v3 +; nextln: return v2 +; nextln: } + +function %sextend_32_64() -> i64 { +block0: + v0 = iconst.i64 37 + 
v1 = ishl_imm v0, 32 + v2 = sshr_imm v1, 32 + return v2 +} +; sameln: function %sextend_32_64 +; nextln: block0: +; nextln: v0 = iconst.i64 37 +; nextln: v1 = ishl_imm v0, 32 +; nextln: v3 = ireduce.i32 v0 +; nextln: v2 = sextend.i64 v3 +; nextln: return v2 +; nextln: } + +function %add_imm_fold(i32) -> i32 { +block0(v0: i32): + v1 = iadd_imm v0, 42 + v2 = iadd_imm v1, -42 + return v2 +} +; sameln: function %add_imm_fold(i32) +; nextln: block0(v0: i32): +; nextln: v2 -> v0 +; nextln: v1 = iadd_imm v0, 42 +; nextln: nop +; nextln: return v2 diff --git a/cranelift/filetests/filetests/peepmatic/simplify_instruction_into_alias_of_value.clif b/cranelift/filetests/filetests/peepmatic/simplify_instruction_into_alias_of_value.clif new file mode 100644 index 0000000000..3000369bb5 --- /dev/null +++ b/cranelift/filetests/filetests/peepmatic/simplify_instruction_into_alias_of_value.clif @@ -0,0 +1,17 @@ +test peepmatic +target x86_64 + +;; The `isub` is a no-op, but we can't replace the whole `isub` instruction with +;; its `v2` operand's instruction because `v2` is one of many results. Instead, +;; we need to make an alias `v3 -> v2`. + +function %replace_inst_with_alias() -> i32 { +block0: + v0 = iconst.i32 0 + v1, v2 = x86_smulx v0, v0 + v3 = isub v2, v0 + ; check: v0 = iconst.i32 0 + ; nextln: v1, v2 = x86_smulx v0, v0 + ; nextln: v3 -> v2 + return v3 +} diff --git a/cranelift/filetests/filetests/simple_preopt/do_not_reorder_instructions_when_transplanting.clif b/cranelift/filetests/filetests/simple_preopt/do_not_reorder_instructions_when_transplanting.clif new file mode 100644 index 0000000000..a1e9f47f5a --- /dev/null +++ b/cranelift/filetests/filetests/simple_preopt/do_not_reorder_instructions_when_transplanting.clif @@ -0,0 +1,22 @@ +test simple_preopt +target x86_64 + +;; Test that although v5 can be replaced with v1, we don't transplant `load.i32 +;; v0` on top of `iadd v3, v4`, because that would move the load past other uses +;; of its result. 
+ +function %foo(i64) -> i32 { +block0(v0: i64): + v1 = load.i32 v0 + v2 = iconst.i32 16 + v3 = iadd_imm v1, -16 + v4 = iconst.i32 16 + v5 = iadd v3, v4 + ; check: v1 = load.i32 v0 + ; nextln: v5 -> v1 + ; nextln: v2 = iconst.i32 16 + ; nextln: v3 = iadd_imm v1, -16 + ; nextln: v4 = iconst.i32 16 + ; nextln: nop + return v5 +} diff --git a/cranelift/filetests/filetests/simple_preopt/replace_branching_instructions_and_cfg_predecessors.clif b/cranelift/filetests/filetests/simple_preopt/replace_branching_instructions_and_cfg_predecessors.clif new file mode 100644 index 0000000000..702896c22d --- /dev/null +++ b/cranelift/filetests/filetests/simple_preopt/replace_branching_instructions_and_cfg_predecessors.clif @@ -0,0 +1,22 @@ +test simple_preopt +target x86_64 + +function u0:2(i64 , i64) { + gv1 = load.i64 notrap aligned gv0 + heap0 = static gv1 + block0(v0: i64, v1: i64): + v16 = iconst.i32 6 + v17 = heap_addr.i64 heap0, v16, 1 + v18 = load.i32 v17 + v19 = iconst.i32 4 + v20 = icmp ne v18, v19 + v21 = bint.i32 v20 + brnz v21, block2 + jump block4 + block4: + jump block1 + block2: + jump block1 + block1: + return +} diff --git a/cranelift/filetests/filetests/simple_preopt/simplify_instruction_into_alias_of_value.clif b/cranelift/filetests/filetests/simple_preopt/simplify_instruction_into_alias_of_value.clif new file mode 100644 index 0000000000..076d7b17b5 --- /dev/null +++ b/cranelift/filetests/filetests/simple_preopt/simplify_instruction_into_alias_of_value.clif @@ -0,0 +1,17 @@ +test simple_preopt +target x86_64 + +;; The `isub` is a no-op, but we can't replace the whole `isub` instruction with +;; its `v2` operand's instruction because `v2` is one of many results. Instead, +;; we need to make an alias `v3 -> v2`. 
+ +function %replace_inst_with_alias() -> i32 { +block0: + v0 = iconst.i32 0 + v1, v2 = x86_smulx v0, v0 + v3 = isub v2, v0 + ; check: v0 = iconst.i32 0 + ; nextln: v1, v2 = x86_smulx v0, v0 + ; nextln: v3 -> v2 + return v3 +} diff --git a/cranelift/filetests/src/lib.rs b/cranelift/filetests/src/lib.rs index bc1a6df1e2..5cf7331225 100644 --- a/cranelift/filetests/src/lib.rs +++ b/cranelift/filetests/src/lib.rs @@ -45,6 +45,7 @@ mod test_domtree; mod test_interpret; mod test_legalizer; mod test_licm; +mod test_peepmatic; mod test_postopt; mod test_preopt; mod test_print_cfg; @@ -128,6 +129,7 @@ fn new_subtest(parsed: &TestCommand) -> subtest::SubtestResult test_interpret::subtest(parsed), "legalizer" => test_legalizer::subtest(parsed), "licm" => test_licm::subtest(parsed), + "peepmatic" => test_peepmatic::subtest(parsed), "postopt" => test_postopt::subtest(parsed), "preopt" => test_preopt::subtest(parsed), "print-cfg" => test_print_cfg::subtest(parsed), diff --git a/cranelift/filetests/src/test_peepmatic.rs b/cranelift/filetests/src/test_peepmatic.rs new file mode 100644 index 0000000000..fc701c7046 --- /dev/null +++ b/cranelift/filetests/src/test_peepmatic.rs @@ -0,0 +1,56 @@ +//! Test command for `peepmatic`-generated peephole optimizers. 
+ +use crate::subtest::{run_filecheck, Context, SubTest, SubtestResult}; +use cranelift_codegen; +use cranelift_codegen::ir::Function; +use cranelift_codegen::print_errors::pretty_error; +use cranelift_reader::TestCommand; +use std::borrow::Cow; + +struct TestPreopt; + +pub fn subtest(parsed: &TestCommand) -> SubtestResult> { + assert_eq!(parsed.command, "peepmatic"); + if parsed.options.is_empty() { + Ok(Box::new(TestPreopt)) + } else { + Err(format!("No options allowed on {}", parsed)) + } +} + +impl SubTest for TestPreopt { + fn name(&self) -> &'static str { + "peepmatic" + } + + fn is_mutating(&self) -> bool { + true + } + + fn needs_isa(&self) -> bool { + true + } + + fn run(&self, func: Cow, context: &Context) -> SubtestResult<()> { + let mut comp_ctx = cranelift_codegen::Context::for_function(func.into_owned()); + let isa = context.isa.expect("preopt needs an ISA"); + + comp_ctx.compute_cfg(); + comp_ctx + .preopt(isa) + .map_err(|e| pretty_error(&comp_ctx.func, context.isa, Into::into(e)))?; + let text = &comp_ctx.func.display(isa).to_string(); + log::debug!("After peepmatic-based simple_preopt:\n{}", text); + + // Only actually run the filecheck if peepmatic is enabled, because it + // can generate slightly different code (alias a result vs replace an + // instruction) than the non-peepmatic versions of peephole + // optimizations. Note that the non-`peepmatic` results can be tested + // with the `test simple_preopt` subtest. 
+ if cfg!(feature = "enable-peepmatic") { + run_filecheck(&text, context) + } else { + Ok(()) + } + } +} diff --git a/cranelift/filetests/src/test_simple_preopt.rs b/cranelift/filetests/src/test_simple_preopt.rs index 286a86ba23..f6cdec391f 100644 --- a/cranelift/filetests/src/test_simple_preopt.rs +++ b/cranelift/filetests/src/test_simple_preopt.rs @@ -38,6 +38,17 @@ impl SubTest for TestSimplePreopt { .preopt(isa) .map_err(|e| pretty_error(&comp_ctx.func, context.isa, Into::into(e)))?; let text = &comp_ctx.func.display(isa).to_string(); - run_filecheck(&text, context) + log::debug!("After simple_preopt:\n{}", text); + + // Only actually run the filecheck if peepmatic is *not* enabled, + // because it can generate slightly different code (alias a result vs + // replace an instruction) than the non-peepmatic versions of peephole + // optimizations. Note that the `peepmatic`-based results can be tested + // with the `test peepmatic` subtest. + if cfg!(feature = "enable-peepmatic") { + Ok(()) + } else { + run_filecheck(&text, context) + } } } diff --git a/cranelift/peepmatic/Cargo.toml b/cranelift/peepmatic/Cargo.toml new file mode 100644 index 0000000000..abe9676f0b --- /dev/null +++ b/cranelift/peepmatic/Cargo.toml @@ -0,0 +1,15 @@ +[package] +name = "peepmatic" +version = "0.1.0" +authors = ["Nick Fitzgerald "] +edition = "2018" + +# See more keys and their definitions at https://doc.rust-lang.org/cargo/reference/manifest.html + +[dependencies] +anyhow = "1.0.27" +peepmatic-automata = { version = "0.1.0", path = "crates/automata", features = ["dot"] } +peepmatic-macro = { version = "0.1.0", path = "crates/macro" } +peepmatic-runtime = { version = "0.1.0", path = "crates/runtime", features = ["construct"] } +wast = "15.0.0" +z3 = { version = "0.5.1", features = ["static-link-z3"] } diff --git a/cranelift/peepmatic/README.md b/cranelift/peepmatic/README.md new file mode 100644 index 0000000000..550f6d310d --- /dev/null +++ b/cranelift/peepmatic/README.md @@ -0,0 
+1,423 @@ +
+

peepmatic

+ +

+ + peepmatic is a DSL and compiler for peephole optimizers for + Cranelift. + +

+ + + +
+ + + + + +- [About](#about) +- [Example](#example) +- [A DSL for Optimizations](#a-dsl-for-optimizations) + - [Variables](#variables) + - [Constants](#constants) + - [Nested Patterns](#nested-patterns) + - [Preconditions and Unquoting](#preconditions-and-unquoting) + - [Bit Widths](#bit-widths) +- [Implementation](#implementation) + - [Parsing](#parsing) + - [Type Checking](#type-checking) + - [Linearization](#linearization) + - [Automatization](#automatization) +- [References](#references) +- [Acknowledgments](#acknowledgments) + + + +## About + +Peepmatic is a DSL for peephole optimizations and compiler for generating +peephole optimizers from them. The user writes a set of optimizations in the +DSL, and then `peepmatic` compiles the set of optimizations into an efficient +peephole optimizer: + +``` +DSL ----peepmatic----> Peephole Optimizer +``` + +The generated peephole optimizer has all of its optimizations' left-hand sides +collapsed into a compact automata that makes matching candidate instruction +sequences fast. + +The DSL's optimizations may be written by hand or discovered mechanically with a +superoptimizer like [Souper][]. Eventually, `peepmatic` should have a verifier +that ensures that the DSL's optimizations are sound, similar to what [Alive][] +does for LLVM optimizations. + +Currently, `peepmatic` is targeting peephole optimizers that operate on +Cranelift's clif intermediate representation. The intended next target is +Cranelift's new backend's "vcode" intermediate representation. Supporting +non-Cranelift targets is not a goal. 
+ +[Cranelift]: https://github.com/bytecodealliance/wasmtime/tree/master/cranelift#readme +[Souper]: https://github.com/google/souper +[Alive]: https://github.com/AliveToolkit/alive2 + +## Example + +This snippet of our DSL describes optimizations for removing redundant +bitwise-or instructions that are no-ops: + +```lisp +(=> (bor $x (bor $x $y)) + (bor $x $y)) + +(=> (bor $y (bor $x $y)) + (bor $x $y)) + +(=> (bor (bor $x $y) $x) + (bor $x $y)) + +(=> (bor (bor $x $y) $y) + (bor $x $y)) +``` + +When compiled into a peephole optimizer automaton, they look like this: + +![](examples/redundant-bor.png) + +## A DSL for Optimizations + +A single peephole optimization has two parts: + +1. A **left-hand side** that describes candidate instruction sequences that the + optimization applies to. +2. A **right-hand side** that contains the new instruction sequence that + replaces old instruction sequences that the left-hand side matched. + +A left-hand side may bind sub-expressions to variables and the right-hand side +may contain those bound variables to reuse the sub-expressions. The operations +inside the left-hand and right-hand sides are a subset of clif operations. + +Let's take a look at an example: + +```lisp +(=> (imul $x 2) + (ishl $x 1)) +``` + +As you can see, the DSL uses S-expressions. (S-expressions are easy to parse and +we also have a bunch of nice parsing infrastructure for S-expressions already +for our [`wat`][wat] and [`wast`][wast] crates.) + +[wat]: https://crates.io/crates/wat +[wast]: https://crates.io/crates/wast + +The left-hand side of this optimization is `(imul $x 2)`. It matches integer +multiplication operations where a value is multiplied by the constant two. The +value multiplied by two is bound to the variable `$x`. + +The right-hand side of this optimization is `(ishl $x 1)`. It reuses the `$x` +variable that was bound in the left-hand side. + +This optimization replaces expressions of the form `x * 2` with `x << 1`. 
This
+is sound because multiplication by two is the same as shifting left by one for
+binary integers, and it is desirable because a shift-left instruction executes
+in fewer cycles than a multiplication.
+
+The general form of an optimization is:
+
+```lisp
+(=> <left-hand side> <right-hand side>)
+```
+
+### Variables
+
+Variables begin with a dollar sign and are followed by lowercase letters,
+numbers, hyphens, and underscores: `$x`, `$y`, `$my-var`, `$operand2`.
+
+Left-hand side patterns may contain variables that match any kind of
+sub-expression and give it a name so that it may be reused in the right-hand
+side.
+
+```lisp
+;; Replace `x + 0` with simply `x`.
+(=> (iadd $x 0)
+    $x)
+```
+
+Within a pattern, every occurrence of a variable with the same name must match
+the same value. That is `(iadd $x $x)` matches `(iadd 1 1)` but does not match
+`(iadd 1 2)`. This lets us write optimizations such as this:
+
+```lisp
+;; Xor'ing a value with itself is always zero.
+(=> (bxor $x $x)
+    (iconst 0))
+```
+
+### Constants
+
+We've already seen specific integer literals and wildcard variables in patterns,
+but we can also match any constant. These are written similar to variables, but
+use uppercase letters rather than lowercase: `$C`, `$MY-CONST`, and `$OPERAND2`.
+
+For example, we can use constant patterns to combine an `iconst` and `iadd` into
+a single `iadd_imm` instruction:
+
+```lisp
+(=> (iadd (iconst $C) $x)
+    (iadd_imm $C $x))
+```
+
+### Nested Patterns
+
+Patterns can also match nested operations with their own nesting:
+
+```lisp
+(=> (bor $x (bor $x $y))
+    (bor $x $y))
+```
+
+### Preconditions and Unquoting
+
+Let's reconsider our first example optimization:
+
+```lisp
+(=> (imul $x 2)
+    (ishl $x 1))
+```
+
+This optimization is a little too specific. Here is another version of this
+optimization that we'd like to support:
+
+```lisp
+(=> (imul $x 4)
+    (ishl $x 2))
+```
+
+We don't want to have to write out all instances of this general class of
+optimizations!
That would be a lot of repetition and could also bloat the size
+of our generated peephole optimizer's matching automata.
+
+Instead, we can generalize this optimization by matching any multiplication by a
+power of two constant `C` and replacing it with a shift left of `log2(C)`.
+
+First, rather than match `2` directly, we want to match any constant variable `C`:
+
+```lisp
+(imul $x $C)
+```
+
+Note that variables begin with lowercase letters, while constants begin with
+uppercase letters. Both the constant pattern `$C` and variable pattern `$x` will
+match `5`, but only the variable pattern `$x` will match a whole sub-expression
+like `(iadd 1 2)`. The constant pattern `$C` only matches constant values.
+
+Next, we augment our left-hand side's pattern with a **precondition** that the
+constant `$C` must be a power of two. Preconditions are introduced by wrapping
+a pattern in the `when` form:
+
+```lisp
+;; Our new left-hand side, augmenting a pattern with a precondition!
+(when
+  ;; The pattern matching multiplication by a constant value.
+  (imul $x $C)
+
+  ;; The precondition that $C must be a power of two.
+  (is-power-of-two $C))
+ ```
+
+In the right-hand side, we use **unquoting** to perform compile-time evaluation
+of `log2($C)`. Unquoting is done with the `$(...)` form:
+
+```lisp
+;; Our new right-hand side, using unquoting to do compile-time evaluation of
+;; constants that were matched and bound in the left-hand side!
+(ishl $x $(log2 $C))
+```
+
+Finally, here is the general optimization putting our new left-hand and
+right-hand sides together:
+
+```lisp
+(=> (when (imul $x $C)
+          (is-power-of-two $C))
+    (ishl $x $(log2 $C)))
+```
+
+### Bit Widths
+
+Similar to how Cranelift's instructions are bit-width polymorphic, `peepmatic`
+optimizations are also bit-width polymorphic. Unless otherwise specified, a
+pattern will match expressions manipulating `i32`s just the same as expressions
+manipulating `i64`s, etc...
An optimization that doesn't constrain its pattern's +bit widths must be valid for all bit widths: + +* 1 +* 8 +* 16 +* 32 +* 64 +* 128 + +To constrain an optimization to only match `i32`s, for example, you can use the +`bit-width` precondition: + +```lisp +(=> (when (iadd $x $y) + (bit-width $x 32) + (bit-width $y 32)) + ...) +``` + +Alternatively, you can ascribe a type to an operation by putting the type inside +curly brackets after the operator, like this: + +```lisp +(=> (when (sextend{i64} (ireduce{i32} $x)) + (bit-width $x 64)) + (sshr (ishl $x 32) 32)) +``` + +## Implementation + +Peepmatic has roughly four phases: + +1. Parsing +2. Type Checking +3. Linearization +4. Automatization + +(I say "roughly" because there are a couple micro-passes that happen after +linearization and before automatization. But those are the four main phases.) + +### Parsing + +Parsing transforms the DSL source text into an abstract syntax tree (AST). + +We use [the `wast` crate][wast]. It gives us nicely formatted errors with source +context, as well as some other generally nice-to-have parsing infrastructure. + +Relevant source files: + +* `src/parser.rs` +* `src/ast.rs` + +[wast]: https://crates.io/crates/wast + +### Type Checking + +Type checking operates on the AST. It checks that types and bit widths in the +optimizations are all valid. For example, it ensures that the type and bit width +of an optimization's left-hand side is the same as its right-hand side, because +it doesn't make sense to replace an integer expression with a boolean +expression. + +After type checking is complete, certain AST nodes are assigned a type and bit +width, that are later used in linearization and when matching and applying +optimizations. + +We walk the AST and gather type constraints. Every constraint is associated with +a span in the source file. We hand these constraints off to Z3. In the case that +there are type errors (i.e. 
Z3 returns `unsat`), we get the constraints that are
+in conflict with each other via `z3::Solver::get_unsat_core` and report the type
+errors to the user, with the source context, thanks to the constraints'
+associated spans.
+
+Using Z3 not only makes implementing type checking easier than it otherwise
+would be, but makes it that much easier to extend type checking with searching
+for counterexample inputs in the future. That is, inputs for which the RHS is
+not equivalent to the LHS, implying that the optimization is unsound.
+
+Relevant source files:
+
+* `src/verify.rs`
+
+### Linearization
+
+Linearization takes the AST of optimizations and converts each optimization into
+a linear form. The goal is to make automaton construction easier in the
+automatization step, as well as simplifying the language to make matching and
+applying optimizations easier.
+
+Each optimization's left-hand side is converted into a sequence of
+
+* match operation,
+* path to the instruction/value/immediate to which the operation is applied, and
+* expected result of the operation.
+
+All match operations must have the expected result for the optimization to be
+applicable to an instruction sequence.
+
+Each optimization's right-hand side is converted into a sequence of build
+actions. These are commands that describe how to construct the right-hand side,
+given that the left-hand side has been matched.
+
+Relevant source files:
+
+* `src/linearize.rs`
+* `src/linear_passes.rs`
+* `crates/runtime/src/linear.rs`
+
+### Automatization
+
+Automatization takes a set of linear optimizations and combines them into a
+transducer automaton. This automaton is the final, compiled peephole
+optimizations. The goal is to de-duplicate as much as we can from all the linear
+optimizations, producing as compact and cache-friendly a representation as we
+can.
+
+A plain automaton can tell you whether it matches an input string. It can be
+thought of as a compact representation of a set of strings.
A transducer is a +type of automaton that doesn't just match input strings, but can map them to +output values. It can be thought of as a compact representation of a dictionary +or map. By using transducers, we de-duplicate not only the prefix and suffix of +the match operations, but also the right-hand side build actions. + +Each state in the emitted transducers is associated with a match operation and +path. The transitions out of that state are over the result of the match +operation. Each transition optionally accumulates some RHS build actions. By the +time we reach a final state, the RHS build actions are complete and can be +interpreted to apply the matched optimization. + +The relevant source files for constructing the transducer automaton are: + +* `src/automatize.rs` +* `crates/automata/src/lib.rs` + +The relevant source files for the runtime that interprets the transducers and +applies optimizations are: + +* `crates/runtime/src/optimizations.rs` +* `crates/runtime/src/optimizer.rs` + +## References + +I found these resources helpful when designing `peepmatic`: + +* [Extending tree pattern matching for application to peephole + optimizations](https://pure.tue.nl/ws/portalfiles/portal/125543109/Thesis_JanekvOirschot.pdf) + by van Oirschot + +* [Interpreted Pattern Match Execution for + MLIR](https://drive.google.com/drive/folders/1hb_sXbdMbIz95X-aaa6Vf5wSYRwsJuve) + by Jeff Niu + +* [Direct Construction of Minimal Acyclic Subsequential + Transducers](http://citeseerx.ist.psu.edu/viewdoc/download?doi=10.1.1.24.3698&rep=rep1&type=pdf) + by Mihov and Maurel + +* [Index 1,600,000,000 Keys with Automata and + Rust](https://blog.burntsushi.net/transducers/) and [the `fst` + crate](https://crates.io/crates/fst) by Andrew Gallant + +## Acknowledgments + +Thanks to [Jubi Taneja], [Dan Gohman], [John Regehr], and [Nuno Lopes] for their +input in design discussions and for sharing helpful resources! 
+ +[Jubi Taneja]: https://www.cs.utah.edu/~jubi/ +[Dan Gohman]: https://github.com/sunfishcode +[John Regehr]: https://www.cs.utah.edu/~regehr/ +[Nuno Lopes]: http://web.ist.utl.pt/nuno.lopes/ diff --git a/cranelift/peepmatic/crates/automata/Cargo.toml b/cranelift/peepmatic/crates/automata/Cargo.toml new file mode 100644 index 0000000000..27c89230af --- /dev/null +++ b/cranelift/peepmatic/crates/automata/Cargo.toml @@ -0,0 +1,18 @@ +[package] +name = "peepmatic-automata" +version = "0.1.0" +authors = ["Nick Fitzgerald "] +edition = "2018" + +[package.metadata.docs.rs] +all-features = true + +[dependencies] +serde = { version = "1.0.106", optional = true } + +[features] +# Enable support for generating GraphViz Dot files that can be used to visually +# render an automaton. +# +# https://en.wikipedia.org/wiki/DOT_%28graph_description_language%29 +dot = [] diff --git a/cranelift/peepmatic/crates/automata/src/dot.rs b/cranelift/peepmatic/crates/automata/src/dot.rs new file mode 100644 index 0000000000..bc102d1f81 --- /dev/null +++ b/cranelift/peepmatic/crates/automata/src/dot.rs @@ -0,0 +1,273 @@ +//! Helpers for generating [GraphViz +//! Dot](https://graphviz.gitlab.io/_pages/pdf/dotguide.pdf) files to visually +//! render automata. +//! +//! **This module only exists when the `"dot"` cargo feature is enabled.** + +use crate::{Automaton, Output, State}; +use std::fmt::{Debug, Display}; +use std::fs; +use std::hash::Hash; +use std::io::{self, Write}; +use std::path::Path; + +/// Format the user-provided bits of an `Automaton` for Graphviz Dot output. +/// +/// There are two provided implementations of `DotFmt`: +/// +/// * [`DebugDotFmt`][crate::dot::DebugDotFmt] -- format each type parameter +/// with its `std::fmt::Debug` implementation. +/// +/// * [`DisplayDotFmt`][crate::dot::DisplayDotFmt] -- format each type parameter +/// with its `std::fmt::Display` implementation. 
+/// +/// You can also implement this trait yourself if your type parameters don't +/// implement `Debug` or `Display`, or if you want to format them in some other +/// way. +pub trait DotFmt { + /// Format a transition edge: `from ---input---> to`. + /// + /// This will be inside an [HTML + /// label](https://www.graphviz.org/doc/info/shapes.html#html), so you may + /// use balanced HTML tags. + fn fmt_transition( + &self, + w: &mut impl Write, + from: Option<&TState>, + input: &TAlphabet, + to: Option<&TState>, + ) -> io::Result<()>; + + /// Format the custom data associated with a state. + /// + /// This will be inside an [HTML + /// label](https://www.graphviz.org/doc/info/shapes.html#html), so you may + /// use balanced HTML tags. + fn fmt_state(&self, w: &mut impl Write, state: &TState) -> io::Result<()>; + + /// Format a transition's output or the final output of a final state. + /// + /// This will be inside an [HTML + /// label](https://www.graphviz.org/doc/info/shapes.html#html), so you may + /// use balanced HTML tags. + fn fmt_output(&self, w: &mut impl Write, output: &TOutput) -> io::Result<()>; +} + +impl Automaton +where + TAlphabet: Clone + Eq + Hash + Ord, + TState: Clone + Eq + Hash, + TOutput: Output, +{ + /// Write this `Automaton` out as a [GraphViz + /// Dot](https://graphviz.gitlab.io/_pages/pdf/dotguide.pdf) file at the + /// given path. + /// + /// The `formatter` parameter controls how `TAlphabet`, `TState`, and + /// `TOutput` are rendered. See the [`DotFmt`][crate::dot::DotFmt] trait for + /// details. + /// + /// **This method only exists when the `"dot"` cargo feature is enabled.** + pub fn write_dot_file( + &self, + formatter: &impl DotFmt, + path: impl AsRef, + ) -> io::Result<()> { + let mut file = fs::File::create(path)?; + self.write_dot(formatter, &mut file)?; + Ok(()) + } + + /// Write this `Automaton` out to the given write-able as a [GraphViz + /// Dot](https://graphviz.gitlab.io/_pages/pdf/dotguide.pdf) file. 
+ /// + /// The `formatter` parameter controls how `TAlphabet`, `TState`, and + /// `TOutput` are rendered. See the [`DotFmt`][crate::dot::DotFmt] trait for + /// details. + /// + /// **This method only exists when the `"dot"` cargo feature is enabled.** + pub fn write_dot( + &self, + formatter: &impl DotFmt, + w: &mut impl Write, + ) -> io::Result<()> { + writeln!(w, "digraph {{")?; + writeln!(w, " rankdir = \"LR\";")?; + writeln!(w, " nodesep = 2;")?; + + // Fake state for the incoming arrow to the start state. + writeln!(w, " \"\" [shape = none];")?; + + // Each state, its associated custom data, and its final output. + for (i, state_data) in self.state_data.iter().enumerate() { + write!( + w, + r#" state_{i} [shape = {shape}, label = <")?; + if let Some(final_output) = self.final_states.get(&State(i as u32)) { + write!(w, r#"")?; + } + writeln!(w, "
{i}
"#, + i = i, + shape = if self.final_states.contains_key(&State(i as u32)) { + "doublecircle" + } else { + "circle" + } + )?; + if let Some(state_data) = state_data { + formatter.fmt_state(w, state_data)?; + } else { + write!(w, "(no state data)")?; + } + write!(w, "
"#)?; + formatter.fmt_output(w, final_output)?; + write!(w, "
>];")?; + } + + // Fake transition to the start state. + writeln!(w, r#" "" -> state_{};"#, self.start_state.0)?; + + // Transitions between states and their outputs. + for (from, transitions) in self.transitions.iter().enumerate() { + for (input, (to, output)) in transitions { + write!( + w, + r#" state_{from} -> state_{to} [label = <
Input:"#, + from = from, + to = to.0, + )?; + formatter.fmt_transition( + w, + self.state_data[from].as_ref(), + input, + self.state_data[to.0 as usize].as_ref(), + )?; + write!( + w, + r#"
Output:"#, + )?; + formatter.fmt_output(w, output)?; + writeln!(w, "
>];")?; + } + } + + writeln!(w, "}}")?; + Ok(()) + } +} + +/// Format an `Automaton`'s `TAlphabet`, `TState`, and `TOutput` with their +/// `std::fmt::Debug` implementations. +#[derive(Debug)] +pub struct DebugDotFmt; + +impl DotFmt for DebugDotFmt +where + TAlphabet: Debug, + TState: Debug, + TOutput: Debug, +{ + fn fmt_transition( + &self, + w: &mut impl Write, + _from: Option<&TState>, + input: &TAlphabet, + _to: Option<&TState>, + ) -> io::Result<()> { + write!(w, r#"{:?}"#, input) + } + + fn fmt_state(&self, w: &mut impl Write, state: &TState) -> io::Result<()> { + write!(w, r#"{:?}"#, state) + } + + fn fmt_output(&self, w: &mut impl Write, output: &TOutput) -> io::Result<()> { + write!(w, r#"{:?}"#, output) + } +} + +/// Format an `Automaton`'s `TAlphabet`, `TState`, and `TOutput` with their +/// `std::fmt::Display` implementations. +#[derive(Debug)] +pub struct DisplayDotFmt; + +impl DotFmt for DisplayDotFmt +where + TAlphabet: Display, + TState: Display, + TOutput: Display, +{ + fn fmt_transition( + &self, + w: &mut impl Write, + _from: Option<&TState>, + input: &TAlphabet, + _to: Option<&TState>, + ) -> io::Result<()> { + write!(w, "{}", input) + } + + fn fmt_state(&self, w: &mut impl Write, state: &TState) -> io::Result<()> { + write!(w, "{}", state) + } + + fn fmt_output(&self, w: &mut impl Write, output: &TOutput) -> io::Result<()> { + write!(w, "{}", output) + } +} + +#[cfg(test)] +mod tests { + use super::*; + use crate::Builder; + + #[test] + fn test_write_dot() { + let mut builder = Builder::::new(); + + // Insert "mon" -> 1 + let mut insertion = builder.insert(); + insertion.next('m', 1).next('o', 0).next('n', 0); + insertion.finish(); + + // Insert "sat" -> 6 + let mut insertion = builder.insert(); + insertion.next('s', 6).next('a', 0).next('t', 0); + insertion.finish(); + + // Insert "sun" -> 0 + let mut insertion = builder.insert(); + insertion.next('s', 0).next('u', 0).next('n', 0); + insertion.finish(); + + let automata = builder.finish(); + + 
let expected = r#" +digraph { + rankdir = "LR"; + nodesep = 2; + "" [shape = none]; + state_0 [shape = doublecircle, label = <
0
(no state data)
0
>]; + state_1 [shape = circle, label = <
1
(no state data)
>]; + state_2 [shape = circle, label = <
2
(no state data)
>]; + state_3 [shape = circle, label = <
3
(no state data)
>]; + state_4 [shape = circle, label = <
4
(no state data)
>]; + state_5 [shape = circle, label = <
5
(no state data)
>]; + "" -> state_5; + state_1 -> state_0 [label = <
Input:'n'
Output:0
>]; + state_2 -> state_1 [label = <
Input:'o'
Output:0
>]; + state_3 -> state_0 [label = <
Input:'t'
Output:0
>]; + state_4 -> state_3 [label = <
Input:'a'
Output:6
>]; + state_4 -> state_1 [label = <
Input:'u'
Output:0
>]; + state_5 -> state_2 [label = <
Input:'m'
Output:1
>]; + state_5 -> state_4 [label = <
Input:'s'
Output:0
>]; +} +"#; + + let mut buf = vec![]; + automata.write_dot(&DebugDotFmt, &mut buf).unwrap(); + let actual = String::from_utf8(buf).unwrap(); + eprintln!("{}", actual); + assert_eq!(expected.trim(), actual.trim()); + } +} diff --git a/cranelift/peepmatic/crates/automata/src/lib.rs b/cranelift/peepmatic/crates/automata/src/lib.rs new file mode 100644 index 0000000000..6ed09a66e3 --- /dev/null +++ b/cranelift/peepmatic/crates/automata/src/lib.rs @@ -0,0 +1,1024 @@ +//! Finite-state transducer automata. +//! +//! A transducer is a type of automata that has not only an input that it +//! accepts or rejects, but also an output. While regular automata check whether +//! an input string is in the set that the automata accepts, a transducer maps +//! the input strings to values. A regular automata is sort of a compressed, +//! immutable set, and a transducer is sort of a compressed, immutable key-value +//! dictionary. A [trie] compresses a set of strings or map from a string to a +//! value by sharing prefixes of the input string. Automata and transducers can +//! compress even better: they can share both prefixes and suffixes. [*Index +//! 1,600,000,000 Keys with Automata and Rust* by Andrew Gallant (aka +//! burntsushi)][burntsushi-blog-post] is a top-notch introduction. +//! +//! If you're looking for a general-purpose transducers crate in Rust you're +//! probably looking for [the `fst` crate][fst-crate]. While this implementation +//! is fully generic and has no dependencies, its feature set is specific to +//! `peepmatic`'s needs: +//! +//! * We need to associate extra data with each state: the match operation to +//! evaluate next. +//! +//! * We can't provide the full input string up front, so this crate must +//! support incremental lookups. This is because the peephole optimizer is +//! computing the input string incrementally and dynamically: it looks at the +//! current state's match operation, evaluates it, and then uses the result as +//! 
the next character of the input string. +//! +//! * We also support incremental insertion and output when building the +//! transducer. This is necessary because we don't want to emit output values +//! that bind a match on an optimization's left-hand side's pattern (for +//! example) until after we've succeeded in matching it, which might not +//! happen until we've reached the n^th state. +//! +//! * We need to support generic output values. The `fst` crate only supports +//! `u64` outputs, while we need to build up an optimization's right-hand side +//! instructions. +//! +//! This implementation is based on [*Direct Construction of Minimal Acyclic +//! Subsequential Transducers* by Mihov and Maurel][paper]. That means that keys +//! must be inserted in lexicographic order during construction. +//! +//! [trie]: https://en.wikipedia.org/wiki/Trie +//! [burntsushi-blog-post]: https://blog.burntsushi.net/transducers/#ordered-maps +//! [fst-crate]: https://crates.io/crates/fst +//! [paper]: http://citeseerx.ist.psu.edu/viewdoc/download?doi=10.1.1.24.3698&rep=rep1&type=pdf + +#![deny(missing_debug_implementations)] +#![deny(missing_docs)] + +mod output_impls; + +#[cfg(feature = "serde")] +mod serde_impls; + +#[cfg(feature = "dot")] +pub mod dot; + +use std::collections::{BTreeMap, HashMap, HashSet}; +use std::convert::TryInto; +use std::hash::Hash; +use std::iter; +use std::mem; + +/// An output type for a transducer automata. +/// +/// Not every type can be the output of a transducer. For correctness (not +/// memory safety) each type that implements this trait must satisfy the +/// following laws: +/// +/// 1. `concat(empty(), x) == x` -- concatenating something with the empty +/// instance produces that same something. +/// +/// 2. `prefix(a, b) == prefix(b, a)` -- taking the prefix of two instances is +/// commutative. +/// +/// 3. `prefix(empty(), x) == empty()` -- the prefix of any value and the empty +/// instance is the empty instance. +/// +/// 4. 
`difference(concat(a, b), a) == b` -- concatenating a prefix value and +/// then removing it is the identity function. +/// +/// ## Example +/// +/// Here is an example implementation for unsigned integers: +/// +/// ``` +/// use peepmatic_automata::Output; +/// +/// #[derive(Clone, Copy, Debug, PartialEq, Eq, PartialOrd, Ord, Hash)] +/// struct MyInt(u64); +/// +/// impl Output for MyInt { +/// // The empty value is zero. +/// fn empty() -> Self { +/// MyInt(0) +/// } +/// +/// // The prefix of two values is their min. +/// fn prefix(a: &MyInt, b: &MyInt) -> Self { +/// std::cmp::min(*a, *b) +/// } +/// +/// // The difference is subtraction. +/// fn difference(a: &MyInt, b: &MyInt) -> Self { +/// MyInt(a.0 - b.0) +/// } +/// +/// // Concatenation is addition. +/// fn concat(a: &MyInt, b: &MyInt) -> Self { +/// MyInt(a.0 + b.0) +/// } +/// } +/// +/// // Law 1 +/// assert_eq!( +/// MyInt::concat(&MyInt::empty(), &MyInt(5)), +/// MyInt(5), +/// ); +/// +/// // Law 2 +/// assert_eq!( +/// MyInt::prefix(&MyInt(3), &MyInt(5)), +/// MyInt::prefix(&MyInt(5), &MyInt(3)) +/// ); +/// +/// // Law 3 +/// assert_eq!( +/// MyInt::prefix(&MyInt::empty(), &MyInt(5)), +/// MyInt::empty() +/// ); +/// +/// // Law 4 +/// assert_eq!( +/// MyInt::difference(&MyInt::concat(&MyInt(2), &MyInt(3)), &MyInt(2)), +/// MyInt(3), +/// ); +/// ``` +pub trait Output: Sized + Eq + Hash + Clone { + /// Construct the empty instance. + fn empty() -> Self; + + /// Is this the empty instance? + /// + /// The default implementation constructs the empty instance and then checks + /// if `self` is equal to it. Override this default if you can provide a + /// better implementation. + fn is_empty(&self) -> bool { + *self == Self::empty() + } + + /// Get the shared prefix of two instances. + /// + /// This must be commutative. + fn prefix(a: &Self, b: &Self) -> Self; + + /// When `b` is a prefix of `a`, get the remaining suffix of `a` that is not + /// shared with `b`. 
+ fn difference(a: &Self, b: &Self) -> Self; + + /// Concatenate `a` and `b`. + fn concat(a: &Self, b: &Self) -> Self; +} + +/// A builder for a transducer automata. +/// +/// ## Type Parameters +/// +/// Generic over the following parameters: +/// +/// * `TAlphabet` -- the alphabet of the input strings. If your input keys are +/// `String`s, this would be `char`. If your input keys are arbitrary byte +/// strings, this would be `u8`. +/// +/// * `TState` -- extra, custom data associated with each state. This isn't used +/// by the automata itself, but you can use it to annotate states with extra +/// information for your own purposes. +/// +/// * `TOutput` -- the output type. See [the `Output` trait][crate::Output] for +/// the requirements that any output type must fulfill. +/// +/// ## Insertions +/// +/// Insertions *must* happen in lexicographic order. Failure to do this, or +/// inserting duplicates, will trigger panics. +/// +/// ## Example +/// +/// ``` +/// use peepmatic_automata::Builder; +/// +/// let mut builder = Builder::::new(); +/// +/// // Insert "mon" -> 1 +/// let mut insertion = builder.insert(); +/// insertion +/// .next(b'm', 1) +/// .next(b'o', 0) +/// .next(b'n', 0); +/// insertion.finish(); +/// +/// // Insert "sat" -> 6 +/// let mut insertion = builder.insert(); +/// insertion +/// .next(b's', 6) +/// .next(b'a', 0) +/// .next(b't', 0); +/// insertion.finish(); +/// +/// // Insert "sun" -> 0 +/// let mut insertion = builder.insert(); +/// insertion +/// .next(b's', 0) +/// .next(b'u', 0) +/// .next(b'n', 0); +/// insertion.finish(); +/// +/// let automata = builder.finish(); +/// +/// assert_eq!(automata.get(b"sun"), Some(0)); +/// assert_eq!(automata.get(b"mon"), Some(1)); +/// assert_eq!(automata.get(b"sat"), Some(6)); +/// +/// assert!(automata.get(b"tues").is_none()); +/// ``` +#[derive(Debug, Clone)] +pub struct Builder +where + TAlphabet: Clone + Eq + Hash + Ord, + TState: Clone + Eq + Hash, + TOutput: Output, +{ + inner: Option>, +} 
+ +impl Builder +where + TAlphabet: Clone + Eq + Hash + Ord, + TState: Clone + Eq + Hash, + TOutput: Output, +{ + /// Make a new builder to start constructing a new transducer automata. + pub fn new() -> Self { + let mut inner = BuilderInner { + frozen: vec![], + wip: BTreeMap::new(), + wip_state_id_counter: 0, + unfinished: vec![], + already_frozen: HashMap::new(), + last_insertion_finished: true, + }; + + // Create the start state. + let id = inner.new_wip_state(); + inner.unfinished.push(id); + + Builder { inner: Some(inner) } + } + + fn inner(&mut self) -> &mut BuilderInner { + self.inner + .as_mut() + .expect("cannot use `Builder` anymore after calling `finish` on it") + } + + /// Start building a new key/value insertion. + /// + /// Insertions are built up incrementally, and a full entry is created from + /// a series of `TAlphabet` and `TOutput` pairs passed to + /// [`InsertionBuilder::next`][crate::InsertionBuilder::next]. + /// + /// ## Panics + /// + /// Panics if [`finish`][crate::InsertionBuilder::finish] was not called on + /// the last `InsertionBuilder` returned from this method. + pub fn insert(&mut self) -> InsertionBuilder { + let inner = self.inner(); + assert!( + inner.last_insertion_finished, + "did not call `finish` on the last `InsertionBuilder`" + ); + inner.last_insertion_finished = false; + InsertionBuilder { + inner: inner, + index: 0, + output: TOutput::empty(), + } + } + + /// Finish building this transducer and return the constructed `Automaton`. + /// + /// ## Panics + /// + /// Panics if this builder is empty, and has never had anything inserted + /// into it. + /// + /// Panics if the last insertion's + /// [`InsertionBuilder`][crate::InsertionBuilder] did not call its + /// [finish][crate::InsertionBuilder::finish] method. 
+ pub fn finish(&mut self) -> Automaton { + let mut inner = self + .inner + .take() + .expect("cannot use `Builder` anymore after calling `finish` on it"); + assert!(inner.last_insertion_finished); + + let wip_start = inner.unfinished[0]; + + // Freeze everything! We're done! + let wip_to_frozen = inner.freeze_from(0); + assert!(inner.wip.is_empty()); + assert!(inner.unfinished.is_empty()); + + // Now transpose our states and transitions into our packed, + // struct-of-arrays representation that we use inside `Automaton`. + let FrozenStateId(s) = wip_to_frozen[&wip_start]; + let start_state = State(s); + let mut state_data = vec![None; inner.frozen.len()]; + let mut transitions = (0..inner.frozen.len()) + .map(|_| BTreeMap::new()) + .collect::>(); + let mut final_states = BTreeMap::new(); + + assert!((inner.frozen.len() as u64) < (std::u32::MAX as u64)); + for (i, state) in inner.frozen.into_iter().enumerate() { + assert!(state_data[i].is_none()); + assert!(transitions[i].is_empty()); + + state_data[i] = state.state_data; + + for (input, (FrozenStateId(to_state), output)) in state.transitions { + assert!((to_state as usize) < transitions.len()); + transitions[i].insert(input, (State(to_state), output)); + } + + if state.is_final { + final_states.insert(State(i as u32), state.final_output); + } else { + assert!(state.final_output.is_empty()); + } + } + + let automata = Automaton { + state_data, + transitions, + final_states, + start_state, + }; + + #[cfg(debug_assertions)] + { + if let Err(msg) = automata.check_representation() { + panic!("Automaton::check_representation failed: {}", msg); + } + } + + automata + } +} + +/// A state in an automaton. +/// +/// Only use a `State` with the automaton that it came from! Mixing and matching +/// states between automata will result in bogus results and/or panics! 
+#[derive(Clone, Copy, Debug, PartialEq, Eq, Hash, Ord, PartialOrd)]
+pub struct State(u32);
+
+#[derive(Clone, Debug)]
+struct BuilderInner
+where
+    TAlphabet: Clone + Eq + Hash + Ord,
+    TState: Clone + Eq + Hash,
+    TOutput: Output,
+{
+    // The `i`th entry maps `FrozenStateId(i)` to its state.
+    frozen: Vec>,
+
+    // Our mutable, work-in-progress states.
+    wip: BTreeMap>,
+
+    // A counter for WIP state ids.
+    wip_state_id_counter: u32,
+
+    // A stack of our work-in-progress states.
+    unfinished: Vec,
+
+    // A map from `WipState`s that we've already frozen to their canonical,
+    // de-duplicated frozen state. This is used for hash-consing frozen states
+    // so that we share suffixes in the automata.
+    already_frozen: HashMap, FrozenStateId>,
+
+    // Did the last `InsertionBuilder` have its `finish` method invoked?
+    last_insertion_finished: bool,
+}
+
+impl BuilderInner
+where
+    TAlphabet: Clone + Eq + Hash + Ord,
+    TState: Clone + Eq + Hash,
+    TOutput: Output,
+{
+    fn new_wip_state(&mut self) -> WipStateId {
+        let id = WipStateId(self.wip_state_id_counter);
+        self.wip_state_id_counter += 1;
+        let old = self.wip.insert(
+            id,
+            WipState {
+                state_data: None,
+                transitions: BTreeMap::new(),
+                is_final: false,
+                final_output: TOutput::empty(),
+            },
+        );
+        debug_assert!(old.is_none());
+        id
+    }
+
+    fn freeze_from(&mut self, index: usize) -> BTreeMap {
+        assert!(index <= self.unfinished.len());
+
+        let mut wip_to_frozen = BTreeMap::new();
+
+        if index == self.unfinished.len() {
+            // Nothing to freeze.
+            return wip_to_frozen;
+        }
+
+        // Freeze `self.inner.unfinished[self.index + 1..]` from the end
+        // back. We're essentially hash-consing each state.
+        for _ in (index..self.unfinished.len()).rev() {
+            let wip_id = self.unfinished.pop().unwrap();
+            let mut wip = self.wip.remove(&wip_id).unwrap();
+
+            // Update transitions to any state we just froze in an earlier
+            // iteration of this loop.
+ wip.update_transitions(&wip_to_frozen); + + // Get or create the canonical frozen state for this WIP state. + // + // Note: we're not using the entry API here because this way we can + // avoid cloning `wip`, which would be more costly than the double + // lookup we're doing instead. + let frozen_id = if let Some(id) = self.already_frozen.get(&wip) { + *id + } else { + let id = FrozenStateId(self.frozen.len().try_into().unwrap()); + self.frozen.push(FrozenState { + state_data: wip.state_data.clone(), + transitions: wip + .transitions + .clone() + .into_iter() + .map(|(input, (id, output))| { + let id = match id { + WipOrFrozenStateId::Frozen(id) => id, + WipOrFrozenStateId::Wip(_) => panic!( + "when we are freezing a WIP state, it should never have \ + any transitions to another WIP state" + ), + }; + (input, (id, output)) + }) + .collect(), + is_final: wip.is_final, + final_output: wip.final_output.clone(), + }); + self.already_frozen.insert(wip, id); + id + }; + + // Record the id for this newly frozen state, so that other states + // which referenced it when it wasn't frozen can reference it as a + // frozen state. + wip_to_frozen.insert(wip_id, frozen_id); + } + + // Update references to newly frozen states from the rest of the + // unfinished stack that we didn't freeze. + for wip_id in &self.unfinished { + self.wip + .get_mut(wip_id) + .unwrap() + .update_transitions(&wip_to_frozen); + } + + wip_to_frozen + } +} + +/// A builder for a new entry in a transducer automata. +#[derive(Debug)] +pub struct InsertionBuilder<'a, TAlphabet, TState, TOutput> +where + TAlphabet: Clone + Eq + Hash + Ord, + TState: Clone + Eq + Hash, + TOutput: Output, +{ + inner: &'a mut BuilderInner, + + // The index within `inner.unfinished` where we will transition out of next. + index: usize, + + // Any leftover output from the last transition that we need to roll over + // into the next transition. 
+ output: TOutput, +} + +impl<'a, TAlphabet, TState, TOutput> InsertionBuilder<'a, TAlphabet, TState, TOutput> +where + TAlphabet: Clone + Eq + Hash + Ord, + TState: Clone + Eq + Hash, + TOutput: Output, +{ + /// Insert the next character of input for this entry, and the associated + /// output that should be emitted along with it. + /// + /// In general, you want to add all of your output on the very first `next` + /// call, and use [`Output::empty()`][crate::Output::empty] for all the + /// rest. This enables the most tail-sharing of suffixes, which leads to the + /// most compact automatas. + /// + /// However, there are times when you *cannot* emit output yet, as it + /// depends on having moved throught he automata further. For example, with + /// `peepmatic` we cannot bind something from an optimization's left-hand + /// side's pattern until after we know it exists, which only happens after + /// we've moved some distance through the automata. + pub fn next(&mut self, input: TAlphabet, output: TOutput) -> &mut Self { + assert!(self.index < self.inner.unfinished.len()); + + if output.is_empty() { + // Leave `self.output` as it is. + } else if self.output.is_empty() { + self.output = output; + } else { + self.output = TOutput::concat(&self.output, &output); + } + + let wip_id = self.inner.unfinished[self.index]; + let wip = self.inner.wip.get_mut(&wip_id).unwrap(); + + match wip.transitions.get_mut(&input) { + Some((WipOrFrozenStateId::Frozen(_), _)) => { + panic!("out of order insertion: wip->frozen edge in shared prefix") + } + + // We're still in a shared prefix with the last insertion. That + // means that the state we are transitioning to must be the next + // state in `unfinished`. All we have to do is make sure the + // transition's output is the common prefix of the this insertion + // and the last, and push any excess suffix output out to other + // transition edges. 
+ Some((WipOrFrozenStateId::Wip(next_id), out)) => { + let next_id = *next_id; + assert_eq!(next_id, self.inner.unfinished[self.index + 1]); + + // Find the common prefix of `out` and `self.output`. + let prefix = TOutput::prefix(&self.output, out); + + // Carry over this key's suffix for the next input's transition. + self.output = TOutput::difference(&self.output, &prefix); + + let rest = TOutput::difference(out, &prefix); + *out = prefix; + + let next_wip = self.inner.wip.get_mut(&next_id).unwrap(); + + // Push the leftover suffix of `out` along its other + // transitions. As a small optimization, only iterate over the + // edges if there is a non-empty value to push out along them. + if !rest.is_empty() { + if next_wip.is_final { + next_wip.final_output = TOutput::concat(&rest, &next_wip.final_output); + } + for (_input, (_state, output)) in &mut next_wip.transitions { + *output = TOutput::concat(&rest, output); + } + } + } + + // We've diverged from the shared prefix with the last + // insertion. Freeze the last insertion's unshared suffix and create + // a new WIP state for us to transition into. + None => { + self.inner.freeze_from(self.index + 1); + + let output = mem::replace(&mut self.output, TOutput::empty()); + + let new_id = self.inner.new_wip_state(); + self.inner.unfinished.push(new_id); + self.inner + .wip + .get_mut(&wip_id) + .unwrap() + .transitions + .insert(input, (WipOrFrozenStateId::Wip(new_id), output)); + } + } + + self.index += 1; + assert!(self.index < self.inner.unfinished.len()); + + self + } + + /// Finish this insertion. + /// + /// Failure to call this method before this `InsertionBuilder` is dropped + /// means that the insertion is *not* committed in the builder, and future + /// calls to [`InsertionBuilder::next`][crate::InsertionBuilder::next] will + /// panic! 
+ pub fn finish(self) { + assert!(!self.inner.unfinished.is_empty()); + assert_eq!( + self.index, + self.inner.unfinished.len() - 1, + "out of order insertion" + ); + + let wip_id = *self.inner.unfinished.last().unwrap(); + let wip = self.inner.wip.get_mut(&wip_id).unwrap(); + wip.is_final = true; + wip.final_output = self.output; + + self.inner.last_insertion_finished = true; + } + + /// Set the optional, custom data for the current state. + /// + /// If you assign different state data to two otherwise-identical states + /// within the same shared *prefix* during insertion, it is implementation + /// defined which state and custom state data is kept. + /// + /// For *suffixes*, assigning different state data to two + /// otehrwise-identical states will result in the duplication of those + /// states: they won't get de-duplicated. + pub fn set_state_data(&mut self, data: TState) -> &mut Self { + assert!(self.index < self.inner.unfinished.len()); + let id = self.inner.unfinished[self.index]; + self.inner.wip.get_mut(&id).unwrap().state_data = Some(data); + self + } + + /// Get the current state's optional, custom data, if any. + /// + /// For shared prefixes, this may return state data that was assigned to an + /// equivalent state that was added earlier in the build process. + pub fn get_state_data(&self) -> Option<&TState> { + let id = self.inner.unfinished[self.index]; + self.inner.wip.get(&id).unwrap().state_data.as_ref() + } +} + +/// The id of an immutable, frozen state. +#[derive(Clone, Copy, Debug, PartialEq, Eq, PartialOrd, Ord, Hash)] +struct FrozenStateId(u32); + +/// The id of a mutable, work-in-progress state. +#[derive(Clone, Copy, Debug, PartialEq, Eq, PartialOrd, Ord, Hash)] +struct WipStateId(u32); + +/// The id of either a frozen or a WIP state. +#[derive(Clone, Copy, Debug, PartialEq, Eq, PartialOrd, Ord, Hash)] +enum WipOrFrozenStateId { + Wip(WipStateId), + Frozen(FrozenStateId), +} + +/// A frozen, immutable state inside a `Builder`. 
+/// +/// These states are from earlier in the lexicographic sorting on input keys, +/// and have already been processed. +#[derive(Clone, Debug, Hash)] +struct FrozenState +where + TAlphabet: Clone + Eq + Hash + Ord, + TState: Clone + Eq + Hash, + TOutput: Output, +{ + state_data: Option, + transitions: BTreeMap, + is_final: bool, + final_output: TOutput, +} + +/// A mutable, work-in-progress state inside a `Builder`. +/// +/// These states only exist for the last-inserted and currently-being-inserted +/// input keys. As soon as we find the end of their shared prefix, the last +/// key's unshared suffix is frozen, and then only the currently-being-inserted +/// input key has associated WIP states. +#[derive(Clone, Debug, PartialEq, Eq, Hash)] +struct WipState +where + TAlphabet: Clone + Eq + Hash + Ord, + TState: Clone + Eq + Hash, + TOutput: Output, +{ + state_data: Option, + transitions: BTreeMap, + is_final: bool, + final_output: TOutput, +} + +impl WipState +where + TAlphabet: Clone + Eq + Hash + Ord, + TState: Clone + Eq + Hash, + TOutput: Output, +{ + /// Given that we froze some old, WIP state, update any transitions out of + /// this WIP state so they point to the new, frozen state. + fn update_transitions(&mut self, wip_to_frozen: &BTreeMap) { + for (to, _) in self.transitions.values_mut() { + if let WipOrFrozenStateId::Wip(w) = *to { + if let Some(f) = wip_to_frozen.get(&w) { + *to = WipOrFrozenStateId::Frozen(*f); + } + } + } + } +} + +/// A finite-state transducer automata. +/// +/// These are constructed via [`Builder`][crate::Builder]. +/// +/// An `Automaton` is immutable: new entries cannot be inserted and existing +/// entries cannot be removed. +/// +/// To query an `Automaton`, there are two APIs: +/// +/// 1. [`get`][crate::Automaton::get] -- a high-level method to get the associated +/// output value of a full input sequence. +/// +/// 2. [`query`][crate::Automaton::query] -- a low-level method to +/// incrementally query the automata. 
It does not require that you have the +/// full input sequence on hand all at once, only the next character. It also +/// allows you to process the output as it it built up, rather than only at +/// giving you the final, complete output value. +#[derive(Debug, Clone)] +pub struct Automaton +where + TAlphabet: Clone + Eq + Hash + Ord, + TState: Clone + Eq + Hash, + TOutput: Output, +{ + // The `i`th entry is `State(i)`'s associated custom data. + state_data: Vec>, + + // The `i`th entry contains `State(i)`'s transitions. + transitions: Vec>, + + // Keeps track of which states are final, and if so, what their final output + // is. + final_states: BTreeMap, + + // The starting state. + start_state: State, +} + +impl Automaton +where + TAlphabet: Clone + Eq + Hash + Ord, + TState: Clone + Eq + Hash, + TOutput: Output, +{ + /// Get the output value associated with the given input sequence. + /// + /// Returns `None` if the input sequence is not a member of this + /// `Automaton`'s keys. Otherwise, returns `Some(output)`. + pub fn get<'a>(&self, input: impl IntoIterator) -> Option + where + TAlphabet: 'a, + { + let mut query = self.query(); + let mut output = TOutput::empty(); + + for inp in input { + let this_out = query.next(inp)?; + output = TOutput::concat(&output, &this_out); + } + + let final_output = query.finish()?; + Some(TOutput::concat(&output, final_output)) + } + + /// Create a low-level query. + /// + /// This allows you to incrementally query this `Automaton`, without + /// providing the full input sequence ahead of time, and also incrementally + /// build up the output. + /// + /// See [`Query`][crate::Query] for details. + pub fn query(&self) -> Query { + Query { + automata: self, + current_state: self.start_state, + } + } + + /// Check that the internal representaton is OK. 
+ /// + /// Checks that we don't have any transitions to unknown states, that there + /// aren't any cycles, that ever path through the automata eventually ends + /// in a final state, etc. + /// + /// This property is `debug_assert!`ed in `Builder::finish`, and checked + /// when deserializing an `Automaton`. + /// + /// Returns `true` if the representation is okay, `false` otherwise. + fn check_representation(&self) -> Result<(), &'static str> { + macro_rules! bail_if { + ($condition:expr, $msg:expr) => { + if $condition { + return Err($msg); + } + }; + } + + bail_if!( + self.state_data.len() != self.transitions.len(), + "different number of states and transition sets" + ); + bail_if!( + self.final_states.is_empty(), + "the set of final states is empty" + ); + + bail_if!( + (self.start_state.0 as usize) >= self.transitions.len(), + "the start state is not a valid state" + ); + + for (f, _out) in &self.final_states { + bail_if!( + (f.0 as usize) >= self.transitions.len(), + "one of the final states is not a valid state" + ); + } + + // Walk the state transition graph and ensure that + // + // 1. there are no cycles, and + // + // 2. every path ends in a final state. + let mut on_stack = HashSet::new(); + let mut stack = vec![ + (Traversal::Stop, self.start_state), + (Traversal::Start, self.start_state), + ]; + loop { + match stack.pop() { + None => break, + Some((Traversal::Start, state)) => { + let is_new = on_stack.insert(state); + debug_assert!(is_new); + + let mut has_any_transitions = false; + for (_input, (to_state, _output)) in &self.transitions[state.0 as usize] { + has_any_transitions = true; + + // A transition to a state that we walked through to get + // here means that there is a cycle. 
+ bail_if!( + on_stack.contains(to_state), + "there is a cycle in the state transition graph" + ); + + stack.extend( + iter::once((Traversal::Stop, *to_state)) + .chain(iter::once((Traversal::Start, *to_state))), + ); + } + + if !has_any_transitions { + // All paths must end in a final state. + bail_if!( + !self.final_states.contains_key(&state), + "a path through the state transition graph does not end in a final state" + ); + } + } + Some((Traversal::Stop, state)) => { + debug_assert!(on_stack.contains(&state)); + on_stack.remove(&state); + } + } + } + + return Ok(()); + + enum Traversal { + Start, + Stop, + } + } +} + +/// A low-level query of an `Automaton`. +/// +/// This allows you to incrementally query an `Automaton`, without providing the +/// full input sequence ahead of time, and also to incrementally build up the +/// output. +/// +/// The typical usage pattern is: +/// +/// * First, a series of [`next`][crate::Query::next] calls that each provide +/// one character of the input sequence. +/// +/// If this query is still on a path towards a known entry of the +/// automata, then `Some` is returned with the partial output of the +/// transition that was just taken. Otherwise, `None` is returned, signifying +/// that the input string has been rejected by the automata. +/// +/// You may also inspect the current state's associated custom data, if any, +/// in between `next` calls via the +/// [`current_state_data`][crate::Query::current_state_data] method. +/// +/// * When the input sequence is exhausted, call +/// [`is_in_final_state`][crate::Query::is_in_final_state] to determine if this +/// query is in a final state of the automata. If it is not, then the +/// input string has been rejected by the automata. +/// +/// * Given that the input sequence is exhausted, you may call +/// [`finish`][crate::Query::finish] to get the final bit of partial output. 
+#[derive(Debug, Clone)] +pub struct Query<'a, TAlphabet, TState, TOutput> +where + TAlphabet: Clone + Eq + Hash + Ord, + TState: Clone + Eq + Hash, + TOutput: Output, +{ + automata: &'a Automaton, + current_state: State, +} + +impl<'a, TAlphabet, TState, TOutput> Query<'a, TAlphabet, TState, TOutput> +where + TAlphabet: Clone + Eq + Hash + Ord, + TState: Clone + Eq + Hash, + TOutput: Output, +{ + /// Get the current state in the automaton that this query is at. + pub fn current_state(&self) -> State { + self.current_state + } + + /// Move this query to the given state in the automaton. + /// + /// This can be used to implement backtracking, if you can also reset your + /// output to the way it was when you previously visited the given `State`. + /// + /// Only use a `State` that came from this query's automaton! Mixing and + /// matching states between automata will result in bogus results and/or + /// panics! + pub fn go_to_state(&mut self, state: State) { + assert!((state.0 as usize) < self.automata.transitions.len()); + debug_assert_eq!( + self.automata.state_data.len(), + self.automata.transitions.len() + ); + self.current_state = state; + } + + /// Does the query's current state have a transition on the given input? + /// + /// Regardless whether a transition on the given input exists for the + /// current state or not, the query remains in the current state. + pub fn has_transition_on(&self, input: &TAlphabet) -> bool { + let State(i) = self.current_state; + self.automata.transitions[i as usize].contains_key(input) + } + + /// Transition to the next state given the next input character, and return + /// the partial output for that transition. + /// + /// If `None` is returned, then the input sequence has been rejected by the + /// automata, and this query remains in its current state. 
+ #[inline] + pub fn next(&mut self, input: &TAlphabet) -> Option<&'a TOutput> { + let State(i) = self.current_state; + match self.automata.transitions[i as usize].get(input) { + None => None, + Some((next_state, output)) => { + self.current_state = *next_state; + Some(output) + } + } + } + + /// Get the current state's associated custom data, if any. + /// + /// See also + /// [`InsertionBuilder::set_state_data`][crate::InsertionBuilder::set_state_data]. + #[inline] + pub fn current_state_data(&self) -> Option<&'a TState> { + let State(i) = self.current_state; + self.automata.state_data[i as usize].as_ref() + } + + /// Is this query currently in a final state? + #[inline] + pub fn is_in_final_state(&self) -> bool { + self.automata.final_states.contains_key(&self.current_state) + } + + /// Given that the input sequence is exhausted, get the final bit of partial + /// output. + /// + /// Returns `None` if this query is not currently in a final state, meaning + /// that the automata has rejected this input sequence. You can check + /// whether that is the case or not with the + /// [`is_in_final_state`][crate::Query::is_in_final_state] method. 
+ pub fn finish(self) -> Option<&'a TOutput> { + self.automata.final_states.get(&self.current_state) + } +} + +#[cfg(test)] +mod tests { + #[test] + fn it_works() { + assert_eq!(2 + 2, 4); + } +} diff --git a/cranelift/peepmatic/crates/automata/src/output_impls.rs b/cranelift/peepmatic/crates/automata/src/output_impls.rs new file mode 100644 index 0000000000..308c466d5b --- /dev/null +++ b/cranelift/peepmatic/crates/automata/src/output_impls.rs @@ -0,0 +1,130 @@ +use crate::Output; +use std::cmp; +use std::hash::Hash; + +impl Output for u64 { + fn empty() -> Self { + 0 + } + + fn prefix(a: &Self, b: &Self) -> Self { + cmp::min(*a, *b) + } + + fn difference(a: &Self, b: &Self) -> Self { + a - b + } + + fn concat(a: &Self, b: &Self) -> Self { + a + b + } +} + +impl Output for Vec +where + T: Clone + Eq + Hash, +{ + fn empty() -> Self { + vec![] + } + + fn is_empty(&self) -> bool { + self.is_empty() + } + + fn prefix(a: &Self, b: &Self) -> Self { + a.iter() + .cloned() + .zip(b.iter().cloned()) + .take_while(|(a, b)| a == b) + .map(|(a, _)| a) + .collect() + } + + fn difference(a: &Self, b: &Self) -> Self { + let i = a + .iter() + .zip(b.iter()) + .position(|(a, b)| a != b) + .unwrap_or(cmp::min(a.len(), b.len())); + a[i..].to_vec() + } + + fn concat(a: &Self, b: &Self) -> Self { + let mut c = a.clone(); + c.extend(b.iter().cloned()); + c + } +} + +impl Output for Box<[T]> +where + T: Clone + Eq + Hash, +{ + fn empty() -> Self { + vec![].into_boxed_slice() + } + + fn is_empty(&self) -> bool { + self.len() == 0 + } + + fn prefix(a: &Self, b: &Self) -> Self { + a.iter() + .cloned() + .zip(b.iter().cloned()) + .take_while(|(a, b)| a == b) + .map(|(a, _)| a) + .collect() + } + + fn difference(a: &Self, b: &Self) -> Self { + let i = a + .iter() + .zip(b.iter()) + .position(|(a, b)| a != b) + .unwrap_or(cmp::min(a.len(), b.len())); + a[i..].to_vec().into_boxed_slice() + } + + fn concat(a: &Self, b: &Self) -> Self { + let mut c = a.clone().to_vec(); + 
c.extend(b.iter().cloned()); + c.into_boxed_slice() + } +} + +#[cfg(test)] +mod tests { + use crate::Output; + use std::fmt::Debug; + + // Assert the laws that `Output` requires for correctness. `a` and `b` + // should be two different instances of an `Output` type. + fn assert_laws(a: O, b: O) + where + O: Clone + Debug + Output, + { + // Law 1 + assert_eq!(O::concat(&O::empty(), &a), a.clone()); + + // Law 2 + assert_eq!(O::prefix(&b, &a), O::prefix(&a, &b)); + + // Law 3 + assert_eq!(O::prefix(&O::empty(), &a), O::empty()); + + // Law 4 + assert_eq!(O::difference(&O::concat(&a, &b), &a), b); + } + + #[test] + fn impl_for_u64() { + assert_laws(3, 5); + } + + #[test] + fn impl_for_vec() { + assert_laws(vec![0, 1, 2, 3], vec![0, 2, 4, 6]); + } +} diff --git a/cranelift/peepmatic/crates/automata/src/serde_impls.rs b/cranelift/peepmatic/crates/automata/src/serde_impls.rs new file mode 100644 index 0000000000..8a5d79214f --- /dev/null +++ b/cranelift/peepmatic/crates/automata/src/serde_impls.rs @@ -0,0 +1,220 @@ +//! `serde::Serialize` and `serde::Deserialize` implementations for `Automaton`. +//! +//! Rather than prefix each serialized field with which field it is, we always +//! serialize fields in alphabetical order. Make sure to maintain this if you +//! add or remove fields! +//! +//! Each time you add/remove a field, or change serialization in any other way, +//! make sure to bump `SERIALIZATION_VERSION`. 
+ +use crate::{Automaton, Output, State}; +use serde::{ + de::{self, Deserializer, SeqAccess, Visitor}, + ser::SerializeTupleStruct, + Deserialize, Serialize, Serializer, +}; +use std::collections::BTreeMap; +use std::fmt; +use std::hash::Hash; +use std::marker::PhantomData; + +const SERIALIZATION_VERSION: u32 = 1; + +impl Serialize for State { + fn serialize(&self, serializer: S) -> Result + where + S: Serializer, + { + serializer.serialize_u32(self.0) + } +} + +impl<'de> Deserialize<'de> for State { + fn deserialize(deserializer: D) -> Result + where + D: Deserializer<'de>, + { + Ok(State(deserializer.deserialize_u32(U32Visitor)?)) + } +} + +struct U32Visitor; + +impl<'de> Visitor<'de> for U32Visitor { + type Value = u32; + + fn expecting(&self, f: &mut fmt::Formatter) -> fmt::Result { + f.write_str("an integer between `0` and `2^32 - 1`") + } + + fn visit_u8(self, value: u8) -> Result + where + E: de::Error, + { + Ok(u32::from(value)) + } + + fn visit_u32(self, value: u32) -> Result + where + E: de::Error, + { + Ok(value) + } + + fn visit_u64(self, value: u64) -> Result + where + E: de::Error, + { + use std::u32; + if value <= u64::from(u32::MAX) { + Ok(value as u32) + } else { + Err(E::custom(format!("u32 out of range: {}", value))) + } + } +} + +impl Serialize for Automaton +where + TAlphabet: Serialize + Clone + Eq + Hash + Ord, + TState: Serialize + Clone + Eq + Hash, + TOutput: Serialize + Output, +{ + fn serialize(&self, serializer: S) -> Result + where + S: Serializer, + { + let Automaton { + final_states, + start_state, + state_data, + transitions, + } = self; + + let mut s = serializer.serialize_tuple_struct("Automaton", 5)?; + s.serialize_field(&SERIALIZATION_VERSION)?; + s.serialize_field(final_states)?; + s.serialize_field(start_state)?; + s.serialize_field(state_data)?; + s.serialize_field(transitions)?; + s.end() + } +} + +impl<'de, TAlphabet, TState, TOutput> Deserialize<'de> for Automaton +where + TAlphabet: 'de + Deserialize<'de> + Clone + Eq + 
Hash + Ord, + TState: 'de + Deserialize<'de> + Clone + Eq + Hash, + TOutput: 'de + Deserialize<'de> + Output, +{ + fn deserialize(deserializer: D) -> Result + where + D: Deserializer<'de>, + { + deserializer.deserialize_tuple_struct( + "Automaton", + 5, + AutomatonVisitor { + phantom: PhantomData, + }, + ) + } +} + +struct AutomatonVisitor<'de, TAlphabet, TState, TOutput> +where + TAlphabet: 'de + Deserialize<'de> + Clone + Eq + Hash + Ord, + TState: 'de + Deserialize<'de> + Clone + Eq + Hash, + TOutput: 'de + Deserialize<'de> + Output, +{ + phantom: PhantomData<&'de (TAlphabet, TState, TOutput)>, +} + +impl<'de, TAlphabet, TState, TOutput> Visitor<'de> + for AutomatonVisitor<'de, TAlphabet, TState, TOutput> +where + TAlphabet: 'de + Deserialize<'de> + Clone + Eq + Hash + Ord, + TState: 'de + Deserialize<'de> + Clone + Eq + Hash, + TOutput: 'de + Deserialize<'de> + Output, +{ + type Value = Automaton; + + fn expecting(&self, f: &mut fmt::Formatter) -> fmt::Result { + f.write_str("Automaton") + } + + fn visit_seq(self, mut seq: A) -> Result + where + A: SeqAccess<'de>, + { + match seq.next_element::()? { + Some(v) if v == SERIALIZATION_VERSION => {} + Some(v) => { + return Err(de::Error::invalid_value( + de::Unexpected::Unsigned(v as u64), + &self, + )); + } + None => { + return Err(de::Error::invalid_length( + 0, + &"Automaton expects 5 elements", + )) + } + } + + let final_states = match seq.next_element::>()? { + Some(x) => x, + None => { + return Err(de::Error::invalid_length( + 1, + &"Automaton expects 5 elements", + )) + } + }; + + let start_state = match seq.next_element::()? { + Some(x) => x, + None => { + return Err(de::Error::invalid_length( + 2, + &"Automaton expects 5 elements", + )) + } + }; + + let state_data = match seq.next_element::>>()? { + Some(x) => x, + None => { + return Err(de::Error::invalid_length( + 3, + &"Automaton expects 5 elements", + )) + } + }; + + let transitions = match seq.next_element::>>()? 
{ + Some(x) => x, + None => { + return Err(de::Error::invalid_length( + 4, + &"Automaton expects 5 elements", + )) + } + }; + + let automata = Automaton { + final_states, + start_state, + state_data, + transitions, + }; + + // Ensure that the deserialized automata is well-formed. + automata + .check_representation() + .map_err(|msg| de::Error::custom(msg))?; + + Ok(automata) + } +} diff --git a/cranelift/peepmatic/crates/fuzzing/Cargo.toml b/cranelift/peepmatic/crates/fuzzing/Cargo.toml new file mode 100644 index 0000000000..a3ccb91791 --- /dev/null +++ b/cranelift/peepmatic/crates/fuzzing/Cargo.toml @@ -0,0 +1,22 @@ +[package] +name = "peepmatic-fuzzing" +version = "0.1.0" +authors = ["Nick Fitzgerald "] +edition = "2018" +publish = false + +# See more keys and their definitions at https://doc.rust-lang.org/cargo/reference/manifest.html + +[dependencies] +arbitrary = { version = "0.4.1", features = ["derive"] } +bincode = "1.2.1" +env_logger = "0.7.1" +fst = "0.4.1" +log = "0.4.8" +peepmatic = { path = "../.." } +peepmatic-automata = { path = "../automata", features = ["serde"] } +peepmatic-runtime = { path = "../runtime", features = ["construct"] } +peepmatic-test = { path = "../test" } +rand = { version = "0.7.3", features = ["small_rng"] } +serde = "1.0.106" +wast = "15.0.0" diff --git a/cranelift/peepmatic/crates/fuzzing/src/automata.rs b/cranelift/peepmatic/crates/fuzzing/src/automata.rs new file mode 100644 index 0000000000..c399da037f --- /dev/null +++ b/cranelift/peepmatic/crates/fuzzing/src/automata.rs @@ -0,0 +1,187 @@ +//! Helpers for fuzzing the `peepmatic-automata` crate. 
+ +use peepmatic_automata::{Automaton, Builder, Output}; +use serde::{Deserialize, Serialize}; +use std::collections::{HashMap, HashSet}; +use std::hash::Hash; + +fn serde_roundtrip( + automata: Automaton, +) -> Automaton +where + TAlphabet: Serialize + for<'de> Deserialize<'de> + Clone + Eq + Hash + Ord, + TState: Serialize + for<'de> Deserialize<'de> + Clone + Eq + Hash, + TOutput: Serialize + for<'de> Deserialize<'de> + Output, +{ + let encoded: Vec = bincode::serialize(&automata).expect("should serialize OK"); + bincode::deserialize(&encoded).expect("should deserialize OK") +} + +/// Construct an automaton from the the given input-output pairs, and assert +/// that: +/// +/// * Putting in each of the input strings should result in the expected output +/// string. +/// +/// * Putting in an input string that is not one of the given inputs from our +/// input-output pairs should never yield an output value. +pub fn simple_automata(input_output_pairs: Vec)>>) { + let _ = env_logger::try_init(); + + let full_input = |pair: &[(u8, Vec)]| { + let mut full_input = vec![]; + for (input, _) in pair { + full_input.push(*input); + } + full_input + }; + + let mut inputs = HashSet::new(); + + let mut input_output_pairs: Vec<_> = input_output_pairs + .into_iter() + .filter(|pair| { + !pair.is_empty() && { + // Make sure we don't have duplicate inputs. + let is_new = inputs.insert(full_input(pair)); + is_new + } + }) + .collect(); + + input_output_pairs.sort_by(|a, b| full_input(a).cmp(&full_input(b))); + + if input_output_pairs.is_empty() { + return; + } + + // A map from one of our concatenated input strings to its concatenated + // output. 
+ let mut expected = HashMap::with_capacity(input_output_pairs.len()); + + let mut builder = Builder::>::new(); + for pair in &input_output_pairs { + let mut full_input = vec![]; + let mut full_output = vec![]; + + let mut ins = builder.insert(); + for (input, output) in pair.iter().cloned() { + full_input.push(input); + full_output.extend(output.iter().copied()); + + ins.next(input, output); + } + + let old = expected.insert(full_input, full_output); + assert!(old.is_none()); + + ins.finish(); + } + + let automata = builder.finish(); + let automata = serde_roundtrip(automata); + + // Assert that each of our input strings yields the expected output. + for (input, expected_output) in &expected { + log::debug!("Testing input: {:?}", input); + let actual_output = automata.get(input); + assert!(actual_output.is_some()); + assert_eq!(actual_output.as_ref().unwrap(), expected_output); + } + + // Test that mutations of our input strings (that aren't themselves other + // input strings!) do not yeild any output. + for input in expected.keys() { + for i in 0..input.len() { + let mut mutated = input.clone(); + mutated[i] = mutated[i].wrapping_add(1); + log::debug!("Testing mutated input: {:?}", mutated); + if !expected.contains_key(&mutated) { + assert!(automata.get(&mutated).is_none()); + } + } + } +} + +/// Do differential testing against the `fst` crate, which is another +/// implementation of the algorithm we use for finite-state transducer +/// construction in `peepmatic-automata`. 
+pub fn fst_differential(map: HashMap, u64>) { + let _ = env_logger::try_init(); + + let mut inputs: Vec<_> = map.keys().filter(|i| !i.is_empty()).cloned().collect(); + inputs.sort(); + inputs.dedup(); + if inputs.is_empty() { + return; + } + + let mut fst = fst::MapBuilder::memory(); + let mut builder = Builder::::new(); + + for inp in &inputs { + fst.insert(inp, map[inp]).unwrap(); + + let mut ins = builder.insert(); + for (i, ch) in inp.iter().enumerate() { + ins.next(*ch, if i == 0 { map[inp] } else { 0 }); + } + ins.finish(); + } + + let fst = fst.into_map(); + let automata = builder.finish(); + let automata = serde_roundtrip(automata); + + for inp in inputs { + // Check we have the same result as `fst` for inputs we know are in the + // automata. + log::debug!("Testing input {:?}", inp); + let expected = fst.get(&inp).expect("`fst` should have entry for `inp`"); + let actual = automata + .get(&inp) + .expect("automata should have entry for `inp`"); + assert_eq!(expected, actual); + + // Check that we have the same result as `fst` for inputs that may or + // may not be in the automata. 
+ for i in 0..inp.len() { + let mut mutated = inp.clone(); + mutated[i] = mutated[i].wrapping_add(1); + log::debug!("Testing mutated input {:?}", mutated); + let expected = fst.get(&mutated); + let actual = automata.get(&mutated); + assert_eq!(expected, actual); + } + } +} + +#[cfg(test)] +mod tests { + use super::*; + + #[test] + fn check_simple_automata() { + crate::check(simple_automata); + } + + #[test] + fn check_fst_differential() { + crate::check(fst_differential); + } + + #[test] + fn regression_test_0() { + simple_automata(vec![vec![(0, vec![0]), (0, vec![1])], vec![(0, vec![2])]]); + } + + #[test] + fn regression_test_1() { + fst_differential(vec![(vec![1, 3], 5), (vec![1, 2], 4)].into_iter().collect()); + } + + #[test] + fn regression_test_2() { + simple_automata(vec![vec![(0, vec![11]), (0, vec![])], vec![(0, vec![11])]]); + } +} diff --git a/cranelift/peepmatic/crates/fuzzing/src/compile.rs b/cranelift/peepmatic/crates/fuzzing/src/compile.rs new file mode 100644 index 0000000000..8df8a685c5 --- /dev/null +++ b/cranelift/peepmatic/crates/fuzzing/src/compile.rs @@ -0,0 +1,71 @@ +//! Fuzz testing utilities related to AST pattern matching. + +use peepmatic_runtime::PeepholeOptimizations; +use std::path::Path; +use std::str; + +/// Attempt to interpret the given bytes as UTF-8 and then compile them as if +/// they were source text of our DSL. +pub fn compile(data: &[u8]) { + let source = match str::from_utf8(data) { + Err(_) => return, + Ok(s) => s, + }; + + let opt = match peepmatic::compile_str(source, Path::new("fuzz")) { + Err(_) => return, + Ok(o) => o, + }; + + // Should be able to serialize and deserialize the peephole optimizer. + let opt_bytes = bincode::serialize(&opt).expect("should serialize peephole optimizations OK"); + let _: PeepholeOptimizations = + bincode::deserialize(&opt_bytes).expect("should deserialize peephole optimizations OK"); + + // Compiling the same source text again should be deterministic. 
+ let opt2 = peepmatic::compile_str(source, Path::new("fuzz")) + .expect("should be able to compile source text again, if it compiled OK the first time"); + let opt2_bytes = + bincode::serialize(&opt2).expect("should serialize second peephole optimizations OK"); + assert_eq!(opt_bytes, opt2_bytes); +} + +#[cfg(test)] +mod tests { + use super::*; + + #[test] + fn check_compile() { + crate::check(|s: String| compile(s.as_bytes())); + } + + #[test] + fn regression_0() { + compile( + b" + (=> (bor (bor $x $y) $y) $x) + (=> (bor (bor $x $z) $y) $x) + ", + ); + } + + #[test] + fn regression_1() { + compile( + b" + (=> (bor (bor $x $y) 0) $x) + (=> (bor $x 0) $x) + (=> (bor $y $x) $x) + ", + ); + } + + #[test] + fn regression_2() { + compile( + b" + (=> (sshr $x 11111111110) $x) + ", + ); + } +} diff --git a/cranelift/peepmatic/crates/fuzzing/src/interp.rs b/cranelift/peepmatic/crates/fuzzing/src/interp.rs new file mode 100644 index 0000000000..0ebdeebe28 --- /dev/null +++ b/cranelift/peepmatic/crates/fuzzing/src/interp.rs @@ -0,0 +1,374 @@ +//! Interpreting compiled peephole optimizations against test instruction sequences. + +use peepmatic::{ + Constraint, Dfs, DynAstRef, Optimizations, Pattern, Span, TraversalEvent, ValueLiteral, + Variable, +}; +use peepmatic_runtime::{ + cc::ConditionCode, + operator::TypingContext as TypingContextTrait, + part::Constant, + r#type::BitWidth, + r#type::{Kind, Type}, +}; +use peepmatic_test::{Program, TestIsa}; +use std::collections::{BTreeMap, HashMap}; +use std::path::Path; +use std::str; + +/// Compile the given source text, and if it is a valid set of optimizations, +/// then interpret the optimizations against test instruction sequences created +/// to reflect the optimizations. 
+pub fn interp(data: &[u8]) { + let _ = env_logger::try_init(); + + let source = match str::from_utf8(data) { + Err(_) => return, + Ok(s) => s, + }; + + let peep_opts = match peepmatic::compile_str(source, Path::new("fuzz")) { + Err(_) => return, + Ok(o) => o, + }; + let mut optimizer = peep_opts.optimizer(TestIsa { + native_word_size_in_bits: 32, + }); + + // Okay, we know it compiles and verifies alright, so (re)parse the AST. + let buf = wast::parser::ParseBuffer::new(&source).unwrap(); + let ast = wast::parser::parse::(&buf).unwrap(); + + // And we need access to the assigned types, so re-verify it as well. + peepmatic::verify(&ast).unwrap(); + + // Walk over each optimization and create an instruction sequence that + // matches the optimization. + let mut program = Program::default(); + for opt in &ast.optimizations { + // The instruction sequence we generate must match an optimization (not + // necessarily *this* optimization, if there is another that is more + // specific but also matches) unless there is an `bit-width` + // precondition or an implicit `bit-width` precondition via a type + // ascription. When those things exist, we might have constructed + // instructions with the wrong bit widths to match. + let mut allow_no_match = false; + + // The last instruction we generated. After we've generated the full + // instruction sequence, this will be its root. + let mut last_inst = None; + + // Remember the instructions associated with variables and constants, so + // that when they appear multiple times, we reuse the same instruction. + let mut id_to_inst = HashMap::new(); + + // Map from a pattern's span to the instruction we generated for + // it. This allows parent operations to get the instructions for their + // children. + let mut span_to_inst = BTreeMap::new(); + + for (te, lhs) in Dfs::new(&opt.lhs) { + // NB: We use a post-order traversal because we want arguments to be + // generated before they are used. 
+ if te != TraversalEvent::Exit { + continue; + } + + match lhs { + DynAstRef::Precondition(p) => { + allow_no_match |= p.constraint == Constraint::BitWidth; + } + + DynAstRef::Pattern(Pattern::Operation(op)) => { + allow_no_match |= op.r#type.get().is_some(); + + let num_imms = op.operator.immediates_arity() as usize; + + // Generate this operation's immediates. + let mut imm_tys = vec![]; + op.operator + .immediate_types(&mut TypingContext, op.span(), &mut imm_tys); + let imms: Vec<_> = op + .operands + .iter() + .take(num_imms) + .zip(imm_tys) + .map(|(pat, ty)| match pat { + Pattern::ValueLiteral(ValueLiteral::Integer(i)) => { + Constant::Int(i.value as _, BitWidth::ThirtyTwo).into() + } + Pattern::ValueLiteral(ValueLiteral::Boolean(b)) => { + Constant::Bool(b.value, BitWidth::One).into() + } + Pattern::ValueLiteral(ValueLiteral::ConditionCode(cc)) => cc.cc.into(), + Pattern::Constant(_) | Pattern::Variable(_) => match ty { + TypeOrConditionCode::ConditionCode => ConditionCode::Eq.into(), + TypeOrConditionCode::Type(ty) => match ty.kind { + Kind::Int => Constant::Int(1, ty.bit_width).into(), + Kind::Bool => Constant::Bool(false, ty.bit_width).into(), + Kind::Void | Kind::CpuFlags => { + unreachable!("void and cpu flags cannot be immediates") + } + }, + }, + Pattern::Operation(_) => { + unreachable!("operations not allowed as immediates") + } + }) + .collect(); + + // Generate (or collect already-generated) instructions for + // this operation's arguments. 
+ let mut arg_tys = vec![]; + op.operator + .param_types(&mut TypingContext, op.span(), &mut arg_tys); + let args: Vec<_> = op + .operands + .iter() + .skip(num_imms) + .zip(arg_tys) + .map(|(pat, ty)| match pat { + Pattern::Operation(op) => span_to_inst[&op.span()], + Pattern::ValueLiteral(ValueLiteral::Integer(i)) => program.r#const( + Constant::Int(i.value as _, BitWidth::ThirtyTwo), + BitWidth::ThirtyTwo, + ), + Pattern::ValueLiteral(ValueLiteral::Boolean(b)) => program.r#const( + Constant::Bool(b.value, BitWidth::One), + BitWidth::ThirtyTwo, + ), + Pattern::ValueLiteral(ValueLiteral::ConditionCode(_)) => { + unreachable!("condition codes cannot be arguments") + } + Pattern::Constant(peepmatic::Constant { id, .. }) + | Pattern::Variable(Variable { id, .. }) => match ty { + TypeOrConditionCode::Type(ty) => { + *id_to_inst.entry(id).or_insert_with(|| match ty.kind { + Kind::Int => program.r#const( + Constant::Int(1, ty.bit_width), + BitWidth::ThirtyTwo, + ), + Kind::Bool => program.r#const( + Constant::Bool(false, ty.bit_width), + BitWidth::ThirtyTwo, + ), + Kind::CpuFlags => { + unreachable!("cpu flags cannot be an argument") + } + Kind::Void => unreachable!("void cannot be an argument"), + }) + } + TypeOrConditionCode::ConditionCode => { + unreachable!("condition codes cannot be arguments") + } + }, + }) + .collect(); + + let ty = match op.operator.result_type(&mut TypingContext, op.span()) { + TypeOrConditionCode::Type(ty) => ty, + TypeOrConditionCode::ConditionCode => { + unreachable!("condition codes cannot be operation results") + } + }; + let inst = program.new_instruction(op.operator, ty, imms, args); + last_inst = Some(inst); + let old_inst = span_to_inst.insert(op.span(), inst); + assert!(old_inst.is_none()); + } + _ => continue, + } + } + + // Run the optimizer on our newly generated instruction sequence. 
+ if let Some(inst) = last_inst { + let replacement = optimizer.apply_one(&mut program, inst); + assert!( + replacement.is_some() || allow_no_match, + "an optimization should match the generated instruction sequence" + ); + } + } + + // Finally, just try and run the optimizer on every instruction we + // generated, just to potentially shake out some more bugs. + let instructions: Vec<_> = program.instructions().map(|(k, _)| k).collect(); + for inst in instructions { + let _ = optimizer.apply_one(&mut program, inst); + } +} + +enum TypeOrConditionCode { + Type(Type), + ConditionCode, +} + +struct TypingContext; + +impl<'a> TypingContextTrait<'a> for TypingContext { + type TypeVariable = TypeOrConditionCode; + + fn cc(&mut self, _: wast::Span) -> Self::TypeVariable { + TypeOrConditionCode::ConditionCode + } + + fn bNN(&mut self, _: wast::Span) -> Self::TypeVariable { + TypeOrConditionCode::Type(Type::b1()) + } + + fn iNN(&mut self, _: wast::Span) -> Self::TypeVariable { + TypeOrConditionCode::Type(Type::i32()) + } + + fn iMM(&mut self, _: wast::Span) -> Self::TypeVariable { + TypeOrConditionCode::Type(Type::i32()) + } + + fn cpu_flags(&mut self, _: wast::Span) -> Self::TypeVariable { + TypeOrConditionCode::Type(Type::cpu_flags()) + } + + fn b1(&mut self, _: wast::Span) -> Self::TypeVariable { + TypeOrConditionCode::Type(Type::b1()) + } + + fn void(&mut self, _: wast::Span) -> Self::TypeVariable { + TypeOrConditionCode::Type(Type::void()) + } + + fn bool_or_int(&mut self, _: wast::Span) -> Self::TypeVariable { + TypeOrConditionCode::Type(Type::b1()) + } + + fn any_t(&mut self, _: wast::Span) -> Self::TypeVariable { + TypeOrConditionCode::Type(Type::i32()) + } +} + +#[cfg(test)] +mod tests { + use super::*; + + #[test] + fn check_interp() { + crate::check(|s: Vec| interp(String::from_utf8_lossy(&s).as_bytes())); + } + + #[test] + fn regression_0() { + interp(b"(=> (imul $x $x) $x)"); + } + + #[test] + fn regression_1() { + interp(b"(=> (when (imul $x $C) 
(is-power-of-two $C)) $x)"); + } + + #[test] + fn regression_2() { + interp( + b" + (=> (bor (bor $x $y) $x) (bor $x $y)) + (=> (bor (bor $x $C) 5) $x) + ", + ); + } + + #[test] + fn regression_3() { + interp( + b" + (=> (bor $y (bor $x 9)) $x) + (=> (bor (bor $x $y) $x) $x) + ", + ); + } + + #[test] + fn regression_4() { + interp( + b" + (=> (bor $C 33) 0) + (=> (bor $x 22) 1) + (=> (bor $x 11) 2) + ", + ); + } + + #[test] + fn regression_5() { + interp( + b" + (=> (bor $y (bor $x $y)) (bor $x $y)) + (=> (bor (bor $x $y) $z) $x) + (=> (bor (bor $x $y) $y) $x) + ", + ); + } + + #[test] + fn regression_6() { + interp(b"(=> (imul $x $f) of)"); + } + + #[test] + fn regression_7() { + interp( + b" + (=> (when (sdiv $x $C) + (fits-in-native-word $y)) + (sdiv $C $x)) + ", + ); + } + + #[test] + fn regression_8() { + interp( + b" + (=> (adjust_sp_down $C) (adjust_sp_down_imm $C)) + ", + ); + } + + #[test] + fn regression_9() { + interp( + b" + (=> (when $x) $x) + (=> (trapnz $x) (trapnz $x)) + ", + ); + } + + #[test] + fn regression_10() { + interp(b"(=> (sshr{i1} $x 0) $x)"); + } + + #[test] + fn regression_11() { + interp( + b" + (=> (when (ushr_imm $x (ishl 4 3)) + (bit-width $x 64)) + (sextend{i64} (ireduce{i32} $x))) + ", + ); + } + + #[test] + fn regression_12() { + interp(b"(=> (band $C1 (band_imm $C1 1)) 1)"); + } + + #[test] + fn regression_13() { + interp(b"(=> (brz (icmp eq 0 $x)) (brz (ireduce{i32} $x)))"); + } + + #[test] + fn regression_14() { + interp(b"(=> (brz (icmp $E 0 $x)) (brz $x))"); + } +} diff --git a/cranelift/peepmatic/crates/fuzzing/src/lib.rs b/cranelift/peepmatic/crates/fuzzing/src/lib.rs new file mode 100644 index 0000000000..82661d8b7d --- /dev/null +++ b/cranelift/peepmatic/crates/fuzzing/src/lib.rs @@ -0,0 +1,119 @@ +//! Utilities for fuzzing. +//! +//! The actual fuzz targets are defined in `peepmatic/fuzz/*`. This crate just +//! has oracles and generators for fuzzing. 
+ +#![deny(missing_debug_implementations)] +#![deny(missing_docs)] + +use arbitrary::{Arbitrary, Unstructured}; +use rand::prelude::*; +use std::fmt::Debug; +use std::panic; +use std::time; + +pub mod automata; +pub mod compile; +pub mod interp; +pub mod parser; + +/// A quickcheck-style runner for fuzz targets. +/// +/// This is *not* intended to replace a long-running, coverage-guided fuzzing +/// engine like libFuzzer! This is only for defining quick, purely random tests +/// for use with `cargo test` and CI. +pub fn check(mut f: impl FnMut(A)) +where + A: Clone + Debug + Arbitrary, +{ + let seed = rand::thread_rng().gen(); + let mut rng = rand::rngs::SmallRng::seed_from_u64(seed); + + const INITIAL_LENGTH: usize = 16; + const MAX_LENGTH: usize = 4096; + + let mut buf: Vec = (0..INITIAL_LENGTH).map(|_| rng.gen()).collect(); + let mut num_checked = 0; + + let time_budget = time::Duration::from_secs(2); + let then = time::Instant::now(); + + let (failing_input, panic_info) = loop { + if num_checked > 0 && time::Instant::now().duration_since(then) > time_budget { + eprintln!("Checked {} random inputs.", num_checked); + return; + } + + match ::arbitrary_take_rest(Unstructured::new(&buf)) { + Ok(input) => { + num_checked += 1; + eprintln!("Checking input: {:#?}", input); + if let Err(p) = panic::catch_unwind(panic::AssertUnwindSafe(|| f(input.clone()))) { + break (input, p); + } + } + Err(e @ arbitrary::Error::NotEnoughData) => { + eprintln!("warning: {}", e); + if *buf.last().unwrap() == 0 { + if buf.len() < MAX_LENGTH { + let new_size = std::cmp::min(buf.len() * 2, MAX_LENGTH); + eprintln!("Growing buffer size to {}", new_size); + let delta = new_size - buf.len(); + buf.reserve(delta); + for _ in 0..delta { + buf.push(rng.gen()); + } + continue; + } else { + // Regenerate `buf` in the loop below and see if that + // fixes things... 
+ eprintln!("Regenerating buffer data."); + } + } else { + // Shrink values in the end of `buf`, which is where + // `Arbitrary` pulls container lengths from. Then try again. + eprintln!("Shrinking buffer's tail values."); + let i = (buf.len() as f64).sqrt() as usize; + for j in i..buf.len() { + buf[j] /= 2; + } + continue; + } + } + Err(e) => { + eprintln!("warning: {}", e); + // Usually this happens because `A` requires a sequence utf-8 + // bytes but its given sequence wasn't valid utf-8. Just skip + // this iteration and try again after we've updated `buf` below. + } + }; + + // Double the size of the buffer every so often, so we don't only + // explore small inputs. + if num_checked == buf.len() { + buf.resize(std::cmp::min(buf.len() * 2, MAX_LENGTH), 0); + } + + for i in 0..buf.len() { + buf[i] = rng.gen(); + } + }; + + // Shrink the failing input. + let mut smallest_failing_input = failing_input; + let mut panic_info = panic_info; + 'shrinking: loop { + eprintln!("Smallest failing input: {:#?}", smallest_failing_input); + for input in smallest_failing_input.shrink() { + if let Err(p) = panic::catch_unwind(panic::AssertUnwindSafe(|| f(input.clone()))) { + smallest_failing_input = input; + panic_info = p; + continue 'shrinking; + } + } + break; + } + + // Resume the panic for the smallest input. + panic::resume_unwind(panic_info); +} diff --git a/cranelift/peepmatic/crates/fuzzing/src/parser.rs b/cranelift/peepmatic/crates/fuzzing/src/parser.rs new file mode 100644 index 0000000000..a9972ff7ff --- /dev/null +++ b/cranelift/peepmatic/crates/fuzzing/src/parser.rs @@ -0,0 +1,29 @@ +//! Utilities for fuzzing our DSL's parser. + +use peepmatic::Optimizations; +use std::str; + +/// Attempt to parse the given string as if it were a snippet of our DSL. 
+pub fn parse(data: &[u8]) { + let source = match str::from_utf8(data) { + Ok(s) => s, + Err(_) => return, + }; + + let buf = match wast::parser::ParseBuffer::new(&source) { + Ok(buf) => buf, + Err(_) => return, + }; + + let _ = wast::parser::parse::(&buf); +} + +#[cfg(test)] +mod tests { + use super::*; + + #[test] + fn check_parse() { + crate::check(|s: String| parse(s.as_bytes())); + } +} diff --git a/cranelift/peepmatic/crates/macro/Cargo.toml b/cranelift/peepmatic/crates/macro/Cargo.toml new file mode 100644 index 0000000000..e13cffd988 --- /dev/null +++ b/cranelift/peepmatic/crates/macro/Cargo.toml @@ -0,0 +1,15 @@ +[package] +name = "peepmatic-macro" +version = "0.1.0" +authors = ["Nick Fitzgerald "] +edition = "2018" + +# See more keys and their definitions at https://doc.rust-lang.org/cargo/reference/manifest.html + +[dependencies] +proc-macro2 = "1.0.9" +quote = "1.0.3" +syn = { version = "1.0.16", features = ['extra-traits'] } + +[lib] +proc_macro = true diff --git a/cranelift/peepmatic/crates/macro/src/child_nodes.rs b/cranelift/peepmatic/crates/macro/src/child_nodes.rs new file mode 100644 index 0000000000..c71ac409a0 --- /dev/null +++ b/cranelift/peepmatic/crates/macro/src/child_nodes.rs @@ -0,0 +1,110 @@ +use quote::quote; +use syn::DeriveInput; +use syn::{parse_quote, GenericParam, Generics, Result}; + +pub fn derive_child_nodes(input: &DeriveInput) -> Result { + let children = get_child_nodes(&input.data)?; + let name = &input.ident; + let generics = add_trait_bounds(input.generics.clone()); + let (impl_generics, ty_generics, where_clause) = generics.split_for_impl(); + + Ok(quote! 
{ + impl #impl_generics ChildNodes<'a, 'a> for #name #ty_generics #where_clause { + fn child_nodes(&'a self, children: &mut impl Extend>) { + #children + } + } + }) +} + +fn get_child_nodes(data: &syn::Data) -> Result { + match data { + syn::Data::Struct(s) => { + let mut fields = vec![]; + + match &s.fields { + syn::Fields::Named(n) => { + for f in n.named.iter() { + let opts = crate::PeepmaticOpts::from_attrs(&mut f.attrs.clone())?; + + if opts.skip_child { + continue; + } + + let field_name = f.ident.as_ref().unwrap(); + if opts.flatten { + fields.push(quote! { + self.#field_name.iter().map(DynAstRef::from) + }); + } else { + fields.push(quote! { + std::iter::once(DynAstRef::from(&self.#field_name)) + }); + } + } + } + syn::Fields::Unnamed(u) => { + for (i, f) in u.unnamed.iter().enumerate() { + let opts = crate::PeepmaticOpts::from_attrs(&mut f.attrs.clone())?; + if opts.skip_child { + continue; + } + if opts.flatten { + return Err(syn::Error::new( + u.paren_token.span, + "#[peepmatic(flatten)] is only allowed with named fields", + )); + } + fields.push(quote! { + std::iter::once(DynAstRef::from(&self.#i)) + }); + } + } + syn::Fields::Unit => {} + } + + Ok(match fields.as_slice() { + [] => quote! { let _ = children; }, + [f, rest @ ..] => { + let rest = rest.iter().map(|f| { + quote! { + .chain(#f) + } + }); + quote! { + children.extend( #f #( #rest )* ); + } + } + }) + } + syn::Data::Enum(e) => { + let mut match_arms = vec![]; + for v in e.variants.iter() { + match v.fields { + syn::Fields::Unnamed(ref u) if u.unnamed.len() == 1 => { + let variant = &v.ident; + match_arms.push(quote! { + Self::#variant(x) => children.extend(Some(x.into())), + }); + } + _ => panic!("#[derive(ChildNodes)] only supports enums whose variants all ahve a single unnamed field") + } + } + Ok(quote! 
{ + match self { + #( #match_arms )* + } + }) + } + syn::Data::Union(_) => panic!("#[derive(ChildNodes)] is not supported on unions"), + } +} + +fn add_trait_bounds(mut generics: Generics) -> Generics { + for param in &mut generics.params { + if let GenericParam::Type(type_param) = param { + type_param.bounds.push(parse_quote!(ChildNodes<'a, 'a>)); + } + } + generics +} diff --git a/cranelift/peepmatic/crates/macro/src/into_dyn_ast_ref.rs b/cranelift/peepmatic/crates/macro/src/into_dyn_ast_ref.rs new file mode 100644 index 0000000000..4cd993a72c --- /dev/null +++ b/cranelift/peepmatic/crates/macro/src/into_dyn_ast_ref.rs @@ -0,0 +1,23 @@ +use quote::quote; +use syn::DeriveInput; +use syn::Result; + +pub fn derive_into_dyn_ast_ref(input: &DeriveInput) -> Result { + let ty = &input.ident; + + let opts = crate::PeepmaticOpts::from_attrs(&mut input.attrs.clone())?; + if opts.no_into_dyn_node { + return Ok(quote! {}); + } + + let (impl_generics, ty_generics, where_clause) = input.generics.split_for_impl(); + + Ok(quote! 
{ + impl #impl_generics From<&'a #ty #ty_generics> for DynAstRef<'a> #where_clause { + #[inline] + fn from(x: &'a #ty #ty_generics) -> Self { + Self::#ty(x) + } + } + }) +} diff --git a/cranelift/peepmatic/crates/macro/src/lib.rs b/cranelift/peepmatic/crates/macro/src/lib.rs new file mode 100644 index 0000000000..5375947c36 --- /dev/null +++ b/cranelift/peepmatic/crates/macro/src/lib.rs @@ -0,0 +1,156 @@ +extern crate proc_macro; + +use crate::proc_macro::TokenStream; +use proc_macro2::Span; +use quote::quote; +use syn::parse::{Parse, ParseStream}; +use syn::punctuated::Punctuated; +use syn::DeriveInput; +use syn::Error; +use syn::{parse_macro_input, Ident, Result}; + +mod child_nodes; +mod into_dyn_ast_ref; +mod operator; +mod span; + +#[proc_macro_derive(PeepmaticOperator, attributes(peepmatic))] +pub fn operator(input: TokenStream) -> TokenStream { + operator::derive_operator(input) +} + +#[proc_macro_derive(Ast, attributes(peepmatic))] +pub fn derive_ast(input: TokenStream) -> TokenStream { + let input = parse_macro_input!(input as DeriveInput); + + let span_impl = match span::derive_span(&input) { + Ok(s) => s, + Err(e) => return e.to_compile_error().into(), + }; + + let child_nodes_impl = match child_nodes::derive_child_nodes(&input) { + Ok(c) => c, + Err(e) => return e.to_compile_error().into(), + }; + + let into_dyn_ast_ref_impl = match into_dyn_ast_ref::derive_into_dyn_ast_ref(&input) { + Ok(n) => n, + Err(e) => return e.to_compile_error().into(), + }; + + let expanded = quote! { + #span_impl + #child_nodes_impl + #into_dyn_ast_ref_impl + }; + + TokenStream::from(expanded) +} + +#[derive(Default)] +pub(crate) struct PeepmaticOpts { + // `ChildNodes` options. + skip_child: bool, + flatten: bool, + + // `From<&'a Self> for DynAstRef<'a>` options. + no_into_dyn_node: bool, + + // Peepmatic operator options. 
+ immediates_paren: syn::token::Paren, + immediates: Vec, + params_paren: syn::token::Paren, + params: Vec, + result: Option, +} + +impl Parse for PeepmaticOpts { + fn parse(input: ParseStream) -> Result { + enum Attr { + Immediates(syn::token::Paren, Vec), + Params(syn::token::Paren, Vec), + Result(syn::Ident), + NoIntoDynNode, + SkipChild, + Flatten, + } + + let attrs = Punctuated::<_, syn::token::Comma>::parse_terminated(input)?; + let mut ret = PeepmaticOpts::default(); + for attr in attrs { + match attr { + Attr::Immediates(paren, imms) => { + ret.immediates_paren = paren; + ret.immediates = imms; + } + Attr::Params(paren, ps) => { + ret.params_paren = paren; + ret.params = ps; + } + Attr::Result(r) => ret.result = Some(r), + Attr::NoIntoDynNode => ret.no_into_dyn_node = true, + Attr::SkipChild => ret.skip_child = true, + Attr::Flatten => ret.flatten = true, + } + } + + return Ok(ret); + + impl Parse for Attr { + fn parse(input: ParseStream) -> Result { + let attr: Ident = input.parse()?; + if attr == "immediates" { + let inner; + let paren = syn::parenthesized!(inner in input); + let imms = Punctuated::<_, syn::token::Comma>::parse_terminated(&inner)?; + return Ok(Attr::Immediates(paren, imms.into_iter().collect())); + } + if attr == "params" { + let inner; + let paren = syn::parenthesized!(inner in input); + let params = Punctuated::<_, syn::token::Comma>::parse_terminated(&inner)?; + return Ok(Attr::Params(paren, params.into_iter().collect())); + } + if attr == "result" { + let inner; + syn::parenthesized!(inner in input); + return Ok(Attr::Result(syn::Ident::parse(&inner)?)); + } + if attr == "skip_child" { + return Ok(Attr::SkipChild); + } + if attr == "no_into_dyn_node" { + return Ok(Attr::NoIntoDynNode); + } + if attr == "flatten" { + return Ok(Attr::Flatten); + } + return Err(Error::new(attr.span(), "unexpected attribute")); + } + } + } +} + +fn peepmatic_attrs(attrs: &mut Vec) -> TokenStream { + let mut ret = proc_macro2::TokenStream::new(); + let 
ident = syn::Path::from(syn::Ident::new("peepmatic", Span::call_site())); + for i in (0..attrs.len()).rev() { + if attrs[i].path != ident { + continue; + } + let attr = attrs.remove(i); + let group = match attr.tokens.into_iter().next().unwrap() { + proc_macro2::TokenTree::Group(g) => g, + _ => panic!("#[peepmatic(...)] expected"), + }; + ret.extend(group.stream()); + ret.extend(quote! { , }); + } + return ret.into(); +} + +impl PeepmaticOpts { + pub(crate) fn from_attrs(attrs: &mut Vec) -> syn::Result { + syn::parse(peepmatic_attrs(attrs)) + } +} diff --git a/cranelift/peepmatic/crates/macro/src/operator.rs b/cranelift/peepmatic/crates/macro/src/operator.rs new file mode 100644 index 0000000000..0d53a1219d --- /dev/null +++ b/cranelift/peepmatic/crates/macro/src/operator.rs @@ -0,0 +1,325 @@ +//! Implementation of the `#[peepmatic]` macro for the `Operator` AST node. + +use crate::proc_macro::TokenStream; +use crate::PeepmaticOpts; +use proc_macro2::{Ident, Span}; +use quote::quote; +use syn::DeriveInput; +use syn::Error; +use syn::{parse_macro_input, Result}; + +pub fn derive_operator(input: TokenStream) -> TokenStream { + let input = parse_macro_input!(input as DeriveInput); + + let variants = match get_enum_variants(&input) { + Ok(v) => v, + Err(e) => return e.to_compile_error().into(), + }; + + let arity = match create_arity(&variants) { + Ok(a) => a, + Err(e) => return e.to_compile_error().into(), + }; + + let num_operators = variants.len(); + let type_methods = create_type_methods(&variants); + let parse_impl = create_parse_impl(&input.ident, &variants); + let display_impl = create_display_impl(&input.ident, &variants); + let try_from_u32_impl = create_try_from_u32_impl(&input.ident, &variants); + let ident = &input.ident; + + let expanded = quote! { + impl #ident { + #arity + #type_methods + + /// Get the total number of different operators. 
+ pub const fn num_operators() -> usize { + #num_operators + } + } + + #display_impl + #try_from_u32_impl + #parse_impl + }; + + // eprintln!("{}", expanded); + TokenStream::from(expanded) +} + +fn get_enum_variants(input: &DeriveInput) -> Result> { + let en = match &input.data { + syn::Data::Enum(en) => en, + syn::Data::Struct(_) => { + panic!("can only put #[peepmatic] on an enum; found it on a struct") + } + syn::Data::Union(_) => panic!("can only put #[peepmatic] on an enum; found it on a union"), + }; + en.variants + .iter() + .cloned() + .map(|mut variant| { + Ok(OperatorVariant { + opts: PeepmaticOpts::from_attrs(&mut variant.attrs)?, + syn: variant, + }) + }) + .collect() +} + +struct OperatorVariant { + syn: syn::Variant, + opts: PeepmaticOpts, +} + +fn create_arity(variants: &[OperatorVariant]) -> Result { + let mut imm_arities = vec![]; + let mut params_arities = vec![]; + + for v in variants { + let variant = &v.syn.ident; + + let imm_arity = v.opts.immediates.len(); + if imm_arity > std::u8::MAX as usize { + return Err(Error::new( + v.opts.immediates_paren.span, + "cannot have more than u8::MAX immediates", + )); + } + let imm_arity = imm_arity as u8; + + imm_arities.push(quote! { + Self::#variant => #imm_arity, + }); + + let params_arity = v.opts.params.len(); + if params_arity > std::u8::MAX as usize { + return Err(Error::new( + v.opts.params_paren.span, + "cannot have more than u8::MAX params", + )); + } + let params_arity = params_arity as u8; + + params_arities.push(quote! { + Self::#variant => #params_arity, + }); + } + + Ok(quote! { + /// Get the number of immediates that this operator has. + pub fn immediates_arity(&self) -> u8 { + match *self { + #( #imm_arities )* + } + } + + /// Get the number of parameters that this operator takes. 
+ pub fn params_arity(&self) -> u8 { + match *self { + #( #params_arities )* + } + } + }) +} + +fn create_type_methods(variants: &[OperatorVariant]) -> impl quote::ToTokens { + let mut result_types = vec![]; + let mut imm_types = vec![]; + let mut param_types = vec![]; + + for v in variants { + let variant = &v.syn.ident; + + let result_ty = v.opts.result.as_ref().unwrap_or_else(|| { + panic!( + "must define #[peepmatic(result(..))] on operator `{}`", + variant + ) + }); + result_types.push(quote! { + Self::#variant => { + context.#result_ty(span) + } + }); + + let imm_tys = match &v.opts.immediates[..] { + [] => quote! {}, + [ty, rest @ ..] => { + let rest = rest.iter().map(|ty| { + quote! { .chain(::std::iter::once(context.#ty(span))) } + }); + quote! { + types.extend(::std::iter::once(context.#ty(span))#( #rest )*); + } + } + }; + imm_types.push(quote! { + Self::#variant => { + #imm_tys + } + }); + + let param_tys = match &v.opts.params[..] { + [] => quote! {}, + [ty, rest @ ..] => { + let rest = rest.iter().map(|ty| { + quote! { .chain(::std::iter::once(context.#ty(span))) } + }); + quote! { + types.extend(::std::iter::once(context.#ty(span))#( #rest )*); + } + } + }; + param_types.push(quote! { + Self::#variant => { + #param_tys + } + }); + } + + quote! { + /// Get the result type of this operator. + #[cfg(feature = "construct")] + pub fn result_type<'a, C>( + &self, + context: &mut C, + span: wast::Span, + ) -> C::TypeVariable + where + C: 'a + TypingContext<'a>, + { + match *self { + #( #result_types )* + } + } + + /// Get the immediate types of this operator. + #[cfg(feature = "construct")] + pub fn immediate_types<'a, C>( + &self, + context: &mut C, + span: wast::Span, + types: &mut impl Extend, + ) + where + C: 'a + TypingContext<'a>, + { + match *self { + #( #imm_types )* + } + } + + /// Get the parameter types of this operator. 
+ #[cfg(feature = "construct")] + pub fn param_types<'a, C>( + &self, + context: &mut C, + span: wast::Span, + types: &mut impl Extend, + ) + where + C: 'a + TypingContext<'a>, + { + match *self { + #( #param_types )* + } + } + } +} + +fn snake_case(s: &str) -> String { + let mut t = String::with_capacity(s.len() + 1); + for (i, ch) in s.chars().enumerate() { + if i != 0 && ch.is_uppercase() { + t.push('_'); + } + t.extend(ch.to_lowercase()); + } + t +} + +fn create_parse_impl(ident: &syn::Ident, variants: &[OperatorVariant]) -> impl quote::ToTokens { + let token_defs = variants.iter().map(|v| { + let tok = snake_case(&v.syn.ident.to_string()); + let tok = Ident::new(&tok, Span::call_site()); + quote! { + wast::custom_keyword!(#tok); + } + }); + + let parses = variants.iter().map(|v| { + let tok = snake_case(&v.syn.ident.to_string()); + let tok = Ident::new(&tok, Span::call_site()); + let ident = &v.syn.ident; + quote! { + if p.peek::<#tok>() { + p.parse::<#tok>()?; + return Ok(Self::#ident); + } + } + }); + + let expected = format!("expected {}", ident); + + quote! { + #[cfg(feature = "construct")] + impl<'a> wast::parser::Parse<'a> for #ident { + fn parse(p: wast::parser::Parser<'a>) -> wast::parser::Result { + #( #token_defs )* + + #( #parses )* + + Err(p.error(#expected)) + } + } + } +} + +fn create_display_impl(ident: &syn::Ident, variants: &[OperatorVariant]) -> impl quote::ToTokens { + let displays = variants.iter().map(|v| { + let variant = &v.syn.ident; + let snake = snake_case(&v.syn.ident.to_string()); + quote! { + Self::#variant => write!(f, #snake), + } + }); + + quote! { + impl std::fmt::Display for #ident { + fn fmt(&self, f: &mut std::fmt::Formatter) -> std::fmt::Result { + match self { + #( #displays )* + } + } + } + } +} + +fn create_try_from_u32_impl( + ident: &syn::Ident, + variants: &[OperatorVariant], +) -> impl quote::ToTokens { + let matches = variants.iter().map(|v| { + let variant = &v.syn.ident; + quote! 
{ + x if Self::#variant as u32 == x => Ok(Self::#variant), + } + }); + + let error_msg = format!("value is not an `{}`", ident); + + quote! { + impl std::convert::TryFrom for #ident { + type Error = &'static str; + + fn try_from(value: u32) -> Result { + match value { + #( #matches )* + _ => Err(#error_msg) + } + } + } + } +} diff --git a/cranelift/peepmatic/crates/macro/src/span.rs b/cranelift/peepmatic/crates/macro/src/span.rs new file mode 100644 index 0000000000..bdc0a63655 --- /dev/null +++ b/cranelift/peepmatic/crates/macro/src/span.rs @@ -0,0 +1,52 @@ +use quote::quote; +use syn::DeriveInput; +use syn::{parse_quote, GenericParam, Generics, Result}; + +pub fn derive_span(input: &DeriveInput) -> Result { + let ty = &input.ident; + + let body = match &input.data { + syn::Data::Struct(_) => quote! { self.span }, + syn::Data::Enum(e) => { + let variants = e.variants.iter().map(|v| match v.fields { + syn::Fields::Unnamed(ref fields) if fields.unnamed.len() == 1 => { + let variant = &v.ident; + quote! { #ty::#variant(x) => x.span(), } + } + _ => panic!( + "derive(Ast) on enums only supports variants with a single, unnamed field" + ), + }); + quote! { + match self { + #( #variants )* + } + } + } + syn::Data::Union(_) => { + panic!("derive(Ast) can only be used with structs and enums, not unions") + } + }; + + let generics = add_span_trait_bounds(input.generics.clone()); + let (impl_generics, ty_generics, where_clause) = generics.split_for_impl(); + + Ok(quote! { + impl #impl_generics Span for #ty #ty_generics #where_clause { + #[inline] + fn span(&self) -> wast::Span { + #body + } + } + }) +} + +// Add a bound `T: Span` to every type parameter `T`. 
+fn add_span_trait_bounds(mut generics: Generics) -> Generics { + for param in &mut generics.params { + if let GenericParam::Type(ref mut type_param) = *param { + type_param.bounds.push(parse_quote!(Span)); + } + } + generics +} diff --git a/cranelift/peepmatic/crates/runtime/Cargo.toml b/cranelift/peepmatic/crates/runtime/Cargo.toml new file mode 100644 index 0000000000..0a5312ed86 --- /dev/null +++ b/cranelift/peepmatic/crates/runtime/Cargo.toml @@ -0,0 +1,24 @@ +[package] +name = "peepmatic-runtime" +version = "0.1.0" +authors = ["Nick Fitzgerald "] +edition = "2018" + +# See more keys and their definitions at https://doc.rust-lang.org/cargo/reference/manifest.html + +[dependencies] +bincode = "1.2.1" +bumpalo = "3.2.0" +log = "0.4.8" +peepmatic-automata = { version = "0.1.0", path = "../automata", features = ["serde"] } +peepmatic-macro = { version = "0.1.0", path = "../macro" } +serde = { version = "1.0.105", features = ["derive"] } +thiserror = "1.0.15" +wast = { version = "15.0.0", optional = true } + + +[features] +# Enable support for a few extra methods that are required by the `peepmatic` +# crate when constructing peephole optimizers, but are not needed when simply +# using already-constructed peephole optimizers. +construct = ["wast"] diff --git a/cranelift/peepmatic/crates/runtime/src/cc.rs b/cranelift/peepmatic/crates/runtime/src/cc.rs new file mode 100644 index 0000000000..d6cb489eab --- /dev/null +++ b/cranelift/peepmatic/crates/runtime/src/cc.rs @@ -0,0 +1,92 @@ +//! Condition codes. + +use serde::{Deserialize, Serialize}; +use std::convert::TryFrom; +use std::fmt; + +/// A condition code. +/// +/// This is a special kind of immediate for `icmp` instructions that dictate +/// which parts of the comparison result we care about. +#[derive(Clone, Copy, Debug, PartialEq, Eq, Hash, Serialize, Deserialize)] +#[repr(u32)] +pub enum ConditionCode { + /// Equal. 
+ // NB: We convert `ConditionCode` into `NonZeroU32`s with unchecked + // conversions; memory safety relies on no variant being zero. + Eq = 1, + + /// Not equal. + Ne, + + /// Signed less than. + Slt, + + /// Unsigned less than. + Ult, + + /// Signed greater than or equal. + Sge, + + /// Unsigned greater than or equal. + Uge, + + /// Signed greater than. + Sgt, + + /// Unsigned greater than. + Ugt, + + /// Signed less than or equal. + Sle, + + /// Unsigned less than or equal. + Ule, + + /// Overflow. + Of, + + /// No overflow. + Nof, +} + +impl TryFrom for ConditionCode { + type Error = &'static str; + + fn try_from(x: u32) -> Result { + Ok(match x { + x if Self::Eq as u32 == x => Self::Eq, + x if Self::Ne as u32 == x => Self::Ne, + x if Self::Slt as u32 == x => Self::Slt, + x if Self::Ult as u32 == x => Self::Ult, + x if Self::Sge as u32 == x => Self::Sge, + x if Self::Uge as u32 == x => Self::Uge, + x if Self::Sgt as u32 == x => Self::Sgt, + x if Self::Ugt as u32 == x => Self::Ugt, + x if Self::Sle as u32 == x => Self::Sle, + x if Self::Ule as u32 == x => Self::Ule, + x if Self::Of as u32 == x => Self::Of, + x if Self::Nof as u32 == x => Self::Nof, + _ => return Err("not a valid condition code value"), + }) + } +} + +impl fmt::Display for ConditionCode { + fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result { + match self { + Self::Eq => write!(f, "eq"), + Self::Ne => write!(f, "ne"), + Self::Slt => write!(f, "slt"), + Self::Ult => write!(f, "ult"), + Self::Sge => write!(f, "sge"), + Self::Uge => write!(f, "uge"), + Self::Sgt => write!(f, "sgt"), + Self::Ugt => write!(f, "ugt"), + Self::Sle => write!(f, "sle"), + Self::Ule => write!(f, "ule"), + Self::Of => write!(f, "of"), + Self::Nof => write!(f, "nof"), + } + } +} diff --git a/cranelift/peepmatic/crates/runtime/src/error.rs b/cranelift/peepmatic/crates/runtime/src/error.rs new file mode 100644 index 0000000000..3453316238 --- /dev/null +++ b/cranelift/peepmatic/crates/runtime/src/error.rs @@ -0,0 +1,44 @@ 
+//! `Error` and `Result` types for this crate. + +use std::io; +use thiserror::Error; + +/// A result type containing `Ok(T)` or `Err(peepmatic_runtime::Error)`. +pub type Result = std::result::Result; + +/// Errors that `peepmatic_runtime` may generate. +#[derive(Debug, Error)] +#[error(transparent)] +pub struct Error { + #[from] + inner: Box, +} + +#[derive(Debug, Error)] +enum ErrorInner { + #[error(transparent)] + Io(#[from] io::Error), + + #[error(transparent)] + Bincode(#[from] bincode::Error), +} + +impl From for Error { + fn from(e: io::Error) -> Error { + let e: ErrorInner = e.into(); + e.into() + } +} + +impl From for Error { + fn from(e: bincode::Error) -> Error { + let e: ErrorInner = e.into(); + e.into() + } +} + +impl From for Error { + fn from(e: ErrorInner) -> Error { + Box::new(e).into() + } +} diff --git a/cranelift/peepmatic/crates/runtime/src/instruction_set.rs b/cranelift/peepmatic/crates/runtime/src/instruction_set.rs new file mode 100644 index 0000000000..4d9a0752e5 --- /dev/null +++ b/cranelift/peepmatic/crates/runtime/src/instruction_set.rs @@ -0,0 +1,143 @@ +//! Interfacing with actual instructions. + +use crate::operator::Operator; +use crate::part::{Constant, Part}; +use crate::paths::Path; +use crate::r#type::Type; +use std::fmt::Debug; + +/// A trait for interfacing with actual instruction sequences. +/// +/// This trait enables both: +/// +/// * `peepmatic-runtime` to be used by `cranelift-codegen` without a circular +/// dependency from `peepmatic-runtime` to `cranelift-codegen` to get access +/// to Cranelift's IR types, and +/// +/// * enables us to write local tests that exercise peephole optimizers on a +/// simple, testing-only instruction set without pulling in all of Cranelift. +/// +/// Finally, this should also make the task of adding support for Cranelift's +/// new `MachInst` and vcode backend easier, since all that needs to be done is +/// "just" implementing this trait. 
(And probably add/modify some +/// `peepmatic_runtime::operation::Operation`s as well). +/// +/// ## Safety +/// +/// See doc comment for `instruction_result_bit_width`. +pub unsafe trait InstructionSet<'a> { + /// Mutable context passed into all trait methods. Can be whatever you want! + /// + /// In practice, this is a `FuncCursor` for `cranelift-codegen`'s trait + /// implementation. + type Context; + + /// An instruction (or identifier for an instruction). + type Instruction: Copy + Debug + Eq; + + /// Replace the `old` instruction with `new`. + /// + /// `new` is either a `Part::Instruction` or a constant `Part::Boolean` or + /// `Part::Integer`. In the former case, it can directly replace `old`. In + /// the latter case, implementations of this trait should transparently + /// create an `iconst` or `bconst` instruction to wrap the given constant. + /// + /// `new` will never be `Part::ConditionCode`. + fn replace_instruction( + &self, + context: &mut Self::Context, + old: Self::Instruction, + new: Part, + ) -> Self::Instruction; + + /// Get the instruction, constant, or condition code at the given path. + /// + /// If there is no such entity at the given path (e.g. we run into a + /// function parameter and can't traverse the path any further) then `None` + /// should be returned. + fn get_part_at_path( + &self, + context: &mut Self::Context, + root: Self::Instruction, + path: Path, + ) -> Option>; + + /// Get the given instruction's operator. + /// + /// If the instruction's opcode does not have an associated + /// `peepmatic_runtime::operator::Operator` variant (i.e. that instruction + /// isn't supported by `peepmatic` yet) then `None` should be returned. + fn operator(&self, context: &mut Self::Context, instr: Self::Instruction) -> Option; + + /// Make a unary instruction. + /// + /// If the type is not given, then it should be inferred. 
+ fn make_inst_1( + &self, + context: &mut Self::Context, + root: Self::Instruction, + operator: Operator, + r#type: Type, + a: Part, + ) -> Self::Instruction; + + /// Make a binary instruction. + /// + /// Operands are given as immediates first and arguments following + /// them. Condition codes are treated as immediates. So if we are creating + /// an `iadd_imm` instruction, then `a` will be the constant integer + /// immediate and `b` will be the instruction whose result is the dynamic + /// argument. + fn make_inst_2( + &self, + context: &mut Self::Context, + root: Self::Instruction, + operator: Operator, + r#type: Type, + a: Part, + b: Part, + ) -> Self::Instruction; + + /// Make a ternary instruction. + /// + /// Operands are given as immediates first and arguments following + /// them. Condition codes are treated as immediates. So if we are creating + /// an `icmp` instruction, then `a` will be the condition code, and `b` and + /// `c` will be instructions whose results are the dynamic arguments. + fn make_inst_3( + &self, + context: &mut Self::Context, + root: Self::Instruction, + operator: Operator, + r#type: Type, + a: Part, + b: Part, + c: Part, + ) -> Self::Instruction; + + /// Try to resolve the given instruction into a constant value. + /// + /// If we can tell that the instruction returns a constant value, then + /// return that constant value as either a `Part::Boolean` or + /// `Part::Integer`. Otherwise, return `None`. + fn instruction_to_constant( + &self, + context: &mut Self::Context, + inst: Self::Instruction, + ) -> Option; + + /// Get the bit width of the given instruction's result. + /// + /// ## Safety + /// + /// There is code that makes memory-safety assumptions that the result is + /// always one of 1, 8, 16, 32, 64, or 128. Implementors must uphold this. + fn instruction_result_bit_width( + &self, + context: &mut Self::Context, + inst: Self::Instruction, + ) -> u8; + + /// Get the size of a native word in bits. 
+ fn native_word_size_in_bits(&self, context: &mut Self::Context) -> u8; +} diff --git a/cranelift/peepmatic/crates/runtime/src/integer_interner.rs b/cranelift/peepmatic/crates/runtime/src/integer_interner.rs new file mode 100644 index 0000000000..996100a66d --- /dev/null +++ b/cranelift/peepmatic/crates/runtime/src/integer_interner.rs @@ -0,0 +1,73 @@ +//! Interner for (potentially large) integer values. +//! +//! We support matching on integers that can be represented by `u64`, but only +//! support automata results that fit in a `u32`. So we intern the (relatively +//! few compared to the full range of `u64`) integers we are matching against +//! here and then reference them by `IntegerId`. + +use serde::{Deserialize, Serialize}; +use std::collections::BTreeMap; +use std::num::{NonZeroU16, NonZeroU32}; + +/// An identifier for an interned integer. +#[derive(Clone, Copy, Debug, PartialEq, Eq, Hash, Serialize, Deserialize)] +pub struct IntegerId(#[doc(hidden)] pub NonZeroU16); + +/// An interner for integer values. +#[derive(Debug, Default, Serialize, Deserialize)] +pub struct IntegerInterner { + // Note: we use `BTreeMap`s for deterministic serialization. + map: BTreeMap, + values: Vec, +} + +impl IntegerInterner { + /// Construct a new `IntegerInterner`. + #[inline] + pub fn new() -> Self { + Self::default() + } + + /// Intern a value into this `IntegerInterner`, returning its canonical + /// `IntegerId`. 
+ #[inline] + pub fn intern(&mut self, value: impl Into) -> IntegerId { + debug_assert_eq!(self.map.len(), self.values.len()); + + let value = value.into(); + + if let Some(id) = self.map.get(&value) { + return *id; + } + + assert!((self.values.len() as u64) < (std::u16::MAX as u64)); + let id = IntegerId(unsafe { NonZeroU16::new_unchecked(self.values.len() as u16 + 1) }); + + self.values.push(value); + self.map.insert(value, id); + debug_assert_eq!(self.map.len(), self.values.len()); + + id + } + + /// Get the id of an already-interned integer, or `None` if it has not been + /// interned. + pub fn already_interned(&self, value: impl Into) -> Option { + let value = value.into(); + self.map.get(&value).copied() + } + + /// Lookup a previously interned integer by id. + #[inline] + pub fn lookup(&self, id: IntegerId) -> u64 { + let index = id.0.get() as usize - 1; + self.values[index] + } +} + +impl From for NonZeroU32 { + #[inline] + fn from(id: IntegerId) -> NonZeroU32 { + id.0.into() + } +} diff --git a/cranelift/peepmatic/crates/runtime/src/lib.rs b/cranelift/peepmatic/crates/runtime/src/lib.rs new file mode 100755 index 0000000000..ae45c42f2b --- /dev/null +++ b/cranelift/peepmatic/crates/runtime/src/lib.rs @@ -0,0 +1,34 @@ +//! Runtime support for `peepmatic`'s peephole optimizers. +//! +//! This crate contains everything required to use a `peepmatic`-generated +//! peephole optimizer. +//! +//! ## Why is this a different crate from `peepmatic`? +//! +//! In short: build times and code size. +//! +//! If you are just using a peephole optimizer, you shouldn't need the functions +//! to construct it from scratch from the DSL (and the implied code size and +//! compilation time), let alone even build it at all. You should just +//! deserialize an already-built peephole optimizer, and then use it. +//! +//! That's all that is contained here in this crate. 
+ +#![deny(missing_docs)] +#![deny(missing_debug_implementations)] + +pub mod cc; +pub mod error; +pub mod instruction_set; +pub mod integer_interner; +pub mod linear; +pub mod operator; +pub mod optimizations; +pub mod optimizer; +pub mod part; +pub mod paths; +pub mod r#type; + +pub use error::{Error, Result}; +pub use optimizations::PeepholeOptimizations; +pub use optimizer::PeepholeOptimizer; diff --git a/cranelift/peepmatic/crates/runtime/src/linear.rs b/cranelift/peepmatic/crates/runtime/src/linear.rs new file mode 100644 index 0000000000..f156311740 --- /dev/null +++ b/cranelift/peepmatic/crates/runtime/src/linear.rs @@ -0,0 +1,264 @@ +//! A linear IR for optimizations. +//! +//! This IR is designed such that it should be easy to combine multiple linear +//! optimizations into a single automata. +//! +//! See also `src/linearize.rs` for the AST to linear IR translation pass. + +use crate::cc::ConditionCode; +use crate::integer_interner::{IntegerId, IntegerInterner}; +use crate::operator::{Operator, UnquoteOperator}; +use crate::paths::{PathId, PathInterner}; +use crate::r#type::{BitWidth, Type}; +use serde::{Deserialize, Serialize}; +use std::num::NonZeroU32; + +/// A set of linear optimizations. +#[derive(Debug)] +pub struct Optimizations { + /// The linear optimizations. + pub optimizations: Vec, + + /// The de-duplicated paths referenced by these optimizations. + pub paths: PathInterner, + + /// The integer literals referenced by these optimizations. + pub integers: IntegerInterner, +} + +/// A linearized optimization. +#[derive(Clone, Debug, PartialEq, Eq)] +pub struct Optimization { + /// The chain of increments for this optimization. + pub increments: Vec, +} + +/// Match any value. +/// +/// This can be used to create fallback, wildcard-style transitions between +/// states. +#[derive(Clone, Copy, Debug, PartialEq, Eq, PartialOrd, Ord, Hash, Serialize, Deserialize)] +pub struct Else; + +/// The result of evaluating a `MatchOp`. 
+/// +/// This is either a specific non-zero `u32`, or a fallback that matches +/// everything. +pub type MatchResult = Result; + +/// Convert a boolean to a `MatchResult`. +#[inline] +pub fn bool_to_match_result(b: bool) -> MatchResult { + let b = b as u32; + unsafe { Ok(NonZeroU32::new_unchecked(b + 1)) } +} + +/// A partial match of an optimization's LHS and partial construction of its +/// RHS. +/// +/// An increment is a matching operation, the expected result from that +/// operation to continue to the next increment, and the actions to take to +/// build up the LHS scope and RHS instructions given that we got the expected +/// result from this increment's matching operation. Each increment will +/// basically become a state and a transition edge out of that state in the +/// final automata. +#[derive(Clone, Debug, PartialEq, Eq)] +pub struct Increment { + /// The matching operation to perform. + pub operation: MatchOp, + + /// The expected result of our matching operation, that enables us to + /// continue to the next increment, or `Else` for "don't care" + /// wildcard-style matching. + pub expected: MatchResult, + + /// Actions to perform, given that the operation resulted in the expected + /// value. + pub actions: Vec, +} + +/// A matching operation to be performed on some Cranelift instruction as part +/// of determining whether an optimization is applicable. +#[derive(Clone, Copy, Debug, PartialEq, Eq, Hash, Deserialize, Serialize)] +pub enum MatchOp { + /// Switch on the opcode of an instruction. + Opcode { + /// The path to the instruction whose opcode we're switching on. + path: PathId, + }, + + /// Does an instruction have a constant value? + IsConst { + /// The path to the instruction (or immediate) that we're checking + /// whether it is constant or not. + path: PathId, + }, + + /// Is the constant value a power of two? 
+ IsPowerOfTwo { + /// The path to the instruction (or immediate) that we are checking + /// whether it is a constant power of two or not. + path: PathId, + }, + + /// Switch on the bit width of a value. + BitWidth { + /// The path to the instruction (or immediate) whose result's bit width + /// we are checking. + path: PathId, + }, + + /// Does the value fit in our target architecture's native word size? + FitsInNativeWord { + /// The path to the instruction (or immediate) whose result we are + /// checking whether it fits in a native word or not. + path: PathId, + }, + + /// Are the instructions (or immediates) at the given paths the same? + Eq { + /// The path to the first instruction (or immediate). + path_a: PathId, + /// The path to the second instruction (or immediate). + path_b: PathId, + }, + + /// Switch on the constant integer value of an instruction. + IntegerValue { + /// The path to the instruction. + path: PathId, + }, + + /// Switch on the constant boolean value of an instruction. + BooleanValue { + /// The path to the instruction. + path: PathId, + }, + + /// Switch on a condition code. + ConditionCode { + /// The path to the condition code. + path: PathId, + }, + + /// No operation. Always evaluates to `None`. + /// + /// Exceedingly rare in real optimizations; nonetheless required to support + /// corner cases of the DSL, such as a LHS pattern that is nothing but a + /// variable pattern. + Nop, +} + +/// A canonicalized identifier for a left-hand side value that was bound in a +/// pattern. +#[derive(Clone, Copy, Debug, PartialEq, Eq, Hash, PartialOrd, Ord, Serialize, Deserialize)] +pub struct LhsId(pub u16); + +/// A canonicalized identifier for a right-hand side value. +#[derive(Clone, Copy, Debug, PartialEq, Eq, Hash, Serialize, Deserialize)] +pub struct RhsId(pub u16); + +/// An action to perform when transitioning between states in the automata. +/// +/// When evaluating actions, the `i^th` action implicitly defines the +/// `RhsId(i)`. 
+#[derive(Clone, Copy, Debug, PartialEq, Eq, Hash, Serialize, Deserialize)] +pub enum Action { + /// Reuse something from the left-hand side. + GetLhs { + /// The path to the instruction or value. + path: PathId, + }, + + /// Perform compile-time evaluation. + UnaryUnquote { + /// The unquote operator. + operator: UnquoteOperator, + /// The constant operand to this unquote. + operand: RhsId, + }, + + /// Perform compile-time evaluation. + BinaryUnquote { + /// The unquote operator. + operator: UnquoteOperator, + /// The constant operands to this unquote. + operands: [RhsId; 2], + }, + + /// Create an integer constant. + MakeIntegerConst { + /// The constant integer value. + value: IntegerId, + /// The bit width of this constant. + bit_width: BitWidth, + }, + + /// Create a boolean constant. + MakeBooleanConst { + /// The constant boolean value. + value: bool, + /// The bit width of this constant. + bit_width: BitWidth, + }, + + /// Create a condition code. + MakeConditionCode { + /// The condition code. + cc: ConditionCode, + }, + + /// Make a unary instruction. + MakeUnaryInst { + /// The operand for this instruction. + operand: RhsId, + /// The type of this instruction's result. + r#type: Type, + /// The operator for this instruction. + operator: Operator, + }, + + /// Make a binary instruction. + MakeBinaryInst { + /// The opcode for this instruction. + operator: Operator, + /// The type of this instruction's result. + r#type: Type, + /// The operands for this instruction. + operands: [RhsId; 2], + }, + + /// Make a ternary instruction. + MakeTernaryInst { + /// The opcode for this instruction. + operator: Operator, + /// The type of this instruction's result. + r#type: Type, + /// The operands for this instruction. + operands: [RhsId; 3], + }, +} + +#[cfg(test)] +mod tests { + use super::*; + + // These types all end up in the automaton, so we should take care that they + // are small and don't fill up the data cache (or take up too much + // serialized size). 
+ + #[test] + fn match_result_size() { + assert_eq!(std::mem::size_of::(), 4); + } + + #[test] + fn match_op_size() { + assert_eq!(std::mem::size_of::(), 6); + } + + #[test] + fn action_size() { + assert_eq!(std::mem::size_of::(), 16); + } +} diff --git a/cranelift/peepmatic/crates/runtime/src/operator.rs b/cranelift/peepmatic/crates/runtime/src/operator.rs new file mode 100644 index 0000000000..c8f06b8514 --- /dev/null +++ b/cranelift/peepmatic/crates/runtime/src/operator.rs @@ -0,0 +1,298 @@ +//! Operator definitions. + +use peepmatic_macro::PeepmaticOperator; +use serde::{Deserialize, Serialize}; + +/// An operator. +/// +/// These are a subset of Cranelift IR's operators. +/// +/// ## Caveats for Branching and Trapping Operators +/// +/// Branching operators are not fully modeled: we do not represent their label +/// and jump arguments. It is up to the interpreter doing the instruction +/// replacement to recognize when we are replacing one branch with another, and +/// copy over the extra information. +/// +/// Affected operations: `brz`, `brnz`, `trapz`, `trapnz`. +#[derive(PeepmaticOperator, Clone, Copy, PartialEq, Eq, Hash, Debug, Serialize, Deserialize)] +#[repr(u32)] +pub enum Operator { + /// `adjust_sp_down` + #[peepmatic(params(iNN), result(void))] + // NB: We convert `Operator`s into `NonZeroU32`s with unchecked casts; + // memory safety relies on `Operator` starting at `1` and no variant ever + // being zero. 
+ AdjustSpDown = 1, + + /// `adjust_sp_down_imm` + #[peepmatic(immediates(iNN), result(void))] + AdjustSpDownImm, + + /// `band` + #[peepmatic(params(iNN, iNN), result(iNN))] + Band, + + /// `band_imm` + #[peepmatic(immediates(iNN), params(iNN), result(iNN))] + BandImm, + + /// `bconst` + #[peepmatic(immediates(b1), result(bNN))] + Bconst, + + /// `bint` + #[peepmatic(params(bNN), result(iNN))] + Bint, + + /// `bor` + #[peepmatic(params(iNN, iNN), result(iNN))] + Bor, + + /// `bor_imm` + #[peepmatic(immediates(iNN), params(iNN), result(iNN))] + BorImm, + + /// `brnz` + #[peepmatic(params(bool_or_int), result(void))] + Brnz, + + /// `brz` + #[peepmatic(params(bool_or_int), result(void))] + Brz, + + /// `bxor` + #[peepmatic(params(iNN, iNN), result(iNN))] + Bxor, + + /// `bxor_imm` + #[peepmatic(immediates(iNN), params(iNN), result(iNN))] + BxorImm, + + /// `iadd` + #[peepmatic(params(iNN, iNN), result(iNN))] + Iadd, + + /// `iadd_imm` + #[peepmatic(immediates(iNN), params(iNN), result(iNN))] + IaddImm, + + /// `icmp` + #[peepmatic(immediates(cc), params(iNN, iNN), result(b1))] + Icmp, + + /// `icmp_imm` + #[peepmatic(immediates(cc, iNN), params(iNN), result(b1))] + IcmpImm, + + /// `iconst` + #[peepmatic(immediates(iNN), result(iNN))] + Iconst, + + /// `ifcmp` + #[peepmatic(params(iNN, iNN), result(cpu_flags))] + Ifcmp, + + /// `ifcmp_imm` + #[peepmatic(immediates(iNN), params(iNN), result(cpu_flags))] + IfcmpImm, + + /// `imul` + #[peepmatic(params(iNN, iNN), result(iNN))] + Imul, + + /// `imul_imm` + #[peepmatic(immediates(iNN), params(iNN), result(iNN))] + ImulImm, + + /// `ireduce` + #[peepmatic(params(iNN), result(iMM))] + Ireduce, + + /// `irsub_imm` + #[peepmatic(immediates(iNN), params(iNN), result(iNN))] + IrsubImm, + + /// `ishl` + #[peepmatic(params(iNN, iNN), result(iNN))] + Ishl, + + /// `ishl_imm` + #[peepmatic(immediates(iNN), params(iNN), result(iNN))] + IshlImm, + + /// `isub` + #[peepmatic(params(iNN, iNN), result(iNN))] + Isub, + + /// `rotl` + 
#[peepmatic(params(iNN, iNN), result(iNN))] + Rotl, + + /// `rotl_imm` + #[peepmatic(immediates(iNN), params(iNN), result(iNN))] + RotlImm, + + /// `rotr` + #[peepmatic(params(iNN, iNN), result(iNN))] + Rotr, + + /// `rotr_imm` + #[peepmatic(immediates(iNN), params(iNN), result(iNN))] + RotrImm, + + /// `sdiv` + #[peepmatic(params(iNN, iNN), result(iNN))] + Sdiv, + + /// `sdiv_imm` + #[peepmatic(immediates(iNN), params(iNN), result(iNN))] + SdivImm, + + /// `select` + #[peepmatic(params(bool_or_int, any_t, any_t), result(any_t))] + Select, + + /// `sextend` + #[peepmatic(params(iNN), result(iMM))] + Sextend, + + /// `srem` + #[peepmatic(params(iNN, iNN), result(iNN))] + Srem, + + /// `srem_imm` + #[peepmatic(immediates(iNN), params(iNN), result(iNN))] + SremImm, + + /// `sshr` + #[peepmatic(params(iNN, iNN), result(iNN))] + Sshr, + + /// `sshr_imm` + #[peepmatic(immediates(iNN), params(iNN), result(iNN))] + SshrImm, + + /// `trapnz` + #[peepmatic(params(bool_or_int), result(void))] + Trapnz, + + /// `trapz` + #[peepmatic(params(bool_or_int), result(void))] + Trapz, + + /// `udiv` + #[peepmatic(params(iNN, iNN), result(iNN))] + Udiv, + + /// `udiv_imm` + #[peepmatic(immediates(iNN), params(iNN), result(iNN))] + UdivImm, + + /// `uextend` + #[peepmatic(params(iNN), result(iMM))] + Uextend, + + /// `urem` + #[peepmatic(params(iNN, iNN), result(iNN))] + Urem, + + /// `urem_imm` + #[peepmatic(immediates(iNN), params(iNN), result(iNN))] + UremImm, + + /// `ushr` + #[peepmatic(params(iNN, iNN), result(iNN))] + Ushr, + + /// `ushr_imm` + #[peepmatic(immediates(iNN), params(iNN), result(iNN))] + UshrImm, +} + +/// Compile-time unquote operators. +/// +/// These are used in the right-hand side to perform compile-time evaluation of +/// constants matched on the left-hand side. +#[derive(PeepmaticOperator, Clone, Copy, PartialEq, Eq, Hash, Debug, Serialize, Deserialize)] +#[repr(u32)] +pub enum UnquoteOperator { + /// Compile-time `band` of two constant values. 
+ #[peepmatic(params(iNN, iNN), result(iNN))] + Band, + + /// Compile-time `bor` of two constant values. + #[peepmatic(params(iNN, iNN), result(iNN))] + Bor, + + /// Compile-time `bxor` of two constant values. + #[peepmatic(params(iNN, iNN), result(iNN))] + Bxor, + + /// Compile-time `iadd` of two constant values. + #[peepmatic(params(iNN, iNN), result(iNN))] + Iadd, + + /// Compile-time `imul` of two constant values. + #[peepmatic(params(iNN, iNN), result(iNN))] + Imul, + + /// Take the base-2 log of a power of two integer. + #[peepmatic(params(iNN), result(iNN))] + Log2, + + /// Wrapping negation of an integer. + #[peepmatic(params(iNN), result(iNN))] + Neg, +} + +/// A trait to represent a typing context. +/// +/// This is used by the macro-generated operator methods that create the type +/// variables for their immediates, parameters, and results. This trait is +/// implemented by the concrete typing context in `peepmatic/src/verify.rs`. +#[cfg(feature = "construct")] +pub trait TypingContext<'a> { + /// A type variable. + type TypeVariable; + + /// Create a condition code type. + fn cc(&mut self, span: wast::Span) -> Self::TypeVariable; + + /// Create a boolean type with a polymorphic bit width. + /// + /// Each use of `bNN` by the same operator refers to the same type variable. + #[allow(non_snake_case)] + fn bNN(&mut self, span: wast::Span) -> Self::TypeVariable; + + /// Create an integer type with a polymorphic bit width. + /// + /// Each use of `iNN` by the same operator refers to the same type variable. + #[allow(non_snake_case)] + fn iNN(&mut self, span: wast::Span) -> Self::TypeVariable; + + /// Create an integer type with a polymorphic bit width. + /// + /// Each use of `iMM` by the same operator refers to the same type variable. + #[allow(non_snake_case)] + fn iMM(&mut self, span: wast::Span) -> Self::TypeVariable; + + /// Create the CPU flags type variable. 
+ fn cpu_flags(&mut self, span: wast::Span) -> Self::TypeVariable; + + /// Create a boolean type of size one bit. + fn b1(&mut self, span: wast::Span) -> Self::TypeVariable; + + /// Create the void type, used as the result of operators that branch away, + /// or do not return anything. + fn void(&mut self, span: wast::Span) -> Self::TypeVariable; + + /// Create a type variable that may be either a boolean or an integer. + fn bool_or_int(&mut self, span: wast::Span) -> Self::TypeVariable; + + /// Create a type variable that can be any type T. + /// + /// Each use of `any_t` by the same operator refers to the same type + /// variable. + fn any_t(&mut self, span: wast::Span) -> Self::TypeVariable; +} diff --git a/cranelift/peepmatic/crates/runtime/src/optimizations.rs b/cranelift/peepmatic/crates/runtime/src/optimizations.rs new file mode 100644 index 0000000000..ff838ff720 --- /dev/null +++ b/cranelift/peepmatic/crates/runtime/src/optimizations.rs @@ -0,0 +1,74 @@ +//! Compiled peephole optimizations. + +use crate::error::Result; +use crate::instruction_set::InstructionSet; +use crate::integer_interner::IntegerInterner; +use crate::linear::{Action, MatchOp, MatchResult}; +use crate::optimizer::PeepholeOptimizer; +use crate::paths::PathInterner; +use peepmatic_automata::Automaton; +use serde::{Deserialize, Serialize}; + +#[cfg(feature = "construct")] +use std::fs; +#[cfg(feature = "construct")] +use std::path::Path; + +/// A compiled set of peephole optimizations. +/// +/// This is the compilation result of the `peepmatic` crate, after its taken a +/// bunch of optimizations written in the DSL and lowered and combined them. +#[derive(Debug, Serialize, Deserialize)] +pub struct PeepholeOptimizations { + /// The instruction paths referenced by the peephole optimizations. + pub paths: PathInterner, + + /// Not all integers we're matching on fit in the `u32` that we use as the + /// result of match operations. So we intern them and refer to them by id. 
+ pub integers: IntegerInterner, + + /// The underlying automata for matching optimizations' left-hand sides, and + /// building up the corresponding right-hand side. + pub automata: Automaton>, +} + +impl PeepholeOptimizations { + /// Deserialize a `PeepholeOptimizations` from bytes. + pub fn deserialize(serialized: &[u8]) -> Result { + let peep_opt: Self = bincode::deserialize(serialized)?; + Ok(peep_opt) + } + + /// Serialize these peephole optimizations out to the file at the given path. + /// + /// Requires that the `"construct"` cargo feature is enabled. + #[cfg(feature = "construct")] + pub fn serialize_to_file(&self, path: &Path) -> Result<()> { + let file = fs::File::create(path)?; + bincode::serialize_into(file, self)?; + Ok(()) + } + + /// Create a new peephole optimizer instance from this set of peephole + /// optimizations. + /// + /// The peephole optimizer instance can be used to apply these peephole + /// optimizations. When checking multiple instructions for whether they can + /// be optimized, it is more performant to reuse a single peephole optimizer + /// instance, rather than create a new one for each instruction. Reusing the + /// peephole optimizer instance allows the reuse of a few internal + /// allocations. + pub fn optimizer<'peep, 'ctx, I>(&'peep self, instr_set: I) -> PeepholeOptimizer<'peep, 'ctx, I> + where + I: InstructionSet<'ctx>, + { + PeepholeOptimizer { + peep_opt: self, + instr_set, + left_hand_sides: vec![], + right_hand_sides: vec![], + actions: vec![], + backtracking_states: vec![], + } + } +} diff --git a/cranelift/peepmatic/crates/runtime/src/optimizer.rs b/cranelift/peepmatic/crates/runtime/src/optimizer.rs new file mode 100644 index 0000000000..2cbf823a4b --- /dev/null +++ b/cranelift/peepmatic/crates/runtime/src/optimizer.rs @@ -0,0 +1,580 @@ +//! An optimizer for a set of peephole optimizations. 
+ +use crate::instruction_set::InstructionSet; +use crate::linear::{bool_to_match_result, Action, Else, MatchOp, MatchResult}; +use crate::operator::UnquoteOperator; +use crate::optimizations::PeepholeOptimizations; +use crate::part::{Constant, Part}; +use crate::r#type::{BitWidth, Type}; +use peepmatic_automata::State; +use std::convert::TryFrom; +use std::fmt::{self, Debug}; +use std::mem; +use std::num::NonZeroU32; + +/// A peephole optimizer instance that can apply a set of peephole +/// optimizations to instructions. +/// +/// These are created from a set of peephole optimizations with the +/// [`PeepholeOptimizer::instance`][crate::PeepholeOptimizer::instance] method. +/// +/// Reusing an instance when applying peephole optimizations to different +/// instruction sequences means that you reuse internal allocations that are +/// used to match left-hand sides and build up right-hand sides. +pub struct PeepholeOptimizer<'peep, 'ctx, I> +where + I: InstructionSet<'ctx>, +{ + pub(crate) peep_opt: &'peep PeepholeOptimizations, + pub(crate) instr_set: I, + pub(crate) left_hand_sides: Vec>, + pub(crate) right_hand_sides: Vec>, + pub(crate) actions: Vec, + pub(crate) backtracking_states: Vec<(State, usize)>, +} + +impl<'peep, 'ctx, I> Debug for PeepholeOptimizer<'peep, 'ctx, I> +where + I: InstructionSet<'ctx>, +{ + fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result { + let PeepholeOptimizer { + peep_opt, + instr_set: _, + left_hand_sides, + right_hand_sides, + actions, + backtracking_states, + } = self; + f.debug_struct("PeepholeOptimizer") + .field("peep_opt", peep_opt) + .field("instr_set", &"_") + .field("left_hand_sides", left_hand_sides) + .field("right_hand_sides", right_hand_sides) + .field("actions", actions) + .field("backtracking_states", backtracking_states) + .finish() + } +} + +impl<'peep, 'ctx, I> PeepholeOptimizer<'peep, 'ctx, I> +where + I: InstructionSet<'ctx>, +{ + fn eval_unquote_1(&self, operator: UnquoteOperator, a: Constant) -> Constant { + 
use Constant::*; + + macro_rules! map_int { + ( $c:expr , | $x:ident | $e:expr ) => { + match $c { + Int($x, w) => Int($e, w), + Bool(..) => panic!("not an integer"), + } + }; + } + + match operator { + UnquoteOperator::Log2 => map_int!(a, |x| x.trailing_zeros() as _), + UnquoteOperator::Neg => map_int!(a, |x| x.wrapping_neg()), + UnquoteOperator::Band + | UnquoteOperator::Bor + | UnquoteOperator::Bxor + | UnquoteOperator::Iadd + | UnquoteOperator::Imul => unreachable!("not a unary unquote operator: {:?}", operator), + } + } + + fn eval_unquote_2(&self, operator: UnquoteOperator, a: Constant, b: Constant) -> Constant { + use Constant::*; + + macro_rules! fold_ints { + ( $c1:expr , $c2:expr , | $x:ident , $y:ident | $e:expr ) => { + match ($c1, $c2) { + (Int($x, w1), Int($y, w2)) if w1 == w2 => Int($e, w1), + _ => panic!("not two integers of the same width"), + } + }; + } + + match operator { + UnquoteOperator::Band => fold_ints!(a, b, |x, y| x & y), + UnquoteOperator::Bor => fold_ints!(a, b, |x, y| x | y), + UnquoteOperator::Bxor => fold_ints!(a, b, |x, y| x ^ y), + UnquoteOperator::Iadd => fold_ints!(a, b, |x, y| x.wrapping_add(y)), + UnquoteOperator::Imul => fold_ints!(a, b, |x, y| x.wrapping_mul(y)), + UnquoteOperator::Log2 | UnquoteOperator::Neg => { + unreachable!("not a binary unquote operator: {:?}", operator) + } + } + } + + fn eval_actions(&mut self, context: &mut I::Context, root: I::Instruction) { + let mut actions = mem::replace(&mut self.actions, vec![]); + + for action in actions.drain(..) 
{ + log::trace!("Evaluating action: {:?}", action); + match action { + Action::GetLhs { path } => { + let path = self.peep_opt.paths.lookup(path); + let lhs = self + .instr_set + .get_part_at_path(context, root, path) + .expect("should always get part at path OK by the time it is bound"); + self.right_hand_sides.push(lhs); + } + Action::UnaryUnquote { operator, operand } => { + let operand = self.right_hand_sides[operand.0 as usize]; + let operand = match operand { + Part::Instruction(i) => self + .instr_set + .instruction_to_constant(context, i) + .expect("cannot convert instruction to constant for unquote operand"), + Part::Constant(c) => c, + Part::ConditionCode(_) => { + panic!("cannot use a condition code as an unquote operand") + } + }; + let result = self.eval_unquote_1(operator, operand); + self.right_hand_sides.push(result.into()); + } + Action::BinaryUnquote { operator, operands } => { + let a = self.right_hand_sides[operands[0].0 as usize]; + let a = match a { + Part::Instruction(i) => self + .instr_set + .instruction_to_constant(context, i) + .expect("cannot convert instruction to constant for unquote operand"), + Part::Constant(c) => c, + Part::ConditionCode(_) => { + panic!("cannot use a condition code as an unquote operand") + } + }; + + let b = self.right_hand_sides[operands[1].0 as usize]; + let b = match b { + Part::Instruction(i) => self + .instr_set + .instruction_to_constant(context, i) + .expect("cannot convert instruction to constant for unquote operand"), + Part::Constant(c) => c, + Part::ConditionCode(_) => { + panic!("cannot use a condition code as an unquote operand") + } + }; + + let result = self.eval_unquote_2(operator, a, b); + self.right_hand_sides.push(result.into()); + } + Action::MakeIntegerConst { + value, + mut bit_width, + } => { + let value = self.peep_opt.integers.lookup(value); + if bit_width.is_polymorphic() { + bit_width = BitWidth::try_from( + self.instr_set.instruction_result_bit_width(context, root), + ) + .unwrap(); + 
} + self.right_hand_sides + .push(Constant::Int(value, bit_width).into()); + } + Action::MakeBooleanConst { + value, + mut bit_width, + } => { + if bit_width.is_polymorphic() { + bit_width = BitWidth::try_from( + self.instr_set.instruction_result_bit_width(context, root), + ) + .unwrap(); + } + self.right_hand_sides + .push(Constant::Bool(value, bit_width).into()); + } + Action::MakeConditionCode { cc } => { + self.right_hand_sides.push(Part::ConditionCode(cc)); + } + Action::MakeUnaryInst { + operator, + r#type: + Type { + kind, + mut bit_width, + }, + operand, + } => { + if bit_width.is_polymorphic() { + bit_width = BitWidth::try_from( + self.instr_set.instruction_result_bit_width(context, root), + ) + .unwrap(); + } + let ty = Type { kind, bit_width }; + let operand = self.right_hand_sides[operand.0 as usize]; + let inst = self + .instr_set + .make_inst_1(context, root, operator, ty, operand); + self.right_hand_sides.push(Part::Instruction(inst)); + } + Action::MakeBinaryInst { + operator, + r#type: + Type { + kind, + mut bit_width, + }, + operands, + } => { + if bit_width.is_polymorphic() { + bit_width = BitWidth::try_from( + self.instr_set.instruction_result_bit_width(context, root), + ) + .unwrap(); + } + let ty = Type { kind, bit_width }; + let a = self.right_hand_sides[operands[0].0 as usize]; + let b = self.right_hand_sides[operands[1].0 as usize]; + let inst = self + .instr_set + .make_inst_2(context, root, operator, ty, a, b); + self.right_hand_sides.push(Part::Instruction(inst)); + } + Action::MakeTernaryInst { + operator, + r#type: + Type { + kind, + mut bit_width, + }, + operands, + } => { + if bit_width.is_polymorphic() { + bit_width = BitWidth::try_from( + self.instr_set.instruction_result_bit_width(context, root), + ) + .unwrap(); + } + let ty = Type { kind, bit_width }; + let a = self.right_hand_sides[operands[0].0 as usize]; + let b = self.right_hand_sides[operands[1].0 as usize]; + let c = self.right_hand_sides[operands[2].0 as usize]; + let 
inst = self + .instr_set + .make_inst_3(context, root, operator, ty, a, b, c); + self.right_hand_sides.push(Part::Instruction(inst)); + } + } + } + + // Reuse the heap elements allocation. + self.actions = actions; + } + + fn eval_match_op( + &mut self, + context: &mut I::Context, + root: I::Instruction, + match_op: MatchOp, + ) -> MatchResult { + use crate::linear::MatchOp::*; + + log::trace!("Evaluating match operation: {:?}", match_op); + let result: MatchResult = (|| match match_op { + Opcode { path } => { + let path = self.peep_opt.paths.lookup(path); + let part = self + .instr_set + .get_part_at_path(context, root, path) + .ok_or(Else)?; + let inst = part.as_instruction().ok_or(Else)?; + let op = self.instr_set.operator(context, inst).ok_or(Else)?; + let op = op as u32; + debug_assert!( + op != 0, + "`Operator` doesn't have any variant represented + with zero" + ); + Ok(unsafe { NonZeroU32::new_unchecked(op as u32) }) + } + IsConst { path } => { + let path = self.peep_opt.paths.lookup(path); + let part = self + .instr_set + .get_part_at_path(context, root, path) + .ok_or(Else)?; + let is_const = match part { + Part::Instruction(i) => { + self.instr_set.instruction_to_constant(context, i).is_some() + } + Part::ConditionCode(_) | Part::Constant(_) => true, + }; + bool_to_match_result(is_const) + } + IsPowerOfTwo { path } => { + let path = self.peep_opt.paths.lookup(path); + let part = self + .instr_set + .get_part_at_path(context, root, path) + .ok_or(Else)?; + match part { + Part::Constant(c) => { + let is_pow2 = c.as_int().unwrap().is_power_of_two(); + bool_to_match_result(is_pow2) + } + Part::Instruction(i) => { + let c = self + .instr_set + .instruction_to_constant(context, i) + .ok_or(Else)?; + let is_pow2 = c.as_int().unwrap().is_power_of_two(); + bool_to_match_result(is_pow2) + } + Part::ConditionCode(_) => unreachable!( + "IsPowerOfTwo on a condition + code" + ), + } + } + BitWidth { path } => { + let path = self.peep_opt.paths.lookup(path); + let part 
= self + .instr_set + .get_part_at_path(context, root, path) + .ok_or(Else)?; + let bit_width = match part { + Part::Instruction(i) => self.instr_set.instruction_result_bit_width(context, i), + Part::Constant(Constant::Int(_, w)) | Part::Constant(Constant::Bool(_, w)) => { + w.fixed_width().unwrap_or_else(|| { + self.instr_set.instruction_result_bit_width(context, root) + }) + } + Part::ConditionCode(_) => panic!("BitWidth on condition code"), + }; + debug_assert!( + bit_width != 0, + "`InstructionSet` implementors must uphold the contract that \ + `instruction_result_bit_width` returns one of 1, 8, 16, 32, 64, or 128" + ); + Ok(unsafe { NonZeroU32::new_unchecked(bit_width as u32) }) + } + FitsInNativeWord { path } => { + let native_word_size = self.instr_set.native_word_size_in_bits(context); + debug_assert!(native_word_size.is_power_of_two()); + + let path = self.peep_opt.paths.lookup(path); + let part = self + .instr_set + .get_part_at_path(context, root, path) + .ok_or(Else)?; + let fits = match part { + Part::Instruction(i) => { + let size = self.instr_set.instruction_result_bit_width(context, i); + size <= native_word_size + } + Part::Constant(c) => { + let root_width = self.instr_set.instruction_result_bit_width(context, root); + let size = c.bit_width(root_width); + size <= native_word_size + } + Part::ConditionCode(_) => panic!("FitsInNativeWord on condition code"), + }; + bool_to_match_result(fits) + } + Eq { path_a, path_b } => { + let path_a = self.peep_opt.paths.lookup(path_a); + let part_a = self + .instr_set + .get_part_at_path(context, root, path_a) + .ok_or(Else)?; + let path_b = self.peep_opt.paths.lookup(path_b); + let part_b = self + .instr_set + .get_part_at_path(context, root, path_b) + .ok_or(Else)?; + let eq = match (part_a, part_b) { + (Part::Instruction(inst), Part::Constant(c1)) + | (Part::Constant(c1), Part::Instruction(inst)) => { + match self.instr_set.instruction_to_constant(context, inst) { + Some(c2) => c1 == c2, + None => false, + 
} + } + (a, b) => a == b, + }; + bool_to_match_result(eq) + } + IntegerValue { path } => { + let path = self.peep_opt.paths.lookup(path); + let part = self + .instr_set + .get_part_at_path(context, root, path) + .ok_or(Else)?; + match part { + Part::Constant(c) => { + let x = c.as_int().ok_or(Else)?; + let id = self.peep_opt.integers.already_interned(x).ok_or(Else)?; + Ok(id.into()) + } + Part::Instruction(i) => { + let c = self + .instr_set + .instruction_to_constant(context, i) + .ok_or(Else)?; + let x = c.as_int().ok_or(Else)?; + let id = self.peep_opt.integers.already_interned(x).ok_or(Else)?; + Ok(id.into()) + } + Part::ConditionCode(_) => unreachable!("IntegerValue on condition code"), + } + } + BooleanValue { path } => { + let path = self.peep_opt.paths.lookup(path); + let part = self + .instr_set + .get_part_at_path(context, root, path) + .ok_or(Else)?; + match part { + Part::Constant(c) => { + let b = c.as_bool().ok_or(Else)?; + bool_to_match_result(b) + } + Part::Instruction(i) => { + let c = self + .instr_set + .instruction_to_constant(context, i) + .ok_or(Else)?; + let b = c.as_bool().ok_or(Else)?; + bool_to_match_result(b) + } + Part::ConditionCode(_) => unreachable!("IntegerValue on condition code"), + } + } + ConditionCode { path } => { + let path = self.peep_opt.paths.lookup(path); + let part = self + .instr_set + .get_part_at_path(context, root, path) + .ok_or(Else)?; + let cc = part.as_condition_code().ok_or(Else)?; + let cc = cc as u32; + debug_assert!(cc != 0); + Ok(unsafe { NonZeroU32::new_unchecked(cc) }) + } + MatchOp::Nop => Err(Else), + })(); + log::trace!("Evaluated match operation: {:?} = {:?}", match_op, result); + result + } + + /// Attempt to apply a single peephole optimization to the given root + /// instruction. + /// + /// If an optimization is applied, then the `root` is replaced with the + /// optimization's right-hand side, and the root of the right-hand side is + /// returned as `Some`. 
+ /// + /// If no optimization's left-hand side matches `root`, then `root` is left + /// untouched and `None` is returned. + pub fn apply_one( + &mut self, + context: &mut I::Context, + root: I::Instruction, + ) -> Option { + log::trace!("PeepholeOptimizer::apply_one"); + + self.backtracking_states.clear(); + self.actions.clear(); + self.left_hand_sides.clear(); + self.right_hand_sides.clear(); + + let mut r#final = None; + + let mut query = self.peep_opt.automata.query(); + loop { + log::trace!("Current state: {:?}", query.current_state()); + + if query.is_in_final_state() { + // If we're in a final state (which means an optimization is + // applicable) then record that fact, but keep going. We don't + // want to stop yet, because we might discover another, + // more-specific optimization that is also applicable if we keep + // going. And we always want to apply the most specific + // optimization that matches. + log::trace!("Found a match at state {:?}", query.current_state()); + r#final = Some((query.current_state(), self.actions.len())); + } + + // Anything following a `Else` transition doesn't care about the + // result of this match operation, so if we partially follow the + // current non-`Else` path, but don't ultimately find a matching + // optimization, we want to be able to backtrack to this state and + // then try taking the `Else` transition. 
+ if query.has_transition_on(&Err(Else)) { + self.backtracking_states + .push((query.current_state(), self.actions.len())); + } + + let match_op = match query.current_state_data() { + None => break, + Some(op) => op, + }; + + let input = self.eval_match_op(context, root, *match_op); + + let actions = if let Some(actions) = query.next(&input) { + actions + } else if r#final.is_some() { + break; + } else if let Some((state, actions_len)) = self.backtracking_states.pop() { + query.go_to_state(state); + self.actions.truncate(actions_len); + query + .next(&Err(Else)) + .expect("backtracking states always have `Else` transitions") + } else { + break; + }; + + self.actions.extend(actions.iter().copied()); + } + + // If `final` is none, then we didn't encounter any final states, so + // there are no applicable optimizations. + let (final_state, actions_len) = match r#final { + Some(f) => f, + None => { + log::trace!("No optimizations matched"); + return None; + } + }; + + // Go to the last final state we saw, reset the LHS and RHS to how + // they were at the time we saw the final state, and process the + // final actions. + self.actions.truncate(actions_len); + query.go_to_state(final_state); + let final_actions = query.finish().expect("should be in a final state"); + self.actions.extend(final_actions.iter().copied()); + self.eval_actions(context, root); + + // And finally, the root of the RHS for this optimization is the + // last entry in `self.right_hand_sides`, so replace the old root + // instruction with this one! + let result = self.right_hand_sides.pop().unwrap(); + let new_root = self.instr_set.replace_instruction(context, root, result); + Some(new_root) + } + + /// Keep applying peephole optimizations to the given instruction until none + /// can be applied anymore. 
+ pub fn apply_all(&mut self, context: &mut I::Context, mut inst: I::Instruction) { + loop { + if let Some(new_inst) = self.apply_one(context, inst) { + inst = new_inst; + } else { + break; + } + } + } +} diff --git a/cranelift/peepmatic/crates/runtime/src/part.rs b/cranelift/peepmatic/crates/runtime/src/part.rs new file mode 100644 index 0000000000..6190b8e980 --- /dev/null +++ b/cranelift/peepmatic/crates/runtime/src/part.rs @@ -0,0 +1,128 @@ +//! Parts of instructions. + +use crate::cc::ConditionCode; +use crate::r#type::BitWidth; +use std::fmt::Debug; + +/// A constant value. +/// +/// Whether an integer is interpreted as signed or unsigned depends on the +/// operations applied to it. +#[derive(Copy, Clone, Debug, PartialEq, Eq)] +pub enum Constant { + /// A boolean of the given width. + Bool(bool, BitWidth), + + /// An integer constant of the given width, + Int(u64, BitWidth), +} + +/// A part of an instruction, or a whole instruction itself. +/// +/// These are the different values that can be matched in an optimization's +/// left-hand side and then built up in its right-hand side. +#[derive(Copy, Clone, Debug, PartialEq, Eq)] +pub enum Part +where + I: Copy + Debug + Eq, +{ + /// An instruction (or result of an instruction). + Instruction(I), + + /// A constant value. + Constant(Constant), + + /// A condition code. + ConditionCode(ConditionCode), +} + +impl From for Part +where + I: Copy + Debug + Eq, +{ + #[inline] + fn from(c: Constant) -> Part { + Part::Constant(c) + } +} + +impl From for Part +where + I: Copy + Debug + Eq, +{ + #[inline] + fn from(c: ConditionCode) -> Part { + Part::ConditionCode(c) + } +} + +macro_rules! accessors { + ( $( $variant:ident , $result:ty , $getter:ident , $is:ident , $unwrap:ident ; )* ) => { + $( + #[inline] + #[allow(missing_docs)] + pub fn $getter(&self) -> Option<$result> { + match *self { + Self::$variant(x, ..) 
=> Some(x), + _ => None + } + } + + #[inline] + #[allow(missing_docs)] + pub fn $is(&self) -> bool { + self.$getter().is_some() + } + + #[inline] + #[allow(missing_docs)] + pub fn $unwrap(&self) -> $result { + self.$getter().expect(concat!("failed to unwrap `", stringify!($variant), "`")) + } + )* + } +} + +impl Constant { + /// If this is any kind of integer constant, get it as a 64-bit unsigned + /// integer. + pub fn as_int(&self) -> Option { + match *self { + Constant::Bool(..) => None, + Constant::Int(x, _) => Some(x), + } + } + + /// If this is any kind of boolean constant, get its value. + pub fn as_bool(&self) -> Option { + match *self { + Constant::Bool(b, _) => Some(b), + Constant::Int(..) => None, + } + } + + /// The number of bits required to represent this constant value's type. + pub fn bit_width(&self, root_width: u8) -> u8 { + match *self { + Constant::Bool(_, w) | Constant::Int(_, w) => { + if let Some(w) = w.fixed_width() { + w + } else { + debug_assert!(w.is_polymorphic()); + root_width + } + } + } + } +} + +impl Part +where + I: Copy + Debug + Eq, +{ + accessors! { + Instruction, I, as_instruction, is_instruction, unwrap_instruction; + Constant, Constant, as_constant, is_constant, unwrap_constant; + ConditionCode, ConditionCode, as_condition_code, is_condition_code, unwrap_condition_code; + } +} diff --git a/cranelift/peepmatic/crates/runtime/src/paths.rs b/cranelift/peepmatic/crates/runtime/src/paths.rs new file mode 100644 index 0000000000..f824f19a74 --- /dev/null +++ b/cranelift/peepmatic/crates/runtime/src/paths.rs @@ -0,0 +1,242 @@ +//! Representing paths through the dataflow graph. +//! +//! Paths are relative from a *root* instruction, which is the instruction we +//! are determining which, if any, optimizations apply. +//! +//! Paths are series of indices through each instruction's children as we +//! traverse down the graph from the root. Children are immediates followed by +//! 
arguments: `[imm0, imm1, ..., immN, arg0, arg1, ..., argN]`. +//! +//! ## Examples +//! +//! * `[0]` is the path to the root. +//! * `[0, 0]` is the path to the root's first child. +//! * `[0, 1]` is the path to the root's second child. +//! * `[0, 1, 0]` is the path to the root's second child's first child. +//! +//! ## Interning +//! +//! To avoid extra allocations, de-duplicate paths, and reference them via a +//! fixed-length value, we intern paths inside a `PathInterner` and then +//! reference them via `PathId`. + +// TODO: Make `[]` the path to the root, and get rid of this redundant leading +// zero that is currently in every single path. + +use serde::de::{Deserializer, SeqAccess, Visitor}; +use serde::ser::{SerializeSeq, Serializer}; +use serde::{Deserialize, Serialize}; +use std::collections::HashMap; +use std::convert::TryInto; +use std::fmt; +use std::hash::{Hash, Hasher}; +use std::marker::PhantomData; + +/// A path through the data-flow graph from the root instruction. +#[derive(Clone, Copy, Debug, PartialEq, Eq, Serialize, Deserialize)] +pub struct Path<'a>(pub &'a [u8]); + +impl Path<'_> { + /// Construct a new path through the data-flow graph from the root + /// instruction. + pub fn new(path: &impl AsRef<[u8]>) -> Path { + Path(path.as_ref()) + } +} + +/// An identifier for an interned path. +#[derive(Clone, Copy, Debug, PartialEq, Eq, Hash, Serialize, Deserialize)] +pub struct PathId(u16); + +/// An interner and de-duplicator for `Path`s. +/// +/// Can be serialized and deserialized while maintaining the same id to interned +/// path mapping. +#[derive(Debug, Default)] +pub struct PathInterner { + /// A map from a path (whose owned data is inside `arena`) to the canonical + /// `PathId` we assigned it when interning it. + map: HashMap, + + /// A map from a `PathId` index to an unsafe, self-borrowed path pointing + /// into `arena`. 
It is safe to given these out as safe `Path`s, as long as + /// the lifetime is not longer than this `PathInterner`'s lifetime. + paths: Vec, + + /// Bump allocation arena for path data. The bump arena ensures that these + /// allocations never move, and are therefore safe for self-references. + arena: bumpalo::Bump, +} + +impl PathInterner { + /// Construct a new, empty `PathInterner`. + #[inline] + pub fn new() -> Self { + Self::default() + } + + /// Intern a path into this `PathInterner`, returning its canonical + /// `PathId`. + /// + /// If we've already interned this path before, then the existing id we + /// already assigned to it is returned. If we've never seen this path + /// before, then it is copied into this `PathInterner` and a new id is + /// assigned to it. + #[inline] + pub fn intern<'a>(&mut self, path: Path<'a>) -> PathId { + let unsafe_path = unsafe { UnsafePath::from_path(&path) }; + if let Some(id) = self.map.get(&unsafe_path) { + return *id; + } + self.intern_new(path) + } + + #[inline(never)] + fn intern_new<'a>(&mut self, path: Path<'a>) -> PathId { + let id: u16 = self + .paths + .len() + .try_into() + .expect("too many paths interned"); + let id = PathId(id); + + let our_path = self.arena.alloc_slice_copy(&path.0); + let unsafe_path = unsafe { UnsafePath::from_slice(&our_path) }; + + self.paths.push(unsafe_path.clone()); + let old = self.map.insert(unsafe_path, id); + + debug_assert!(old.is_none()); + debug_assert_eq!(self.lookup(id), path); + debug_assert_eq!(self.intern(path), id); + + id + } + + /// Lookup a previously interned path by id. + #[inline] + pub fn lookup<'a>(&'a self, id: PathId) -> Path<'a> { + let unsafe_path = self + .paths + .get(id.0 as usize) + .unwrap_or_else(|| Self::lookup_failure()); + unsafe { unsafe_path.as_path() } + } + + #[inline(never)] + fn lookup_failure() -> ! 
{ + panic!( + "no path for the given id; this can only happen when mixing `PathId`s with different \ + `PathInterner`s" + ) + } +} + +impl Serialize for PathInterner { + fn serialize(&self, serializer: S) -> Result + where + S: Serializer, + { + let mut seq = serializer.serialize_seq(Some(self.paths.len()))?; + for p in &self.paths { + let p = unsafe { p.as_path() }; + seq.serialize_element(&p)?; + } + seq.end() + } +} + +impl<'de> Deserialize<'de> for PathInterner { + fn deserialize(deserializer: D) -> Result + where + D: Deserializer<'de>, + { + deserializer.deserialize_seq(PathInternerVisitor { + marker: PhantomData, + }) + } +} + +struct PathInternerVisitor { + marker: PhantomData PathInterner>, +} + +impl<'de> Visitor<'de> for PathInternerVisitor { + type Value = PathInterner; + + fn expecting(&self, formatter: &mut fmt::Formatter) -> fmt::Result { + write!(formatter, "a `peepmatic_runtime::paths::PathInterner`") + } + + fn visit_seq(self, mut access: M) -> Result + where + M: SeqAccess<'de>, + { + const DEFAULT_CAPACITY: usize = 16; + let capacity = access.size_hint().unwrap_or(DEFAULT_CAPACITY); + + let mut interner = PathInterner { + map: HashMap::with_capacity(capacity), + paths: Vec::with_capacity(capacity), + arena: bumpalo::Bump::new(), + }; + + while let Some(path) = access.next_element::()? { + interner.intern(path); + } + + Ok(interner) + } +} + +/// An unsafe, unchecked borrow of a path. Not for use outside of +/// `PathInterner`! +#[derive(Clone, Debug)] +struct UnsafePath { + ptr: *const u8, + len: usize, +} + +impl PartialEq for UnsafePath { + fn eq(&self, rhs: &UnsafePath) -> bool { + unsafe { self.as_slice() == rhs.as_slice() } + } +} + +impl Eq for UnsafePath {} + +impl Hash for UnsafePath { + fn hash(&self, hasher: &mut H) + where + H: Hasher, + { + unsafe { self.as_slice().hash(hasher) } + } +} + +/// Safety: callers must ensure that the constructed values won't have unsafe +/// usages of `PartialEq`, `Eq`, or `Hash`. 
+impl UnsafePath { + unsafe fn from_path(p: &Path) -> Self { + Self::from_slice(&p.0) + } + + unsafe fn from_slice(s: &[u8]) -> Self { + UnsafePath { + ptr: s.as_ptr(), + len: s.len(), + } + } +} + +/// Safety: callers must ensure that `'a` does not outlive the lifetime of the +/// underlying data. +impl UnsafePath { + unsafe fn as_slice<'a>(&self) -> &'a [u8] { + std::slice::from_raw_parts(self.ptr, self.len) + } + + unsafe fn as_path<'a>(&self) -> Path<'a> { + Path(self.as_slice()) + } +} diff --git a/cranelift/peepmatic/crates/runtime/src/type.rs b/cranelift/peepmatic/crates/runtime/src/type.rs new file mode 100644 index 0000000000..e4a08c9851 --- /dev/null +++ b/cranelift/peepmatic/crates/runtime/src/type.rs @@ -0,0 +1,262 @@ +//! Types. + +use serde::{Deserialize, Serialize}; +use std::convert::TryFrom; +use std::fmt; + +/// A bit width of a type. +#[derive(Clone, Copy, Debug, PartialEq, Eq, Hash, Serialize, Deserialize)] +#[repr(u8)] +pub enum BitWidth { + /// Polymorphic over bit width, with the same width as the root of the + /// optimization's LHS and RHS. + Polymorphic = 0, + + /// A fixed bit width of 1. + One = 1, + + /// A fixed bit width of 8. + Eight = 8, + + /// A fixed bit width of 16. + Sixteen = 16, + + /// A fixed bit width of 32. + ThirtyTwo = 32, + + /// A fixed bit width of 64. + SixtyFour = 64, + + /// A fixed bit width of 128. + OneTwentyEight = 128, +} + +/// The kind of type we are looking at: either an integer kind or boolean kind. +#[derive(Clone, Copy, Debug, PartialEq, Eq, Hash, Serialize, Deserialize)] +pub enum Kind { + /// Integer kind. + Int, + + /// Boolean kind. + Bool, + + /// CPU flags kind. + CpuFlags, + + /// Void kind. + Void, +} + +/// A type a value or the result of an operation. +#[allow(missing_docs)] +#[derive(Clone, Copy, Debug, PartialEq, Eq, Hash, Serialize, Deserialize)] +pub struct Type { + /// This type's kind. + pub kind: Kind, + + /// This type's bit width. 
+ pub bit_width: BitWidth, +} + +impl TryFrom for BitWidth { + type Error = &'static str; + + #[inline] + fn try_from(x: u8) -> Result { + Ok(match x { + 1 => Self::One, + 8 => Self::Eight, + 16 => Self::Sixteen, + 32 => Self::ThirtyTwo, + 64 => Self::SixtyFour, + 128 => Self::OneTwentyEight, + _ => return Err("not a valid bit width"), + }) + } +} + +impl fmt::Display for Type { + fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result { + match self.kind { + Kind::CpuFlags => return write!(f, "cpu-flags"), + Kind::Void => return write!(f, "void"), + Kind::Int => write!(f, "i")?, + Kind::Bool => write!(f, "b")?, + } + match self.bit_width { + BitWidth::Polymorphic => write!(f, "NN"), + otherwise => write!(f, "{}", otherwise as u8), + } + } +} + +impl BitWidth { + /// Is this a polymorphic bit width? + pub fn is_polymorphic(&self) -> bool { + matches!(self, BitWidth::Polymorphic) + } + + /// Get this width in bits, unless this is a polymorphic bit width. + pub fn fixed_width(&self) -> Option { + if self.is_polymorphic() { + None + } else { + Some(*self as u8) + } + } +} + +macro_rules! type_ctors { + ( $( $( #[$attr:meta] )* $name:ident ( $kind:ident , $width:ident ) ; )* ) => { + $( + $( #[$attr] )* + pub const fn $name() -> Self { + Type { + kind: Kind::$kind, + bit_width: BitWidth::$width, + } + } + )* + } +} + +impl Type { + type_ctors! { + /// Get the `i1` type. + i1(Int, One); + /// Get the `i8` type. + i8(Int, Eight); + /// Get the `i16` type. + i16(Int, Sixteen); + /// Get the `i32` type. + i32(Int, ThirtyTwo); + /// Get the `i64` type. + i64(Int, SixtyFour); + /// Get the `i128` type. + i128(Int, OneTwentyEight); + /// Get the `b1` type. + b1(Bool, One); + /// Get the `b8` type. + b8(Bool, Eight); + /// Get the `b16` type. + b16(Bool, Sixteen); + /// Get the `b32` type. + b32(Bool, ThirtyTwo); + /// Get the `b64` type. + b64(Bool, SixtyFour); + /// Get the `b128` type. + b128(Bool, OneTwentyEight); + /// Get the CPU flags type. 
+ cpu_flags(CpuFlags, One); + /// Get the void type. + void(Void, One); + } +} + +#[cfg(feature = "construct")] +mod tok { + use wast::custom_keyword; + custom_keyword!(b1); + custom_keyword!(b8); + custom_keyword!(b16); + custom_keyword!(b32); + custom_keyword!(b64); + custom_keyword!(b128); + custom_keyword!(i1); + custom_keyword!(i8); + custom_keyword!(i16); + custom_keyword!(i32); + custom_keyword!(i64); + custom_keyword!(i128); +} + +#[cfg(feature = "construct")] +impl<'a> wast::parser::Parse<'a> for Type { + fn parse(p: wast::parser::Parser<'a>) -> wast::parser::Result { + if p.peek::() { + p.parse::()?; + return Ok(Type { + kind: Kind::Bool, + bit_width: BitWidth::One, + }); + } + if p.peek::() { + p.parse::()?; + return Ok(Type { + kind: Kind::Bool, + bit_width: BitWidth::Eight, + }); + } + if p.peek::() { + p.parse::()?; + return Ok(Type { + kind: Kind::Bool, + bit_width: BitWidth::Sixteen, + }); + } + if p.peek::() { + p.parse::()?; + return Ok(Type { + kind: Kind::Bool, + bit_width: BitWidth::ThirtyTwo, + }); + } + if p.peek::() { + p.parse::()?; + return Ok(Type { + kind: Kind::Bool, + bit_width: BitWidth::SixtyFour, + }); + } + if p.peek::() { + p.parse::()?; + return Ok(Type { + kind: Kind::Bool, + bit_width: BitWidth::OneTwentyEight, + }); + } + if p.peek::() { + p.parse::()?; + return Ok(Type { + kind: Kind::Int, + bit_width: BitWidth::One, + }); + } + if p.peek::() { + p.parse::()?; + return Ok(Type { + kind: Kind::Int, + bit_width: BitWidth::Eight, + }); + } + if p.peek::() { + p.parse::()?; + return Ok(Type { + kind: Kind::Int, + bit_width: BitWidth::Sixteen, + }); + } + if p.peek::() { + p.parse::()?; + return Ok(Type { + kind: Kind::Int, + bit_width: BitWidth::ThirtyTwo, + }); + } + if p.peek::() { + p.parse::()?; + return Ok(Type { + kind: Kind::Int, + bit_width: BitWidth::SixtyFour, + }); + } + if p.peek::() { + p.parse::()?; + return Ok(Type { + kind: Kind::Int, + bit_width: BitWidth::OneTwentyEight, + }); + } + Err(p.error("expected an 
ascribed type")) + } +} diff --git a/cranelift/peepmatic/crates/test/Cargo.toml b/cranelift/peepmatic/crates/test/Cargo.toml new file mode 100644 index 0000000000..bca85f8bf8 --- /dev/null +++ b/cranelift/peepmatic/crates/test/Cargo.toml @@ -0,0 +1,14 @@ +[package] +name = "peepmatic-test" +version = "0.1.0" +authors = ["Nick Fitzgerald "] +edition = "2018" +publish = false + +# See more keys and their definitions at https://doc.rust-lang.org/cargo/reference/manifest.html + +[dependencies] +env_logger = "0.7.1" +log = "0.4.8" +peepmatic = { path = "../.." } +peepmatic-runtime = { path = "../runtime" } diff --git a/cranelift/peepmatic/crates/test/src/lib.rs b/cranelift/peepmatic/crates/test/src/lib.rs new file mode 100644 index 0000000000..f74e9b7c53 --- /dev/null +++ b/cranelift/peepmatic/crates/test/src/lib.rs @@ -0,0 +1,535 @@ +//! Testing utilities and a testing-only instruction set for `peepmatic`. + +#![deny(missing_debug_implementations)] + +use peepmatic_runtime::{ + cc::ConditionCode, + instruction_set::InstructionSet, + operator::Operator, + part::{Constant, Part}, + paths::Path, + r#type::{BitWidth, Kind, Type}, +}; +use std::cell::RefCell; +use std::collections::BTreeMap; +use std::convert::TryFrom; + +#[derive(Clone, Copy, PartialEq, Eq, PartialOrd, Ord, Hash, Debug)] +pub struct Instruction(pub usize); + +#[derive(Debug)] +pub struct InstructionData { + pub operator: Operator, + pub r#type: Type, + pub immediates: Vec, + pub arguments: Vec, +} + +#[derive(Clone, Copy, Debug, PartialEq, Eq)] +pub enum Immediate { + Constant(Constant), + ConditionCode(ConditionCode), +} + +impl Immediate { + fn unwrap_constant(&self) -> Constant { + match *self { + Immediate::Constant(c) => c, + _ => panic!("not a constant"), + } + } +} + +impl From for Immediate { + fn from(c: Constant) -> Immediate { + Immediate::Constant(c) + } +} + +impl From for Immediate { + fn from(cc: ConditionCode) -> Immediate { + Immediate::ConditionCode(cc) + } +} + +impl From for Part { + fn 
from(imm: Immediate) -> Part { + match imm { + Immediate::Constant(c) => Part::Constant(c), + Immediate::ConditionCode(cc) => Part::ConditionCode(cc), + } + } +} + +impl TryFrom> for Immediate { + type Error = &'static str; + + fn try_from(part: Part) -> Result { + match part { + Part::Constant(c) => Ok(Immediate::Constant(c)), + Part::ConditionCode(c) => Ok(Immediate::ConditionCode(c)), + Part::Instruction(_) => Err("instruction parts cannot be converted into immediates"), + } + } +} + +#[derive(Debug, Default)] +pub struct Program { + instr_counter: usize, + instruction_data: BTreeMap, + replacements: RefCell>, +} + +impl Program { + /// Are `a` and `b` structurally equivalent, even if they use different + /// `Instruction`s for various arguments? + pub fn structurally_eq(&mut self, a: Instruction, b: Instruction) -> bool { + macro_rules! ensure_eq { + ($a:expr, $b:expr) => {{ + let a = &$a; + let b = &$b; + if a != b { + log::debug!( + "{} != {} ({:?} != {:?})", + stringify!($a), + stringify!($b), + a, + b + ); + return false; + } + }}; + } + + let a = self.resolve(a); + let b = self.resolve(b); + if a == b { + return true; + } + + let a = self.data(a); + let b = self.data(b); + log::debug!("structurally_eq({:?}, {:?})", a, b); + + ensure_eq!(a.operator, b.operator); + ensure_eq!(a.r#type, b.r#type); + ensure_eq!(a.immediates, b.immediates); + ensure_eq!(a.arguments.len(), b.arguments.len()); + a.arguments + .clone() + .into_iter() + .zip(b.arguments.clone().into_iter()) + .all(|(a, b)| self.structurally_eq(a, b)) + } + + pub fn instructions(&self) -> impl Iterator { + self.instruction_data.iter().map(|(k, v)| (*k, v)) + } + + pub fn replace_instruction(&mut self, old: Instruction, new: Instruction) { + log::debug!("replacing {:?} with {:?}", old, new); + + let old = self.resolve(old); + let new = self.resolve(new); + if old == new { + return; + } + + let mut replacements = self.replacements.borrow_mut(); + let existing_replacement = replacements.insert(old, 
new); + assert!(existing_replacement.is_none()); + + let old_data = self.instruction_data.remove(&old); + assert!(old_data.is_some()); + } + + pub fn resolve(&self, inst: Instruction) -> Instruction { + let mut replacements = self.replacements.borrow_mut(); + let mut replacements_followed = 0; + let mut resolved = inst; + while let Some(i) = replacements.get(&resolved).cloned() { + log::trace!("resolving replaced instruction: {:?} -> {:?}", resolved, i); + replacements_followed += 1; + assert!( + replacements_followed <= replacements.len(), + "cyclic replacements" + ); + + resolved = i; + continue; + } + + if inst != resolved { + let old_replacement = replacements.insert(inst, resolved); + assert!(old_replacement.is_some()); + } + + resolved + } + + pub fn data(&self, inst: Instruction) -> &InstructionData { + let inst = self.resolve(inst); + &self.instruction_data[&inst] + } + + pub fn new_instruction( + &mut self, + operator: Operator, + r#type: Type, + immediates: Vec, + arguments: Vec, + ) -> Instruction { + assert_eq!( + operator.immediates_arity() as usize, + immediates.len(), + "wrong number of immediates for {:?}: expected {}, found {}", + operator, + operator.immediates_arity(), + immediates.len(), + ); + assert_eq!( + operator.params_arity() as usize, + arguments.len(), + "wrong number of arguments for {:?}: expected {}, found {}", + operator, + operator.params_arity(), + arguments.len(), + ); + + assert!(!r#type.bit_width.is_polymorphic()); + assert!(immediates.iter().all(|imm| match imm { + Immediate::Constant(Constant::Bool(_, w)) + | Immediate::Constant(Constant::Int(_, w)) => !w.is_polymorphic(), + Immediate::ConditionCode(_) => true, + })); + + let inst = Instruction(self.instr_counter); + self.instr_counter += 1; + + let data = InstructionData { + operator, + r#type, + immediates, + arguments, + }; + + log::trace!("new instruction: {:?} = {:?}", inst, data); + self.instruction_data.insert(inst, data); + inst + } + + pub fn r#const(&mut self, c: 
Constant, root_bit_width: BitWidth) -> Instruction { + assert!(!root_bit_width.is_polymorphic()); + match c { + Constant::Bool(_, bit_width) => self.new_instruction( + Operator::Bconst, + if bit_width.is_polymorphic() { + Type { + kind: Kind::Bool, + bit_width: root_bit_width, + } + } else { + Type { + kind: Kind::Bool, + bit_width, + } + }, + vec![c.into()], + vec![], + ), + Constant::Int(_, bit_width) => self.new_instruction( + Operator::Iconst, + if bit_width.is_polymorphic() { + Type { + kind: Kind::Int, + bit_width: root_bit_width, + } + } else { + Type { + kind: Kind::Int, + bit_width, + } + }, + vec![c.into()], + vec![], + ), + } + } + + fn instruction_to_constant(&mut self, inst: Instruction) -> Option { + match self.data(inst) { + InstructionData { + operator: Operator::Iconst, + immediates, + .. + } => Some(immediates[0].unwrap_constant()), + InstructionData { + operator: Operator::Bconst, + immediates, + .. + } => Some(immediates[0].unwrap_constant()), + _ => None, + } + } + + fn part_to_immediate(&mut self, part: Part) -> Result { + match part { + Part::Instruction(i) => self + .instruction_to_constant(i) + .map(|c| c.into()) + .ok_or("non-constant instructions cannot be converted into immediates"), + Part::Constant(c) => Ok(c.into()), + Part::ConditionCode(cc) => Ok(Immediate::ConditionCode(cc)), + } + } + + fn part_to_instruction( + &mut self, + root: Instruction, + part: Part, + ) -> Result { + match part { + Part::Instruction(inst) => { + let inst = self.resolve(inst); + Ok(inst) + } + Part::Constant(c) => { + let root_width = self.data(root).r#type.bit_width; + Ok(self.r#const(c, root_width)) + } + Part::ConditionCode(_) => Err("condition codes cannot be converted into instructions"), + } + } +} + +#[derive(Debug)] +pub struct TestIsa { + pub native_word_size_in_bits: u8, +} + +// Unsafe because we must ensure that `instruction_result_bit_width` never +// returns zero. 
+unsafe impl<'a> InstructionSet<'a> for TestIsa { + type Context = Program; + + type Instruction = Instruction; + + fn replace_instruction( + &self, + program: &mut Program, + old: Instruction, + new: Part, + ) -> Instruction { + log::debug!("replace_instruction({:?}, {:?})", old, new); + let new = program.part_to_instruction(old, new).unwrap(); + program.replace_instruction(old, new); + new + } + + fn get_part_at_path( + &self, + program: &mut Program, + root: Instruction, + path: Path, + ) -> Option> { + log::debug!("get_part_at_path({:?})", path); + + assert!(!path.0.is_empty()); + assert_eq!(path.0[0], 0); + + let mut part = Part::Instruction(root); + for p in &path.0[1..] { + if let Part::Instruction(inst) = part { + let data = program.data(inst); + let p = *p as usize; + + if p < data.immediates.len() { + part = data.immediates[p].into(); + continue; + } + + if let Some(inst) = data.arguments.get(p - data.immediates.len()).copied() { + part = Part::Instruction(inst); + continue; + } + } + + return None; + } + + Some(part) + } + + fn operator(&self, program: &mut Program, instr: Instruction) -> Option { + log::debug!("operator({:?})", instr); + let data = program.data(instr); + Some(data.operator) + } + + fn make_inst_1( + &self, + program: &mut Program, + root: Instruction, + operator: Operator, + r#type: Type, + a: Part, + ) -> Instruction { + log::debug!( + "make_inst_1(\n\toperator = {:?},\n\ttype = {},\n\ta = {:?},\n)", + operator, + r#type, + a, + ); + + let (imms, args) = match operator.immediates_arity() { + 0 => { + assert_eq!(operator.params_arity(), 1); + (vec![], vec![program.part_to_instruction(root, a).unwrap()]) + } + 1 => { + assert_eq!(operator.params_arity(), 0); + (vec![program.part_to_immediate(a).unwrap()], vec![]) + } + _ => unreachable!(), + }; + program.new_instruction(operator, r#type, imms, args) + } + + fn make_inst_2( + &self, + program: &mut Program, + root: Instruction, + operator: Operator, + r#type: Type, + a: Part, + b: Part, + 
) -> Instruction { + log::debug!( + "make_inst_2(\n\toperator = {:?},\n\ttype = {},\n\ta = {:?},\n\tb = {:?},\n)", + operator, + r#type, + a, + b, + ); + + let (imms, args) = match operator.immediates_arity() { + 0 => { + assert_eq!(operator.params_arity(), 2); + ( + vec![], + vec![ + program.part_to_instruction(root, a).unwrap(), + program.part_to_instruction(root, b).unwrap(), + ], + ) + } + 1 => { + assert_eq!(operator.params_arity(), 1); + ( + vec![program.part_to_immediate(a).unwrap()], + vec![program.part_to_instruction(root, b).unwrap()], + ) + } + 2 => { + assert_eq!(operator.params_arity(), 0); + ( + vec![ + program.part_to_immediate(a).unwrap(), + program.part_to_immediate(b).unwrap(), + ], + vec![], + ) + } + _ => unreachable!(), + }; + program.new_instruction(operator, r#type, imms, args) + } + + fn make_inst_3( + &self, + program: &mut Program, + root: Instruction, + operator: Operator, + r#type: Type, + a: Part, + b: Part, + c: Part, + ) -> Instruction { + log::debug!( + "make_inst_3(\n\toperator = {:?},\n\ttype = {},\n\ta = {:?},\n\tb = {:?},\n\tc = {:?},\n)", + operator, + r#type, + a, + b, + c, + ); + let (imms, args) = match operator.immediates_arity() { + 0 => { + assert_eq!(operator.params_arity(), 3); + ( + vec![], + vec![ + program.part_to_instruction(root, a).unwrap(), + program.part_to_instruction(root, b).unwrap(), + program.part_to_instruction(root, c).unwrap(), + ], + ) + } + 1 => { + assert_eq!(operator.params_arity(), 2); + ( + vec![program.part_to_immediate(a).unwrap()], + vec![ + program.part_to_instruction(root, b).unwrap(), + program.part_to_instruction(root, c).unwrap(), + ], + ) + } + 2 => { + assert_eq!(operator.params_arity(), 1); + ( + vec![ + program.part_to_immediate(a).unwrap(), + program.part_to_immediate(b).unwrap(), + ], + vec![program.part_to_instruction(root, c).unwrap()], + ) + } + 3 => { + assert_eq!(operator.params_arity(), 0); + ( + vec![ + program.part_to_immediate(a).unwrap(), + 
program.part_to_immediate(b).unwrap(), + program.part_to_immediate(c).unwrap(), + ], + vec![], + ) + } + _ => unreachable!(), + }; + program.new_instruction(operator, r#type, imms, args) + } + + fn instruction_to_constant( + &self, + program: &mut Program, + inst: Instruction, + ) -> Option { + log::debug!("instruction_to_constant({:?})", inst); + program.instruction_to_constant(inst) + } + + fn instruction_result_bit_width(&self, program: &mut Program, inst: Instruction) -> u8 { + log::debug!("instruction_result_bit_width({:?})", inst); + let ty = program.data(inst).r#type; + let width = ty.bit_width.fixed_width().unwrap(); + assert!(width != 0); + width + } + + fn native_word_size_in_bits(&self, _program: &mut Program) -> u8 { + log::debug!("native_word_size_in_bits"); + self.native_word_size_in_bits + } +} diff --git a/cranelift/peepmatic/crates/test/tests/tests.rs b/cranelift/peepmatic/crates/test/tests/tests.rs new file mode 100644 index 0000000000..989424adb8 --- /dev/null +++ b/cranelift/peepmatic/crates/test/tests/tests.rs @@ -0,0 +1,393 @@ +use peepmatic_runtime::{ + cc::ConditionCode, + operator::Operator, + part::Constant, + r#type::{BitWidth, Type}, +}; +use peepmatic_test::*; + +const TEST_ISA: TestIsa = TestIsa { + native_word_size_in_bits: 32, +}; + +macro_rules! 
optimizer { + ($opts:ident, $source:expr) => {{ + let _ = env_logger::try_init(); + $opts = peepmatic::compile_str($source, std::path::Path::new("peepmatic-test")).unwrap(); + $opts.optimizer(TEST_ISA) + }}; +} + +#[test] +fn opcode() { + let opts; + let mut optimizer = optimizer!(opts, "(=> (iadd $x 0) $x)"); + + let mut program = Program::default(); + let five = program.r#const(Constant::Int(5, BitWidth::ThirtyTwo), BitWidth::ThirtyTwo); + let zero = program.r#const(Constant::Int(0, BitWidth::ThirtyTwo), BitWidth::ThirtyTwo); + let add = program.new_instruction(Operator::Iadd, Type::i32(), vec![], vec![five, zero]); + + let new = optimizer.apply_one(&mut program, add); + let new = new.expect("optimization should have applied"); + assert!(program.structurally_eq(new, five)); + + let add = program.new_instruction(Operator::Iadd, Type::i32(), vec![], vec![five, five]); + let replacement = optimizer.apply_one(&mut program, add); + assert!(replacement.is_none()); +} + +#[test] +fn constant() { + let opts; + let mut optimizer = optimizer!(opts, "(=> (iadd $C $x) (iadd_imm $C $x))"); + + let mut program = Program::default(); + let five = program.r#const(Constant::Int(5, BitWidth::ThirtyTwo), BitWidth::ThirtyTwo); + let zero = program.r#const(Constant::Int(0, BitWidth::ThirtyTwo), BitWidth::ThirtyTwo); + let add = program.new_instruction(Operator::Iadd, Type::i32(), vec![], vec![five, zero]); + + let expected = program.new_instruction( + Operator::IaddImm, + Type::i32(), + vec![Constant::Int(5, BitWidth::ThirtyTwo).into()], + vec![zero], + ); + + let new = optimizer.apply_one(&mut program, add); + let new = new.expect("optimization should have applied"); + assert!(program.structurally_eq(new, expected)); + + let mul = program.new_instruction(Operator::Imul, Type::i32(), vec![], vec![five, zero]); + let add = program.new_instruction(Operator::Imul, Type::i32(), vec![], vec![mul, five]); + let replacement = optimizer.apply_one(&mut program, add); + 
assert!(replacement.is_none()); +} + +#[test] +fn boolean() { + let opts; + let mut optimizer = optimizer!(opts, "(=> (bint true) 1)"); + + let mut program = Program::default(); + let t = program.r#const(Constant::Bool(true, BitWidth::One), BitWidth::One); + let bint = program.new_instruction(Operator::Bint, Type::i1(), vec![], vec![t]); + let one = program.r#const(Constant::Int(1, BitWidth::One), BitWidth::ThirtyTwo); + + let new = optimizer.apply_one(&mut program, bint); + let new = new.expect("optimization should have applied"); + assert!(program.structurally_eq(new, one)); + + let f = program.r#const(Constant::Bool(false, BitWidth::One), BitWidth::One); + let bint = program.new_instruction(Operator::Bint, Type::i1(), vec![], vec![f]); + let replacement = optimizer.apply_one(&mut program, bint); + assert!(replacement.is_none()); +} + +#[test] +fn condition_codes() { + let opts; + let mut optimizer = optimizer!(opts, "(=> (icmp eq $x $x) true)"); + + let mut program = Program::default(); + let five = program.r#const(Constant::Int(5, BitWidth::ThirtyTwo), BitWidth::One); + let icmp_eq = program.new_instruction( + Operator::Icmp, + Type::b1(), + vec![ConditionCode::Eq.into()], + vec![five, five], + ); + let t = program.r#const(Constant::Bool(true, BitWidth::One), BitWidth::One); + + let new = optimizer.apply_one(&mut program, icmp_eq); + let new = new.expect("optimization should have applied"); + assert!(program.structurally_eq(new, t)); + + let icmp_ne = program.new_instruction( + Operator::Icmp, + Type::b1(), + vec![ConditionCode::Ne.into()], + vec![five, five], + ); + let replacement = optimizer.apply_one(&mut program, icmp_ne); + assert!(replacement.is_none()); +} + +#[test] +fn is_power_of_two() { + let opts; + let mut optimizer = optimizer!( + opts, + " +(=> (when (imul $x $C) + (is-power-of-two $C)) + (ishl $x $(log2 $C))) +" + ); + + let mut program = Program::default(); + let five = program.r#const(Constant::Int(5, BitWidth::ThirtyTwo), 
BitWidth::ThirtyTwo); + let two = program.r#const(Constant::Int(2, BitWidth::ThirtyTwo), BitWidth::ThirtyTwo); + let imul = program.new_instruction(Operator::Imul, Type::i32(), vec![], vec![five, two]); + + let one = program.r#const(Constant::Int(1, BitWidth::ThirtyTwo), BitWidth::ThirtyTwo); + let ishl = program.new_instruction(Operator::Ishl, Type::i32(), vec![], vec![five, one]); + + let new = optimizer.apply_one(&mut program, imul); + let new = new.expect("optimization should have applied"); + assert!(program.structurally_eq(new, ishl)); + + let three = program.r#const(Constant::Int(3, BitWidth::ThirtyTwo), BitWidth::ThirtyTwo); + let imul = program.new_instruction(Operator::Imul, Type::i32(), vec![], vec![five, three]); + + let replacement = optimizer.apply_one(&mut program, imul); + assert!(replacement.is_none()); +} + +#[test] +fn bit_width() { + let opts; + let mut optimizer = optimizer!( + opts, + " +(=> (when (imul $C $x) + (bit-width $C 32)) + (imul_imm $C $x)) +" + ); + + let mut program = Program::default(); + let five = program.r#const(Constant::Int(5, BitWidth::ThirtyTwo), BitWidth::ThirtyTwo); + let two = program.r#const(Constant::Int(2, BitWidth::ThirtyTwo), BitWidth::ThirtyTwo); + let imul = program.new_instruction(Operator::Imul, Type::i32(), vec![], vec![five, two]); + + let imul_imm = program.new_instruction( + Operator::ImulImm, + Type::i32(), + vec![Constant::Int(5, BitWidth::ThirtyTwo).into()], + vec![two], + ); + + let new = optimizer.apply_one(&mut program, imul); + let new = new.expect("optimization should have applied"); + assert!(program.structurally_eq(new, imul_imm)); + + let five = program.r#const(Constant::Int(5, BitWidth::SixtyFour), BitWidth::SixtyFour); + let two = program.r#const(Constant::Int(2, BitWidth::SixtyFour), BitWidth::SixtyFour); + let imul = program.new_instruction(Operator::Imul, Type::i32(), vec![], vec![five, two]); + + let replacement = optimizer.apply_one(&mut program, imul); + assert!(replacement.is_none()); +} 
+ +#[test] +fn fits_in_native_word() { + let opts; + let mut optimizer = optimizer!( + opts, + " +(=> (when (imul $C $x) + (fits-in-native-word $C)) + (imul_imm $C $x)) +" + ); + + let mut program = Program::default(); + let five = program.r#const(Constant::Int(5, BitWidth::ThirtyTwo), BitWidth::ThirtyTwo); + let two = program.r#const(Constant::Int(2, BitWidth::ThirtyTwo), BitWidth::ThirtyTwo); + let imul = program.new_instruction(Operator::Imul, Type::i32(), vec![], vec![five, two]); + + let imul_imm = program.new_instruction( + Operator::ImulImm, + Type::i32(), + vec![Constant::Int(5, BitWidth::ThirtyTwo).into()], + vec![two], + ); + + let new = optimizer.apply_one(&mut program, imul); + let new = new.expect("optimization should have applied"); + assert!(program.structurally_eq(new, imul_imm)); + + let five = program.r#const(Constant::Int(5, BitWidth::SixtyFour), BitWidth::SixtyFour); + let two = program.r#const(Constant::Int(2, BitWidth::SixtyFour), BitWidth::SixtyFour); + let imul = program.new_instruction(Operator::Imul, Type::i64(), vec![], vec![five, two]); + + let replacement = optimizer.apply_one(&mut program, imul); + assert!(replacement.is_none()); +} + +#[test] +fn unquote_neg() { + let opts; + let mut optimizer = optimizer!( + opts, + " +(=> (isub $x $C) + (iadd_imm $(neg $C) $x)) +" + ); + + let mut program = Program::default(); + let five = program.r#const(Constant::Int(5, BitWidth::SixtyFour), BitWidth::SixtyFour); + let two = program.r#const(Constant::Int(2, BitWidth::SixtyFour), BitWidth::SixtyFour); + let isub = program.new_instruction(Operator::Isub, Type::i64(), vec![], vec![five, two]); + + let iadd_imm = program.new_instruction( + Operator::IaddImm, + Type::i64(), + vec![Constant::Int(-2 as _, BitWidth::SixtyFour).into()], + vec![five], + ); + + let new = optimizer.apply_one(&mut program, isub); + let new = new.expect("optimization should have applied"); + assert!(program.structurally_eq(new, iadd_imm)); +} + +#[test] +fn subsumption() { + 
let opts; + let mut optimizer = optimizer!( + opts, + " +;; NB: the following optimizations are ordered from least to most general, so +;; the first applicable optimization should be the one that is applied. + +(=> (iadd (iadd (iadd $w $x) $y) $z) + (iadd (iadd $w $x) (iadd $y $z))) + +(=> (iadd $C1 $C2) + $(iadd $C1 $C2)) + +(=> (iadd $C $x) + (iadd_imm $C $x)) + +(=> (iadd $x $x) + (ishl_imm 1 $x)) +" + ); + + let mut program = Program::default(); + + let w = program.r#const(Constant::Int(11, BitWidth::SixtyFour), BitWidth::SixtyFour); + let x = program.r#const(Constant::Int(22, BitWidth::SixtyFour), BitWidth::SixtyFour); + let y = program.r#const(Constant::Int(33, BitWidth::SixtyFour), BitWidth::SixtyFour); + let z = program.r#const(Constant::Int(44, BitWidth::SixtyFour), BitWidth::SixtyFour); + + log::debug!("(iadd (iadd (iadd w x) y) z) => (iadd (iadd w x) (iadd y z))"); + + let iadd = program.new_instruction(Operator::Iadd, Type::i64(), vec![], vec![w, x]); + let iadd = program.new_instruction(Operator::Iadd, Type::i64(), vec![], vec![iadd, y]); + let iadd = program.new_instruction(Operator::Iadd, Type::i64(), vec![], vec![iadd, z]); + let expected_lhs = program.new_instruction(Operator::Iadd, Type::i64(), vec![], vec![w, x]); + let expected_rhs = program.new_instruction(Operator::Iadd, Type::i64(), vec![], vec![y, z]); + let expected = program.new_instruction( + Operator::Iadd, + Type::i64(), + vec![], + vec![expected_lhs, expected_rhs], + ); + + let new = optimizer.apply_one(&mut program, iadd); + let new = new.expect("optimization should have applied"); + assert!(program.structurally_eq(new, expected)); + + log::debug!("(iadd w x) => y"); + + let iadd = program.new_instruction(Operator::Iadd, Type::i64(), vec![], vec![w, x]); + let new = optimizer.apply_one(&mut program, iadd); + let new = new.expect("optimization should have applied"); + assert!(program.structurally_eq(new, y)); + + log::debug!("(iadd x (iadd y z)) => (iadd_imm x (iadd y z))"); + + let 
iadd_y_z = program.new_instruction(Operator::Iadd, Type::i64(), vec![], vec![y, z]); + let iadd = program.new_instruction(Operator::Iadd, Type::i64(), vec![], vec![x, iadd_y_z]); + let iadd_imm = program.new_instruction( + Operator::IaddImm, + Type::i64(), + vec![Constant::Int(22, BitWidth::SixtyFour).into()], + vec![iadd_y_z], + ); + let new = optimizer.apply_one(&mut program, iadd); + let new = new.expect("optimization should have applied"); + assert!(program.structurally_eq(new, iadd_imm)); + + log::debug!("(iadd (imul_imm x 1) (imul_imm x 1)) => (ishl_imm 1 (imul_imm x 1))"); + + let imul_imm = program.new_instruction( + Operator::ImulImm, + Type::i64(), + vec![Constant::Int(1, BitWidth::SixtyFour).into()], + vec![x], + ); + let iadd = program.new_instruction( + Operator::Iadd, + Type::i64(), + vec![], + vec![imul_imm, imul_imm], + ); + let ishl_imm = program.new_instruction( + Operator::IshlImm, + Type::i64(), + vec![Constant::Int(1, BitWidth::SixtyFour).into()], + vec![imul_imm], + ); + let new = optimizer.apply_one(&mut program, iadd); + let new = new.expect("optimization should have applied"); + assert!(program.structurally_eq(new, ishl_imm)); + + log::debug!("(iadd (imul w x) (imul y z)) does not match any optimization."); + + let imul_w_x = program.new_instruction(Operator::Imul, Type::i64(), vec![], vec![w, x]); + let imul_y_z = program.new_instruction(Operator::Imul, Type::i64(), vec![], vec![y, z]); + let iadd = program.new_instruction( + Operator::Iadd, + Type::i64(), + vec![], + vec![imul_w_x, imul_y_z], + ); + + let replacement = optimizer.apply_one(&mut program, iadd); + assert!(replacement.is_none()); +} + +#[test] +fn polymorphic_bit_widths() { + let opts; + let mut optimizer = optimizer!(opts, "(=> (iadd $C $x) (iadd_imm $C $x))"); + + let mut program = Program::default(); + + // Applies to 32 bit adds. 
+ + let x = program.r#const(Constant::Int(42, BitWidth::ThirtyTwo), BitWidth::ThirtyTwo); + let y = program.r#const(Constant::Int(420, BitWidth::ThirtyTwo), BitWidth::ThirtyTwo); + let iadd = program.new_instruction(Operator::Iadd, Type::i32(), vec![], vec![x, y]); + let iadd_imm = program.new_instruction( + Operator::IaddImm, + Type::i32(), + vec![Constant::Int(42, BitWidth::ThirtyTwo).into()], + vec![y], + ); + + let new = optimizer.apply_one(&mut program, iadd); + let new = new.expect("optimization should have applied"); + assert!(program.structurally_eq(new, iadd_imm)); + + // Applies to 16 bit adds. + + let x = program.r#const(Constant::Int(42, BitWidth::Sixteen), BitWidth::Sixteen); + let y = program.r#const(Constant::Int(420, BitWidth::Sixteen), BitWidth::Sixteen); + let iadd = program.new_instruction(Operator::Iadd, Type::i16(), vec![], vec![x, y]); + let iadd_imm = program.new_instruction( + Operator::IaddImm, + Type::i16(), + vec![Constant::Int(42, BitWidth::Sixteen).into()], + vec![y], + ); + + let new = optimizer.apply_one(&mut program, iadd); + let new = new.expect("optimization should have applied"); + assert!(program.structurally_eq(new, iadd_imm)); +} diff --git a/cranelift/peepmatic/examples/mul-by-pow2.peepmatic b/cranelift/peepmatic/examples/mul-by-pow2.peepmatic new file mode 100644 index 0000000000..cca78a372f --- /dev/null +++ b/cranelift/peepmatic/examples/mul-by-pow2.peepmatic @@ -0,0 +1,3 @@ +(=> (when (imul $x $C) + (is-power-of-two $C)) + (ishl $x $(log2 $C))) diff --git a/cranelift/peepmatic/examples/redundant-bor.peepmatic b/cranelift/peepmatic/examples/redundant-bor.peepmatic new file mode 100644 index 0000000000..d8d6f4a144 --- /dev/null +++ b/cranelift/peepmatic/examples/redundant-bor.peepmatic @@ -0,0 +1,13 @@ +;; Remove redundant bitwise OR instructions that are no-ops. 
+ +(=> (bor $x (bor $x $y)) + (bor $x $y)) + +(=> (bor $y (bor $x $y)) + (bor $x $y)) + +(=> (bor (bor $x $y) $x) + (bor $x $y)) + +(=> (bor (bor $x $y) $y) + (bor $x $y)) diff --git a/cranelift/peepmatic/examples/redundant-bor.png b/cranelift/peepmatic/examples/redundant-bor.png new file mode 100644 index 0000000000..dab873e6cf Binary files /dev/null and b/cranelift/peepmatic/examples/redundant-bor.png differ diff --git a/cranelift/peepmatic/examples/simple.peepmatic b/cranelift/peepmatic/examples/simple.peepmatic new file mode 100644 index 0000000000..a90e0c1a69 --- /dev/null +++ b/cranelift/peepmatic/examples/simple.peepmatic @@ -0,0 +1,11 @@ +(=> (bor $x (bor $x $y)) + (bor $x $y)) + +(=> (bor $y (bor $x $y)) + (bor $x $y)) + +(=> (bor (bor $x $y) $x) + (bor $x $y)) + +(=> (bor (bor $x $y) $y) + (bor $x $y)) diff --git a/cranelift/peepmatic/src/ast.rs b/cranelift/peepmatic/src/ast.rs new file mode 100644 index 0000000000..daac871553 --- /dev/null +++ b/cranelift/peepmatic/src/ast.rs @@ -0,0 +1,508 @@ +//! Abstract syntax tree type definitions. +//! +//! This file makes fairly heavy use of macros, which are defined in the +//! `peepmatic_macro` crate that lives at `crates/macro`. Notably, the following +//! traits are all derived via `derive(Ast)`: +//! +//! * `Span` -- access the `wast::Span` where an AST node was parsed from. For +//! `struct`s, there must be a `span: wast::Span` field, because the macro +//! always generates an implementation that returns `self.span` for +//! `struct`s. For `enum`s, every variant must have a single, unnamed field +//! which implements the `Span` trait. The macro will generate code to return +//! the span of whatever variant it is. +//! +//! * `ChildNodes` -- get each of the child AST nodes that a given node +//! references. Some fields in an AST type aren't actually considered an AST +//! node (like spans) and these are ignored via the `#[peepmatic(skip_child)]` +//! attribute. 
Some fields contain multiple AST nodes (like vectors of +//! operands) and these are flattened with `#[peepmatic(flatten)]`. +//! +//! * `From<&'a Self> for DynAstRef<'a>` -- convert a particular AST type into +//! `DynAstRef`, which is an `enum` of all the different kinds of AST nodes. + +use peepmatic_macro::Ast; +use peepmatic_runtime::{ + operator::{Operator, UnquoteOperator}, + r#type::{BitWidth, Type}, +}; +use std::cell::Cell; +use std::hash::{Hash, Hasher}; +use std::marker::PhantomData; +use wast::Id; + +/// A reference to any AST node. +#[derive(Debug, Clone, Copy)] +pub enum DynAstRef<'a> { + /// A reference to an `Optimizations`. + Optimizations(&'a Optimizations<'a>), + + /// A reference to an `Optimization`. + Optimization(&'a Optimization<'a>), + + /// A reference to an `Lhs`. + Lhs(&'a Lhs<'a>), + + /// A reference to an `Rhs`. + Rhs(&'a Rhs<'a>), + + /// A reference to a `Pattern`. + Pattern(&'a Pattern<'a>), + + /// A reference to a `Precondition`. + Precondition(&'a Precondition<'a>), + + /// A reference to a `ConstraintOperand`. + ConstraintOperand(&'a ConstraintOperand<'a>), + + /// A reference to a `ValueLiteral`. + ValueLiteral(&'a ValueLiteral<'a>), + + /// A reference to a `Constant`. + Constant(&'a Constant<'a>), + + /// A reference to a `PatternOperation`. + PatternOperation(&'a Operation<'a, Pattern<'a>>), + + /// A reference to a `Variable`. + Variable(&'a Variable<'a>), + + /// A reference to an `Integer`. + Integer(&'a Integer<'a>), + + /// A reference to a `Boolean`. + Boolean(&'a Boolean<'a>), + + /// A reference to a `ConditionCode`. + ConditionCode(&'a ConditionCode<'a>), + + /// A reference to an `Unquote`. + Unquote(&'a Unquote<'a>), + + /// A reference to an `RhsOperation`. 
+ RhsOperation(&'a Operation<'a, Rhs<'a>>), +} + +impl<'a, 'b> ChildNodes<'a, 'b> for DynAstRef<'a> { + fn child_nodes(&'b self, sink: &mut impl Extend>) { + match self { + Self::Optimizations(x) => x.child_nodes(sink), + Self::Optimization(x) => x.child_nodes(sink), + Self::Lhs(x) => x.child_nodes(sink), + Self::Rhs(x) => x.child_nodes(sink), + Self::Pattern(x) => x.child_nodes(sink), + Self::Precondition(x) => x.child_nodes(sink), + Self::ConstraintOperand(x) => x.child_nodes(sink), + Self::ValueLiteral(x) => x.child_nodes(sink), + Self::Constant(x) => x.child_nodes(sink), + Self::PatternOperation(x) => x.child_nodes(sink), + Self::Variable(x) => x.child_nodes(sink), + Self::Integer(x) => x.child_nodes(sink), + Self::Boolean(x) => x.child_nodes(sink), + Self::ConditionCode(x) => x.child_nodes(sink), + Self::Unquote(x) => x.child_nodes(sink), + Self::RhsOperation(x) => x.child_nodes(sink), + } + } +} + +/// A trait implemented by all AST nodes. +/// +/// All AST nodes can: +/// +/// * Enumerate their children via `ChildNodes`. +/// +/// * Give you the `wast::Span` where they were defined. +/// +/// * Be converted into a `DynAstRef`. +/// +/// This trait is blanked implemented for everything that does those three +/// things, and in practice those three thrings are all implemented by the +/// `derive(Ast)` macro. +pub trait Ast<'a>: 'a + ChildNodes<'a, 'a> + Span +where + DynAstRef<'a>: From<&'a Self>, +{ +} + +impl<'a, T> Ast<'a> for T +where + T: 'a + ?Sized + ChildNodes<'a, 'a> + Span, + DynAstRef<'a>: From<&'a Self>, +{ +} + +/// Enumerate the child AST nodes of a given node. +pub trait ChildNodes<'a, 'b> { + /// Get each of this AST node's children, in order. + fn child_nodes(&'b self, sink: &mut impl Extend>); +} + +/// A trait for getting the span where an AST node was defined. +pub trait Span { + /// Get the span where this AST node was defined. + fn span(&self) -> wast::Span; +} + +/// A set of optimizations. +/// +/// This is the root AST node. 
+#[derive(Debug, Ast)] +pub struct Optimizations<'a> { + /// Where these `Optimizations` were defined. + #[peepmatic(skip_child)] + pub span: wast::Span, + + /// The optimizations. + #[peepmatic(flatten)] + pub optimizations: Vec>, +} + +/// A complete optimization: a left-hand side to match against and a right-hand +/// side replacement. +#[derive(Debug, Ast)] +pub struct Optimization<'a> { + /// Where this `Optimization` was defined. + #[peepmatic(skip_child)] + pub span: wast::Span, + + /// The left-hand side that matches when this optimization applies. + pub lhs: Lhs<'a>, + + /// The new sequence of instructions to replace an old sequence that matches + /// the left-hand side with. + pub rhs: Rhs<'a>, +} + +/// A left-hand side describes what is required for a particular optimization to +/// apply. +/// +/// A left-hand side has two parts: a structural pattern for describing +/// candidate instruction sequences, and zero or more preconditions that add +/// additional constraints upon instruction sequences matched by the pattern. +#[derive(Debug, Ast)] +pub struct Lhs<'a> { + /// Where this `Lhs` was defined. + #[peepmatic(skip_child)] + pub span: wast::Span, + + /// A pattern that describes sequences of instructions to match. + pub pattern: Pattern<'a>, + + /// Additional constraints that a match must satisfy in addition to + /// structually matching the pattern, e.g. some constant must be a power of + /// two. + #[peepmatic(flatten)] + pub preconditions: Vec>, +} + +/// A structural pattern, potentially with wildcard variables for matching whole +/// subtrees. +#[derive(Debug, Ast)] +pub enum Pattern<'a> { + /// A specific value. These are written as `1234` or `0x1234` or `true` or + /// `false`. + ValueLiteral(ValueLiteral<'a>), + + /// A constant that matches any constant value. This subsumes value + /// patterns. These are upper-case identifiers like `$C`. + Constant(Constant<'a>), + + /// An operation pattern with zero or more operand patterns. 
These are + /// s-expressions like `(iadd $x $y)`. + Operation(Operation<'a, Pattern<'a>>), + + /// A variable that matches any kind of subexpression. This subsumes all + /// other patterns. These are lower-case identifiers like `$x`. + Variable(Variable<'a>), +} + +/// An integer or boolean value literal. +#[derive(Debug, Ast)] +pub enum ValueLiteral<'a> { + /// An integer value. + Integer(Integer<'a>), + + /// A boolean value: `true` or `false`. + Boolean(Boolean<'a>), + + /// A condition code: `eq`, `ne`, etc... + ConditionCode(ConditionCode<'a>), +} + +/// An integer literal. +#[derive(Debug, PartialEq, Eq, Ast)] +pub struct Integer<'a> { + /// Where this `Integer` was defined. + #[peepmatic(skip_child)] + pub span: wast::Span, + + /// The integer value. + /// + /// Note that although Cranelift allows 128 bits wide values, the widest + /// supported constants as immediates are 64 bits. + #[peepmatic(skip_child)] + pub value: i64, + + /// The bit width of this integer. + /// + /// This is either a fixed bit width, or polymorphic over the width of the + /// optimization. + /// + /// This field is initialized from `None` to `Some` by the type checking + /// pass in `src/verify.rs`. + #[peepmatic(skip_child)] + pub bit_width: Cell>, + + #[allow(missing_docs)] + #[peepmatic(skip_child)] + pub marker: PhantomData<&'a ()>, +} + +impl Hash for Integer<'_> { + fn hash(&self, state: &mut H) + where + H: Hasher, + { + let Integer { + span, + value, + bit_width, + marker: _, + } = self; + span.hash(state); + value.hash(state); + let bit_width = bit_width.get(); + bit_width.hash(state); + } +} + +/// A boolean literal. +#[derive(Debug, PartialEq, Eq, Ast)] +pub struct Boolean<'a> { + /// Where this `Boolean` was defined. + #[peepmatic(skip_child)] + pub span: wast::Span, + + /// The boolean value. + #[peepmatic(skip_child)] + pub value: bool, + + /// The bit width of this boolean. 
+ /// + /// This is either a fixed bit width, or polymorphic over the width of the + /// optimization. + /// + /// This field is initialized from `None` to `Some` by the type checking + /// pass in `src/verify.rs`. + #[peepmatic(skip_child)] + pub bit_width: Cell>, + + #[allow(missing_docs)] + #[peepmatic(skip_child)] + pub marker: PhantomData<&'a ()>, +} + +impl Hash for Boolean<'_> { + fn hash(&self, state: &mut H) + where + H: Hasher, + { + let Boolean { + span, + value, + bit_width, + marker: _, + } = self; + span.hash(state); + value.hash(state); + let bit_width = bit_width.get(); + bit_width.hash(state); + } +} + +/// A condition code. +#[derive(Debug, Ast)] +pub struct ConditionCode<'a> { + /// Where this `ConditionCode` was defined. + #[peepmatic(skip_child)] + pub span: wast::Span, + + /// The actual condition code. + #[peepmatic(skip_child)] + pub cc: peepmatic_runtime::cc::ConditionCode, + + #[allow(missing_docs)] + #[peepmatic(skip_child)] + pub marker: PhantomData<&'a ()>, +} + +/// A symbolic constant. +/// +/// These are identifiers containing uppercase letters: `$C`, `$MY-CONST`, +/// `$CONSTANT1`. +#[derive(Debug, Ast)] +pub struct Constant<'a> { + /// Where this `Constant` was defined. + #[peepmatic(skip_child)] + pub span: wast::Span, + + /// This constant's identifier. + #[peepmatic(skip_child)] + pub id: Id<'a>, +} + +/// A variable that matches any subtree. +/// +/// Duplicate uses of the same variable constrain each occurrence's match to +/// being the same as each other occurrence as well, e.g. `(iadd $x $x)` matches +/// `(iadd 5 5)` but not `(iadd 1 2)`. +#[derive(Debug, Ast)] +pub struct Variable<'a> { + /// Where this `Variable` was defined. + #[peepmatic(skip_child)] + pub span: wast::Span, + + /// This variable's identifier. + #[peepmatic(skip_child)] + pub id: Id<'a>, +} + +/// An operation with an operator, and operands of type `T`. 
+#[derive(Debug, Ast)] +#[peepmatic(no_into_dyn_node)] +pub struct Operation<'a, T> +where + T: 'a + Ast<'a>, + DynAstRef<'a>: From<&'a T>, +{ + /// The span where this operation was written. + #[peepmatic(skip_child)] + pub span: wast::Span, + + /// The operator for this operation, e.g. `imul` or `iadd`. + #[peepmatic(skip_child)] + pub operator: Operator, + + /// An optional ascribed or inferred type for the operator. + #[peepmatic(skip_child)] + pub r#type: Cell>, + + /// This operation's operands. + /// + /// When `Operation` is used in a pattern, these are the sub-patterns for + /// the operands. When `Operation is used in a right-hand side replacement, + /// these are the sub-replacements for the operands. + #[peepmatic(flatten)] + pub operands: Vec, + + #[allow(missing_docs)] + #[peepmatic(skip_child)] + pub marker: PhantomData<&'a ()>, +} + +impl<'a> From<&'a Operation<'a, Pattern<'a>>> for DynAstRef<'a> { + #[inline] + fn from(o: &'a Operation<'a, Pattern<'a>>) -> DynAstRef<'a> { + DynAstRef::PatternOperation(o) + } +} + +impl<'a> From<&'a Operation<'a, Rhs<'a>>> for DynAstRef<'a> { + #[inline] + fn from(o: &'a Operation<'a, Rhs<'a>>) -> DynAstRef<'a> { + DynAstRef::RhsOperation(o) + } +} + +/// A precondition adds additional constraints to a pattern, such as "$C must be +/// a power of two". +#[derive(Debug, Ast)] +pub struct Precondition<'a> { + /// Where this `Precondition` was defined. + #[peepmatic(skip_child)] + pub span: wast::Span, + + /// The constraint operator. + #[peepmatic(skip_child)] + pub constraint: Constraint, + + /// The operands of the constraint. + #[peepmatic(flatten)] + pub operands: Vec>, +} + +/// Contraint operators. +#[derive(Clone, Copy, PartialEq, Eq, Hash, Debug)] +pub enum Constraint { + /// Is the operand a power of two? + IsPowerOfTwo, + + /// Check the bit width of a value. + BitWidth, + + /// Does the argument fit within our target architecture's native word size? 
+ FitsInNativeWord, +} + +/// An operand of a precondition's constraint. +#[derive(Debug, Ast)] +pub enum ConstraintOperand<'a> { + /// A value literal operand. + ValueLiteral(ValueLiteral<'a>), + + /// A constant operand. + Constant(Constant<'a>), + + /// A variable operand. + Variable(Variable<'a>), +} + +/// The right-hand side of an optimization that contains the instructions to +/// replace any matched left-hand side with. +#[derive(Debug, Ast)] +pub enum Rhs<'a> { + /// A value literal right-hand side. + ValueLiteral(ValueLiteral<'a>), + + /// A constant right-hand side (the constant must have been matched and + /// bound in the left-hand side's pattern). + Constant(Constant<'a>), + + /// A variable right-hand side (the variable must have been matched and + /// bound in the left-hand side's pattern). + Variable(Variable<'a>), + + /// An unquote expression that is evaluated while replacing the left-hand + /// side with the right-hand side. The result of the evaluation is used in + /// the replacement. + Unquote(Unquote<'a>), + + /// A compound right-hand side consisting of an operation and subsequent + /// right-hand side operands. + Operation(Operation<'a, Rhs<'a>>), +} + +/// An unquote operation. +/// +/// Rather than replaciong a left-hand side, these are evaluated and then the +/// result of the evaluation replaces the left-hand side. This allows for +/// compile-time computation while replacing a matched left-hand side with a +/// right-hand side. +/// +/// For example, given the unqouted right-hand side `$(log2 $C)`, we replace any +/// instructions that match its left-hand side with the compile-time result of +/// `log2($C)` (the left-hand side must match and bind the constant `$C`). +#[derive(Debug, Ast)] +pub struct Unquote<'a> { + /// Where this `Unquote` was defined. + #[peepmatic(skip_child)] + pub span: wast::Span, + + /// The operator for this unquote operation. 
+    #[peepmatic(skip_child)]
+    pub operator: UnquoteOperator,
+
+    /// The operands for this unquote operation.
+    #[peepmatic(flatten)]
+    pub operands: Vec<Rhs<'a>>,
+}
diff --git a/cranelift/peepmatic/src/automatize.rs b/cranelift/peepmatic/src/automatize.rs
new file mode 100644
index 0000000000..de053c5574
--- /dev/null
+++ b/cranelift/peepmatic/src/automatize.rs
@@ -0,0 +1,31 @@
+//! Compile a set of linear optimizations into an automaton.
+
+use peepmatic_automata::{Automaton, Builder};
+use peepmatic_runtime::linear;
+
+/// Construct an automaton from a set of linear optimizations.
+pub fn automatize(
+    opts: &linear::Optimizations,
+) -> Automaton<linear::MatchResult, linear::MatchOp, Box<[linear::Action]>> {
+    debug_assert!(crate::linear_passes::is_sorted_lexicographically(opts));
+
+    let mut builder = Builder::<linear::MatchResult, linear::MatchOp, Box<[linear::Action]>>::new();
+
+    for opt in &opts.optimizations {
+        let mut insertion = builder.insert();
+        for inc in &opt.increments {
+            // Ensure that this state's associated data is this increment's
+            // match operation.
+            if let Some(op) = insertion.get_state_data() {
+                assert_eq!(*op, inc.operation);
+            } else {
+                insertion.set_state_data(inc.operation);
+            }
+
+            insertion.next(inc.expected, inc.actions.clone().into_boxed_slice());
+        }
+        insertion.finish();
+    }
+
+    builder.finish()
+}
diff --git a/cranelift/peepmatic/src/dot_fmt.rs b/cranelift/peepmatic/src/dot_fmt.rs
new file mode 100644
index 0000000000..6939577147
--- /dev/null
+++ b/cranelift/peepmatic/src/dot_fmt.rs
@@ -0,0 +1,145 @@
+//! Formatting a peephole optimizer's automata for GraphViz Dot.
+//!
+//! See also `crates/automata/src/dot.rs`.
+ +use peepmatic_automata::dot::DotFmt; +use peepmatic_runtime::{ + cc::ConditionCode, + integer_interner::{IntegerId, IntegerInterner}, + linear, + operator::Operator, + paths::{PathId, PathInterner}, +}; +use std::convert::{TryFrom, TryInto}; +use std::io::{self, Write}; +use std::num::NonZeroU16; + +#[derive(Debug)] +pub(crate) struct PeepholeDotFmt<'a>(pub(crate) &'a PathInterner, pub(crate) &'a IntegerInterner); + +impl DotFmt> for PeepholeDotFmt<'_> { + fn fmt_transition( + &self, + w: &mut impl Write, + from: Option<&linear::MatchOp>, + input: &linear::MatchResult, + _to: Option<&linear::MatchOp>, + ) -> io::Result<()> { + let from = from.expect("we should have match op for every state"); + if let Some(x) = input.ok().map(|x| x.get()) { + match from { + linear::MatchOp::Opcode { .. } => { + let opcode = + Operator::try_from(x).expect("we shouldn't generate non-opcode edges"); + write!(w, "{}", opcode) + } + linear::MatchOp::ConditionCode { .. } => { + let cc = + ConditionCode::try_from(x).expect("we shouldn't generate non-CC edges"); + write!(w, "{}", cc) + } + linear::MatchOp::IntegerValue { .. } => { + let x = self + .1 + .lookup(IntegerId(NonZeroU16::new(x.try_into().unwrap()).unwrap())); + write!(w, "{}", x) + } + _ => write!(w, "Ok({})", x), + } + } else { + write!(w, "(else)") + } + } + + fn fmt_state(&self, w: &mut impl Write, op: &linear::MatchOp) -> io::Result<()> { + use linear::MatchOp::*; + + write!(w, r#""#)?; + + let p = p(self.0); + match op { + Opcode { path } => write!(w, "opcode @ {}", p(path))?, + IsConst { path } => write!(w, "is-const? @ {}", p(path))?, + IsPowerOfTwo { path } => write!(w, "is-power-of-two? 
@ {}", p(path))?, + BitWidth { path } => write!(w, "bit-width @ {}", p(path))?, + FitsInNativeWord { path } => write!(w, "fits-in-native-word @ {}", p(path))?, + Eq { path_a, path_b } => write!(w, "{} == {}", p(path_a), p(path_b))?, + IntegerValue { path } => write!(w, "integer-value @ {}", p(path))?, + BooleanValue { path } => write!(w, "boolean-value @ {}", p(path))?, + ConditionCode { path } => write!(w, "condition-code @ {}", p(path))?, + Nop => write!(w, "nop")?, + } + + writeln!(w, "") + } + + fn fmt_output(&self, w: &mut impl Write, actions: &Box<[linear::Action]>) -> io::Result<()> { + use linear::Action::*; + + if actions.is_empty() { + return writeln!(w, "(no output)"); + } + + write!(w, r#""#)?; + + let p = p(self.0); + + for a in actions.iter() { + match a { + GetLhs { path } => write!(w, "get-lhs @ {}
", p(path))?, + UnaryUnquote { operator, operand } => { + write!(w, "eval {} $rhs{}
", operator, operand.0)? + } + BinaryUnquote { operator, operands } => write!( + w, + "eval {} $rhs{}, $rhs{}
", + operator, operands[0].0, operands[1].0, + )?, + MakeIntegerConst { + value, + bit_width: _, + } => write!(w, "make {}
", self.1.lookup(*value))?, + MakeBooleanConst { + value, + bit_width: _, + } => write!(w, "make {}
", value)?, + MakeConditionCode { cc } => write!(w, "{}
", cc)?, + MakeUnaryInst { + operand, + operator, + r#type: _, + } => write!(w, "make {} $rhs{}
", operator, operand.0,)?, + MakeBinaryInst { + operator, + operands, + r#type: _, + } => write!( + w, + "make {} $rhs{}, $rhs{}
", + operator, operands[0].0, operands[1].0, + )?, + MakeTernaryInst { + operator, + operands, + r#type: _, + } => write!( + w, + "make {} $rhs{}, $rhs{}, $rhs{}
", + operator, operands[0].0, operands[1].0, operands[2].0, + )?, + } + } + + writeln!(w, "
") + } +} + +fn p<'a>(paths: &'a PathInterner) -> impl Fn(&PathId) -> String + 'a { + move |path: &PathId| { + let mut s = vec![]; + for b in paths.lookup(*path).0 { + s.push(b.to_string()); + } + s.join(".") + } +} diff --git a/cranelift/peepmatic/src/lib.rs b/cranelift/peepmatic/src/lib.rs new file mode 100755 index 0000000000..407ba3670d --- /dev/null +++ b/cranelift/peepmatic/src/lib.rs @@ -0,0 +1,165 @@ +/*! + +`peepmatic` is a DSL and compiler for generating peephole optimizers. + +The user writes a set of optimizations in the DSL, and then `peepmatic` compiles +the set of optimizations into an efficient peephole optimizer. + + */ + +#![deny(missing_docs)] +#![deny(missing_debug_implementations)] + +mod ast; +mod automatize; +mod dot_fmt; +mod linear_passes; +mod linearize; +mod parser; +mod traversals; +mod verify; +pub use self::{ + ast::*, automatize::*, linear_passes::*, linearize::*, parser::*, traversals::*, verify::*, +}; + +use peepmatic_runtime::PeepholeOptimizations; +use std::fs; +use std::path::Path; + +/// Compile the given DSL file into a compact peephole optimizations automaton! +/// +/// ## Example +/// +/// ```no_run +/// # fn main() -> anyhow::Result<()> { +/// use std::path::Path; +/// +/// let peep_opts = peepmatic::compile_file(Path::new( +/// "path/to/optimizations.peepmatic" +/// ))?; +/// +/// // Use the peephole optimizations or serialize them into bytes here... +/// # Ok(()) +/// # } +/// ``` +/// +/// ## Visualizing the Peephole Optimizer's Automaton +/// +/// To visualize (or debug) the peephole optimizer's automaton, set the +/// `PEEPMATIC_DOT` environment variable to a file path. A [GraphViz +/// Dot]((https://graphviz.gitlab.io/_pages/pdf/dotguide.pdf)) file showing the +/// peephole optimizer's automaton will be written to that file path. 
+pub fn compile_file(filename: &Path) -> anyhow::Result { + let source = fs::read_to_string(filename)?; + compile_str(&source, filename) +} + +/// Compile the given DSL source text down into a compact peephole optimizations +/// automaton. +/// +/// This is like [compile_file][crate::compile_file] but you bring your own file +/// I/O. +/// +/// The `filename` parameter is used to provide better error messages. +/// +/// ## Example +/// +/// ```no_run +/// # fn main() -> anyhow::Result<()> { +/// use std::path::Path; +/// +/// let peep_opts = peepmatic::compile_str( +/// " +/// (=> (iadd $x 0) $x) +/// (=> (imul $x 0) 0) +/// (=> (imul $x 1) $x) +/// ", +/// Path::new("my-optimizations"), +/// )?; +/// +/// // Use the peephole optimizations or serialize them into bytes here... +/// # Ok(()) +/// # } +/// ``` +/// +/// ## Visualizing the Peephole Optimizer's Automaton +/// +/// To visualize (or debug) the peephole optimizer's automaton, set the +/// `PEEPMATIC_DOT` environment variable to a file path. A [GraphViz +/// Dot]((https://graphviz.gitlab.io/_pages/pdf/dotguide.pdf)) file showing the +/// peephole optimizer's automaton will be written to that file path. 
+pub fn compile_str(source: &str, filename: &Path) -> anyhow::Result { + let buf = wast::parser::ParseBuffer::new(source).map_err(|mut e| { + e.set_path(filename); + e.set_text(source); + e + })?; + + let opts = wast::parser::parse::(&buf).map_err(|mut e| { + e.set_path(filename); + e.set_text(source); + e + })?; + + verify(&opts).map_err(|mut e| { + e.set_path(filename); + e.set_text(source); + e + })?; + + let mut opts = crate::linearize(&opts); + sort_least_to_most_general(&mut opts); + remove_unnecessary_nops(&mut opts); + match_in_same_order(&mut opts); + sort_lexicographically(&mut opts); + + let automata = automatize(&opts); + let paths = opts.paths; + let integers = opts.integers; + + if let Ok(path) = std::env::var("PEEPMATIC_DOT") { + let f = dot_fmt::PeepholeDotFmt(&paths, &integers); + if let Err(e) = automata.write_dot_file(&f, &path) { + panic!( + "failed to write GraphViz Dot file to PEEPMATIC_DOT={}; error: {}", + path, e + ); + } + } + + Ok(PeepholeOptimizations { + paths, + integers, + automata, + }) +} + +#[cfg(test)] +mod tests { + use super::*; + + fn assert_compiles(path: &str) { + match compile_file(Path::new(path)) { + Ok(_) => return, + Err(e) => { + eprintln!("error: {}", e); + panic!("error: {}", e); + } + } + } + + #[test] + fn compile_redundant_bor() { + assert_compiles("examples/redundant-bor.peepmatic"); + } + + #[test] + fn mul_by_pow2() { + assert_compiles("examples/mul-by-pow2.peepmatic"); + } + + #[test] + fn compile_preopt() { + assert_compiles("../codegen/src/preopt.peepmatic"); + } +} diff --git a/cranelift/peepmatic/src/linear_passes.rs b/cranelift/peepmatic/src/linear_passes.rs new file mode 100644 index 0000000000..9e87ae0036 --- /dev/null +++ b/cranelift/peepmatic/src/linear_passes.rs @@ -0,0 +1,719 @@ +//! Passes over the linear IR. + +use peepmatic_runtime::{ + linear, + paths::{PathId, PathInterner}, +}; +use std::cmp::Ordering; + +/// Sort a set of optimizations from least to most general. 
+/// +/// This helps us ensure that we always match the least-general (aka +/// most-specific) optimization that we can for a particular instruction +/// sequence. +/// +/// For example, if we have both of these optimizations: +/// +/// ```lisp +/// (=> (imul $C $x) +/// (imul_imm $C $x)) +/// +/// (=> (when (imul $C $x)) +/// (is-power-of-two $C)) +/// (ishl $x $C)) +/// ``` +/// +/// and we are matching `(imul 4 (..))`, then we want to apply the second +/// optimization, because it is more specific than the first. +pub fn sort_least_to_most_general(opts: &mut linear::Optimizations) { + let linear::Optimizations { + ref mut optimizations, + ref paths, + .. + } = opts; + + // NB: we *cannot* use an unstable sort here, because we want deterministic + // compilation of optimizations to automata. + optimizations.sort_by(|a, b| compare_optimization_generality(paths, a, b)); + debug_assert!(is_sorted_by_generality(opts)); +} + +/// Sort the linear optimizations lexicographically. +/// +/// This sort order is required for automata construction. +pub fn sort_lexicographically(opts: &mut linear::Optimizations) { + let linear::Optimizations { + ref mut optimizations, + ref paths, + .. + } = opts; + + // NB: we *cannot* use an unstable sort here, same as above. 
+ optimizations + .sort_by(|a, b| compare_optimizations(paths, a, b, |a_len, b_len| a_len.cmp(&b_len))); +} + +fn compare_optimizations( + paths: &PathInterner, + a: &linear::Optimization, + b: &linear::Optimization, + compare_lengths: impl Fn(usize, usize) -> Ordering, +) -> Ordering { + for (a, b) in a.increments.iter().zip(b.increments.iter()) { + let c = compare_match_op_generality(paths, a.operation, b.operation); + if c != Ordering::Equal { + return c; + } + + let c = match (a.expected, b.expected) { + (Ok(a), Ok(b)) => a.cmp(&b).reverse(), + (Err(_), Ok(_)) => Ordering::Greater, + (Ok(_), Err(_)) => Ordering::Less, + (Err(linear::Else), Err(linear::Else)) => Ordering::Equal, + }; + if c != Ordering::Equal { + return c; + } + } + + compare_lengths(a.increments.len(), b.increments.len()) +} + +fn compare_optimization_generality( + paths: &PathInterner, + a: &linear::Optimization, + b: &linear::Optimization, +) -> Ordering { + compare_optimizations(paths, a, b, |a_len, b_len| { + // If they shared equivalent prefixes, then compare lengths and invert the + // result because longer patterns are less general than shorter patterns. + a_len.cmp(&b_len).reverse() + }) +} + +fn compare_match_op_generality( + paths: &PathInterner, + a: linear::MatchOp, + b: linear::MatchOp, +) -> Ordering { + use linear::MatchOp::*; + match (a, b) { + (Opcode { path: a }, Opcode { path: b }) => compare_paths(paths, a, b), + (Opcode { .. }, _) => Ordering::Less, + (_, Opcode { .. }) => Ordering::Greater, + + (IntegerValue { path: a }, IntegerValue { path: b }) => compare_paths(paths, a, b), + (IntegerValue { .. }, _) => Ordering::Less, + (_, IntegerValue { .. }) => Ordering::Greater, + + (BooleanValue { path: a }, BooleanValue { path: b }) => compare_paths(paths, a, b), + (BooleanValue { .. }, _) => Ordering::Less, + (_, BooleanValue { .. }) => Ordering::Greater, + + (ConditionCode { path: a }, ConditionCode { path: b }) => compare_paths(paths, a, b), + (ConditionCode { .. 
}, _) => Ordering::Less, + (_, ConditionCode { .. }) => Ordering::Greater, + + (IsConst { path: a }, IsConst { path: b }) => compare_paths(paths, a, b), + (IsConst { .. }, _) => Ordering::Less, + (_, IsConst { .. }) => Ordering::Greater, + + ( + Eq { + path_a: pa1, + path_b: pb1, + }, + Eq { + path_a: pa2, + path_b: pb2, + }, + ) => compare_paths(paths, pa1, pa2).then(compare_paths(paths, pb1, pb2)), + (Eq { .. }, _) => Ordering::Less, + (_, Eq { .. }) => Ordering::Greater, + + (IsPowerOfTwo { path: a }, IsPowerOfTwo { path: b }) => compare_paths(paths, a, b), + (IsPowerOfTwo { .. }, _) => Ordering::Less, + (_, IsPowerOfTwo { .. }) => Ordering::Greater, + + (BitWidth { path: a }, BitWidth { path: b }) => compare_paths(paths, a, b), + (BitWidth { .. }, _) => Ordering::Less, + (_, BitWidth { .. }) => Ordering::Greater, + + (FitsInNativeWord { path: a }, FitsInNativeWord { path: b }) => compare_paths(paths, a, b), + (FitsInNativeWord { .. }, _) => Ordering::Less, + (_, FitsInNativeWord { .. }) => Ordering::Greater, + + (Nop, Nop) => Ordering::Equal, + } +} + +fn compare_paths(paths: &PathInterner, a: PathId, b: PathId) -> Ordering { + if a == b { + Ordering::Equal + } else { + let a = paths.lookup(a); + let b = paths.lookup(b); + a.0.cmp(&b.0) + } +} + +/// Are the given optimizations sorted from least to most general? +pub(crate) fn is_sorted_by_generality(opts: &linear::Optimizations) -> bool { + opts.optimizations + .windows(2) + .all(|w| compare_optimization_generality(&opts.paths, &w[0], &w[1]) <= Ordering::Equal) +} + +/// Are the given optimizations sorted lexicographically? +pub(crate) fn is_sorted_lexicographically(opts: &linear::Optimizations) -> bool { + opts.optimizations.windows(2).all(|w| { + compare_optimizations(&opts.paths, &w[0], &w[1], |a_len, b_len| a_len.cmp(&b_len)) + <= Ordering::Equal + }) +} + +/// Ensure that we emit match operations in a consistent order. 
+/// +/// There are many linear optimizations, each of which have their own sequence +/// of match operations that need to be tested. But when interpreting the +/// automata against some instructions, we only perform a single sequence of +/// match operations, and at any given moment, we only want one match operation +/// to interpret next. This means that two optimizations that are next to each +/// other in the sorting must have their shared prefixes diverge on an +/// **expected result edge**, not on which match operation to preform next. And +/// if they have zero shared prefix, then we need to create one, that +/// immediately divereges on the expected result. +/// +/// For example, consider these two patterns that don't have any shared prefix: +/// +/// ```lisp +/// (=> (iadd $x $y) ...) +/// (=> $C ...) +/// ``` +/// +/// These produce the following linear match operations and expected results: +/// +/// ```text +/// opcode @ 0 --iadd--> +/// is-const? @ 0 --true--> +/// ``` +/// +/// In order to ensure that we only have one match operation to interpret at any +/// given time when evaluating the automata, this pass transforms the second +/// optimization so that it shares a prefix match operation, but diverges on the +/// expected result: +/// +/// ```text +/// opcode @ 0 --iadd--> +/// opcode @ 0 --(else)--> is-const? 
@ 0 --true--> +/// ``` +pub fn match_in_same_order(opts: &mut linear::Optimizations) { + assert!(!opts.optimizations.is_empty()); + + let mut prefix = vec![]; + + for opt in &mut opts.optimizations { + assert!(!opt.increments.is_empty()); + + let mut old_increments = opt.increments.iter().peekable(); + let mut new_increments = vec![]; + + for (last_op, last_expected) in &prefix { + match old_increments.peek() { + None => { + break; + } + Some(inc) if *last_op == inc.operation => { + let inc = old_increments.next().unwrap(); + new_increments.push(inc.clone()); + if inc.expected != *last_expected { + break; + } + } + Some(_) => { + new_increments.push(linear::Increment { + operation: *last_op, + expected: Err(linear::Else), + actions: vec![], + }); + if last_expected.is_ok() { + break; + } + } + } + } + + new_increments.extend(old_increments.cloned()); + assert!(new_increments.len() >= opt.increments.len()); + opt.increments = new_increments; + + prefix.clear(); + prefix.extend( + opt.increments + .iter() + .map(|inc| (inc.operation, inc.expected)), + ); + } + + // Should still be sorted after this pass. + debug_assert!(is_sorted_by_generality(&opts)); +} + +/// 99.99% of nops are unnecessary; remove them. +/// +/// They're only needed for when a LHS pattern is just a variable, and that's +/// it. However, it is easier to have basically unused nop matching operations +/// for the DSL's edge-cases than it is to try and statically eliminate their +/// existence completely. So we just emit nop match operations for all variable +/// patterns, and then in this post-processing pass, we fuse them and their +/// actions with their preceding increment. 
+pub fn remove_unnecessary_nops(opts: &mut linear::Optimizations) { + for opt in &mut opts.optimizations { + if opt.increments.len() < 2 { + debug_assert!(!opt.increments.is_empty()); + continue; + } + + for i in (1..opt.increments.len()).rev() { + if let linear::MatchOp::Nop = opt.increments[i].operation { + let nop = opt.increments.remove(i); + opt.increments[i - 1].actions.extend(nop.actions); + } + } + } +} + +#[cfg(test)] +mod tests { + use super::*; + use crate::ast::*; + use peepmatic_runtime::{ + linear::{bool_to_match_result, Else, MatchOp::*, MatchResult}, + operator::Operator, + paths::*, + }; + use std::num::NonZeroU32; + + #[test] + fn ok_non_zero_less_than_err_else() { + assert!(Ok(NonZeroU32::new(1).unwrap()) < Err(Else)); + } + + macro_rules! sorts_to { + ($test_name:ident, $source:expr, $make_expected:expr) => { + #[test] + #[allow(unused_variables)] + fn $test_name() { + let buf = wast::parser::ParseBuffer::new($source).expect("should lex OK"); + + let opts = match wast::parser::parse::(&buf) { + Ok(opts) => opts, + Err(mut e) => { + e.set_path(std::path::Path::new(stringify!($test_name))); + e.set_text($source); + eprintln!("{}", e); + panic!("should parse OK") + } + }; + + if let Err(mut e) = crate::verify(&opts) { + e.set_path(std::path::Path::new(stringify!($test_name))); + e.set_text($source); + eprintln!("{}", e); + panic!("should verify OK") + } + + let mut opts = crate::linearize(&opts); + + let before = opts + .optimizations + .iter() + .map(|o| { + o.increments + .iter() + .map(|i| format!("{:?} == {:?}", i.operation, i.expected)) + .collect::>() + }) + .collect::>(); + eprintln!("before = {:#?}", before); + + sort_least_to_most_general(&mut opts); + + let after = opts + .optimizations + .iter() + .map(|o| { + o.increments + .iter() + .map(|i| format!("{:?} == {:?}", i.operation, i.expected)) + .collect::>() + }) + .collect::>(); + eprintln!("after = {:#?}", before); + + let linear::Optimizations { + mut paths, + mut integers, + 
optimizations, + } = opts; + + let actual: Vec> = optimizations + .iter() + .map(|o| { + o.increments + .iter() + .map(|i| (i.operation, i.expected)) + .collect() + }) + .collect(); + + let mut p = |p: &[u8]| paths.intern(Path::new(&p)); + let mut i = |i: u64| Ok(integers.intern(i).into()); + let expected = $make_expected(&mut p, &mut i); + + assert_eq!(expected, actual); + } + }; + } + + macro_rules! match_in_same_order { + ($test_name:ident, $source:expr, $make_expected:expr) => { + #[test] + #[allow(unused_variables)] + fn $test_name() { + let buf = wast::parser::ParseBuffer::new($source).expect("should lex OK"); + + let opts = match wast::parser::parse::(&buf) { + Ok(opts) => opts, + Err(mut e) => { + e.set_path(std::path::Path::new(stringify!($test_name))); + e.set_text($source); + eprintln!("{}", e); + panic!("should parse OK") + } + }; + + if let Err(mut e) = crate::verify(&opts) { + e.set_path(std::path::Path::new(stringify!($test_name))); + e.set_text($source); + eprintln!("{}", e); + panic!("should verify OK") + } + + let mut opts = crate::linearize(&opts); + sort_least_to_most_general(&mut opts); + + let before = opts + .optimizations + .iter() + .map(|o| { + o.increments + .iter() + .map(|i| format!("{:?} == {:?}", i.operation, i.expected)) + .collect::>() + }) + .collect::>(); + eprintln!("before = {:#?}", before); + + match_in_same_order(&mut opts); + + let after = opts + .optimizations + .iter() + .map(|o| { + o.increments + .iter() + .map(|i| format!("{:?} == {:?}", i.operation, i.expected)) + .collect::>() + }) + .collect::>(); + eprintln!("after = {:#?}", before); + + let linear::Optimizations { + mut paths, + mut integers, + optimizations, + } = opts; + + let actual: Vec> = optimizations + .iter() + .map(|o| { + o.increments + .iter() + .map(|i| (i.operation, i.expected)) + .collect() + }) + .collect(); + + let mut p = |p: &[u8]| paths.intern(Path::new(&p)); + let mut i = |i: u64| Ok(integers.intern(i).into()); + let expected = 
$make_expected(&mut p, &mut i); + + assert_eq!(expected, actual); + } + }; + } + + sorts_to!( + test_sort_least_to_most_general, + " +(=> $x 0) +(=> (iadd $x $y) 0) +(=> (iadd $x $x) 0) +(=> (iadd $x $C) 0) +(=> (when (iadd $x $C) (is-power-of-two $C)) 0) +(=> (when (iadd $x $C) (bit-width $x 32)) 0) +(=> (iadd $x 42) 0) +(=> (iadd $x (iadd $y $z)) 0) +", + |p: &mut dyn FnMut(&[u8]) -> PathId, i: &mut dyn FnMut(u64) -> MatchResult| vec![ + vec![ + ( + Opcode { path: p(&[0]) }, + Ok(NonZeroU32::new(Operator::Iadd as _).unwrap()) + ), + (Nop, Err(Else)), + ( + Opcode { path: p(&[0, 1]) }, + Ok(NonZeroU32::new(Operator::Iadd as _).unwrap()) + ), + (Nop, Err(Else)), + (Nop, Err(Else)), + ], + vec![ + ( + Opcode { path: p(&[0]) }, + Ok(NonZeroU32::new(Operator::Iadd as _).unwrap()) + ), + (Nop, Err(Else)), + (IntegerValue { path: p(&[0, 1]) }, i(42)) + ], + vec![ + ( + Opcode { path: p(&[0]) }, + Ok(NonZeroU32::new(Operator::Iadd as _).unwrap()) + ), + (Nop, Err(Else)), + (IsConst { path: p(&[0, 1]) }, bool_to_match_result(true)), + ( + IsPowerOfTwo { path: p(&[0, 1]) }, + bool_to_match_result(true) + ) + ], + vec![ + ( + Opcode { path: p(&[0]) }, + Ok(NonZeroU32::new(Operator::Iadd as _).unwrap()) + ), + (Nop, Err(Else)), + (IsConst { path: p(&[0, 1]) }, bool_to_match_result(true)), + ( + BitWidth { path: p(&[0, 0]) }, + Ok(NonZeroU32::new(32).unwrap()) + ) + ], + vec![ + ( + Opcode { path: p(&[0]) }, + Ok(NonZeroU32::new(Operator::Iadd as _).unwrap()) + ), + (Nop, Err(Else)), + (IsConst { path: p(&[0, 1]) }, bool_to_match_result(true)) + ], + vec![ + ( + Opcode { path: p(&[0]) }, + Ok(NonZeroU32::new(Operator::Iadd as _).unwrap()) + ), + (Nop, Err(Else)), + ( + Eq { + path_a: p(&[0, 1]), + path_b: p(&[0, 0]), + }, + bool_to_match_result(true) + ) + ], + vec![ + ( + Opcode { path: p(&[0]) }, + Ok(NonZeroU32::new(Operator::Iadd as _).unwrap()) + ), + (Nop, Err(Else)), + (Nop, Err(Else)), + ], + vec![(Nop, Err(Else))] + ] + ); + + sorts_to!( + expected_edges_are_sorted, 
+ " +(=> (iadd 0 $x) $x) +(=> (iadd $x 0) $x) +(=> (imul 1 $x) $x) +(=> (imul $x 1) $x) +(=> (imul 2 $x) (ishl $x 1)) +(=> (imul $x 2) (ishl $x 1)) +", + |p: &mut dyn FnMut(&[u8]) -> PathId, i: &mut dyn FnMut(u64) -> MatchResult| vec![ + vec![ + ( + Opcode { path: p(&[0]) }, + Ok(NonZeroU32::new(Operator::Imul as _).unwrap()) + ), + (IntegerValue { path: p(&[0, 0]) }, i(2)), + (Nop, Err(Else)) + ], + vec![ + ( + Opcode { path: p(&[0]) }, + Ok(NonZeroU32::new(Operator::Imul as _).unwrap()) + ), + (IntegerValue { path: p(&[0, 0]) }, i(1)), + (Nop, Err(Else)) + ], + vec![ + ( + Opcode { path: p(&[0]) }, + Ok(NonZeroU32::new(Operator::Imul as _).unwrap()) + ), + (Nop, Err(Else)), + (IntegerValue { path: p(&[0, 1]) }, i(2)) + ], + vec![ + ( + Opcode { path: p(&[0]) }, + Ok(NonZeroU32::new(Operator::Imul as _).unwrap()) + ), + (Nop, Err(Else)), + (IntegerValue { path: p(&[0, 1]) }, i(1)) + ], + vec![ + ( + Opcode { path: p(&[0]) }, + Ok(NonZeroU32::new(Operator::Iadd as _).unwrap()) + ), + (IntegerValue { path: p(&[0, 0]) }, i(0)), + (Nop, Err(Else)) + ], + vec![ + ( + Opcode { path: p(&[0]) }, + Ok(NonZeroU32::new(Operator::Iadd as _).unwrap()) + ), + (Nop, Err(Else)), + (IntegerValue { path: p(&[0, 1]) }, i(0)) + ] + ] + ); + + sorts_to!( + sort_redundant_bor, + " + (=> (bor (bor $x $y) $x) + (bor $x $y)) + + (=> (bor (bor $x $y) $y) + (bor $x $y)) + ", + |p: &mut dyn FnMut(&[u8]) -> PathId, i: &mut dyn FnMut(u64) -> MatchResult| vec![ + vec![ + ( + Opcode { path: p(&[0]) }, + Ok(NonZeroU32::new(Operator::Bor as _).unwrap()) + ), + ( + Opcode { path: p(&[0, 0]) }, + Ok(NonZeroU32::new(Operator::Bor as _).unwrap()) + ), + (Nop, Err(Else)), + (Nop, Err(Else)), + ( + Eq { + path_a: p(&[0, 1]), + path_b: p(&[0, 0, 0]), + }, + bool_to_match_result(true) + ), + ], + vec![ + ( + Opcode { path: p(&[0]) }, + Ok(NonZeroU32::new(Operator::Bor as _).unwrap()) + ), + ( + Opcode { path: p(&[0, 0]) }, + Ok(NonZeroU32::new(Operator::Bor as _).unwrap()) + ), + (Nop, Err(Else)), + (Nop, 
Err(Else)), + ( + Eq { + path_a: p(&[0, 1]), + path_b: p(&[0, 0, 1]), + }, + bool_to_match_result(true) + ), + ], + ] + ); + + match_in_same_order!( + match_in_same_order_redundant_bor, + " + (=> (bor (bor $x $y) $x) + (bor $x $y)) + + (=> (bor (bor $x $y) $y) + (bor $x $y)) + ", + |p: &mut dyn FnMut(&[u8]) -> PathId, i: &mut dyn FnMut(u64) -> MatchResult| vec![ + vec![ + ( + Opcode { path: p(&[0]) }, + Ok(NonZeroU32::new(Operator::Bor as _).unwrap()) + ), + ( + Opcode { path: p(&[0, 0]) }, + Ok(NonZeroU32::new(Operator::Bor as _).unwrap()) + ), + (Nop, Err(Else)), + (Nop, Err(Else)), + ( + Eq { + path_a: p(&[0, 1]), + path_b: p(&[0, 0, 0]), + }, + bool_to_match_result(true) + ), + ], + vec![ + ( + Opcode { path: p(&[0]) }, + Ok(NonZeroU32::new(Operator::Bor as _).unwrap()) + ), + ( + Opcode { path: p(&[0, 0]) }, + Ok(NonZeroU32::new(Operator::Bor as _).unwrap()) + ), + (Nop, Err(Else)), + (Nop, Err(Else)), + ( + Eq { + path_a: p(&[0, 1]), + path_b: p(&[0, 0, 0]), + }, + Err(Else), + ), + ( + Eq { + path_a: p(&[0, 1]), + path_b: p(&[0, 0, 1]), + }, + bool_to_match_result(true) + ), + ], + ] + ); +} diff --git a/cranelift/peepmatic/src/linearize.rs b/cranelift/peepmatic/src/linearize.rs new file mode 100644 index 0000000000..9f7c1fe602 --- /dev/null +++ b/cranelift/peepmatic/src/linearize.rs @@ -0,0 +1,812 @@ +//! Convert an AST into its linear equivalent. +//! +//! Convert each optimization's left-hand side into a linear series of match +//! operations. This makes it easy to create an automaton, because automatas +//! typically deal with a linear sequence of inputs. The optimization's +//! right-hand side is built incrementally inside actions that are taken on +//! transitions between match operations. +//! +//! See `crates/runtime/src/linear.rs` for the linear datatype definitions. +//! +//! ## Example +//! +//! As an example, if we linearize this optimization: +//! +//! ```lisp +//! (=> (when (imul $x $C) +//! (is-power-of-two $C)) +//! (ishl $x $(log2 C))) +//! 
``` +//! +//! Then we should get the following linear chain of "increments": +//! +//! ```ignore +//! [ +//! // ( Match Operation, Expected Value, Actions ) +//! ( Opcode@0, imul, [$x = GetLhs@0.0, $C = GetLhs@0.1, ...] ), +//! ( IsConst(C), true, [] ), +//! ( IsPowerOfTwo(C), true, [] ), +//! ] +//! ``` +//! +//! Each increment will essentially become a state and a transition out of that +//! state in the final automata, along with the actions to perform when taking +//! that transition. The actions record the scope of matches from the left-hand +//! side and also incrementally build the right-hand side's instructions. (Note +//! that we've elided the actions that build up the optimization's right-hand +//! side in this example.) +//! +//! ## General Principles +//! +//! Here are the general principles that linearization should adhere to: +//! +//! * Actions should be pushed as early in the optimization's increment chain as +//! they can be. This means the tail has fewer side effects, and is therefore +//! more likely to be share-able with other optimizations in the automata that +//! we build. +//! +//! * RHS actions cannot reference matches from the LHS until they've been +//! defined. And finally, an RHS operation's operands must be defined before +//! the RHS operation itself. In general, definitions must come before uses! +//! +//! * Shorter increment chains are better! This means fewer tests when matching +//! left-hand sides, and a more-compact, more-cache-friendly automata, and +//! ultimately, a faster automata. +//! +//! * An increment's match operation should be a switch rather than a predicate +//! that returns a boolean. For example, we switch on an instruction's opcode, +//! rather than ask whether this operation is an `imul`. This allows for more +//! prefix sharing in the automata, which (again) makes it more compact and +//! more cache friendly. +//! +//! ## Implementation Overview +//! +//! 
We emit match operations for a left-hand side's pattern structure, followed +//! by match operations for its preconditions on that structure. This ensures +//! that anything bound in the pattern is defined before it is used in a +//! precondition. +//! +//! When matching the pattern structure, we emit matching operations in a +//! pre-order traversal of the pattern. This ensures that we've already matched +//! an operation before we consider its operands, and therefore we already know +//! the operands exist. See `PatternPreOrder` for details. +//! +//! As we define the match operations for a pattern, we remember the path where +//! each LHS id first occurred. These will later be reused when building the RHS +//! actions. See `LhsIdToPath` for details. +//! +//! After we've generated the match operations and expected result of those +//! match operations, then we generate the right-hand side actions. The +//! right-hand side is built up in a post-order traversal, so that operands are +//! defined before they are used. See `RhsPostOrder` and `RhsBuilder` for +//! details. +//! +//! Finally, see `linearize_optimization` for the main AST optimization into +//! linear optimization translation function. + +use crate::ast::*; +use crate::traversals::Dfs; +use peepmatic_runtime::{ + integer_interner::IntegerInterner, + linear, + paths::{Path, PathId, PathInterner}, +}; +use std::collections::BTreeMap; +use std::convert::TryInto; +use std::num::NonZeroU32; +use wast::Id; + +/// Translate the given AST optimizations into linear optimizations.
+pub fn linearize(opts: &Optimizations) -> linear::Optimizations { + let mut optimizations = vec![]; + let mut paths = PathInterner::new(); + let mut integers = IntegerInterner::new(); + for opt in &opts.optimizations { + let lin_opt = linearize_optimization(&mut paths, &mut integers, opt); + optimizations.push(lin_opt); + } + linear::Optimizations { + optimizations, + paths, + integers, + } +} + +/// Translate an AST optimization into a linear optimization! +fn linearize_optimization( + paths: &mut PathInterner, + integers: &mut IntegerInterner, + opt: &Optimization, +) -> linear::Optimization { + let mut increments: Vec = vec![]; + + let mut lhs_id_to_path = LhsIdToPath::new(); + + // We do a pre-order traversal of the LHS because we don't know whether a + // child actually exists to match on until we've matched its parent, and we + // don't want to emit matching operations on things that might not exist! + let mut patterns = PatternPreOrder::new(&opt.lhs.pattern); + while let Some((path, pattern)) = patterns.next(paths) { + // Create the matching parts of an `Increment` for this part of the + // pattern, without any actions yet. + let (operation, expected) = pattern.to_linear_match_op(integers, &lhs_id_to_path, path); + increments.push(linear::Increment { + operation, + expected, + actions: vec![], + }); + + lhs_id_to_path.remember_path_to_pattern_ids(pattern, path); + + // Some operations require type ascriptions for us to infer the correct + // bit width of their results: `ireduce`, `sextend`, `uextend`, etc. + // When there is such a type ascription in the pattern, insert another + // increment that checks the instruction-being-matched's bit width. + if let Pattern::Operation(Operation { r#type, .. 
}) = pattern { + if let Some(w) = r#type.get().and_then(|ty| ty.bit_width.fixed_width()) { + debug_assert!(w != 0, "All fixed-width bit widths are non-zero"); + let expected = Ok(unsafe { NonZeroU32::new_unchecked(w as u32) }); + + increments.push(linear::Increment { + operation: linear::MatchOp::BitWidth { path }, + expected, + actions: vec![], + }); + } + } + } + + // Now that we've added all the increments for the LHS pattern, add the + // increments for its preconditions. + for pre in &opt.lhs.preconditions { + increments.push(pre.to_linear_increment(&lhs_id_to_path)); + } + + assert!(!increments.is_empty()); + + // Finally, generate the RHS-building actions and attach them to the first increment. + let mut rhs_builder = RhsBuilder::new(&opt.rhs); + rhs_builder.add_rhs_build_actions(integers, &lhs_id_to_path, &mut increments[0].actions); + + linear::Optimization { increments } +} + +/// A post-order, depth-first traversal of right-hand sides. +/// +/// Does not maintain any extra state about the traversal, such as where in the +/// tree each yielded node comes from. +struct RhsPostOrder<'a> { + dfs: Dfs<'a>, +} + +impl<'a> RhsPostOrder<'a> { + fn new(rhs: &'a Rhs<'a>) -> Self { + Self { dfs: Dfs::new(rhs) } + } +} + +impl<'a> Iterator for RhsPostOrder<'a> { + type Item = &'a Rhs<'a>; + + fn next(&mut self) -> Option<&'a Rhs<'a>> { + use crate::traversals::TraversalEvent as TE; + loop { + match self.dfs.next()? { + (TE::Exit, DynAstRef::Rhs(rhs)) => return Some(rhs), + _ => continue, + } + } + } +} + +/// A pre-order, depth-first traversal of left-hand side patterns. +/// +/// Keeps track of the path to each pattern, and yields it along side the +/// pattern AST node. 
+struct PatternPreOrder<'a> { + last_child: Option, + path: Vec, + dfs: Dfs<'a>, +} + +impl<'a> PatternPreOrder<'a> { + fn new(pattern: &'a Pattern<'a>) -> Self { + Self { + last_child: None, + path: vec![], + dfs: Dfs::new(pattern), + } + } + + fn next(&mut self, paths: &mut PathInterner) -> Option<(PathId, &'a Pattern<'a>)> { + use crate::traversals::TraversalEvent as TE; + loop { + match self.dfs.next()? { + (TE::Enter, DynAstRef::Pattern(pattern)) => { + let last_child = self.last_child.take(); + self.path.push(match last_child { + None => 0, + Some(c) => { + assert!( + c < std::u8::MAX, + "operators must have less than or equal u8::MAX arity" + ); + c + 1 + } + }); + let path = paths.intern(Path(&self.path)); + return Some((path, pattern)); + } + (TE::Exit, DynAstRef::Pattern(_)) => { + self.last_child = Some( + self.path + .pop() + .expect("should always have a non-empty path during traversal"), + ); + } + _ => {} + } + } + } +} + +/// A map from left-hand side identifiers to the path in the left-hand side +/// where they first occurred. +struct LhsIdToPath<'a> { + id_to_path: BTreeMap<&'a str, PathId>, +} + +impl<'a> LhsIdToPath<'a> { + /// Construct a new, empty `LhsIdToPath`. + fn new() -> Self { + Self { + id_to_path: Default::default(), + } + } + + /// Have we already seen the given identifier? + fn get_first_occurrence(&self, id: &Id) -> Option { + self.id_to_path.get(id.name()).copied() + } + + /// Get the path within the left-hand side pattern where we first saw the + /// given AST id. + /// + /// ## Panics + /// + /// Panics if the given AST id has not already been canonicalized. + fn unwrap_first_occurrence(&self, id: &Id) -> PathId { + self.id_to_path[id.name()] + } + + /// Remember the path to any LHS ids used in the given pattern. + fn remember_path_to_pattern_ids(&mut self, pattern: &'a Pattern<'a>, path: PathId) { + match pattern { + // If this is the first time we've seen an identifier defined on the + // left-hand side, remember it. 
+ Pattern::Variable(Variable { id, .. }) | Pattern::Constant(Constant { id, .. }) => { + self.id_to_path.entry(id.name()).or_insert(path); + } + _ => {} + } + } +} + +/// An `RhsBuilder` emits the actions for building the right-hand side +/// instructions. +struct RhsBuilder<'a> { + // We do a post order traversal of the RHS because an RHS instruction cannot + // be created until after all of its operands are created. + rhs_post_order: RhsPostOrder<'a>, + + // A map from a right-hand side's span to its `linear::RhsId`. This is used + // by RHS-construction actions to reference operands. In practice the + // `RhsId` is roughly equivalent to its index in the post-order traversal of + // the RHS. + rhs_span_to_id: BTreeMap, +} + +impl<'a> RhsBuilder<'a> { + /// Create a new builder for the given right-hand side. + fn new(rhs: &'a Rhs<'a>) -> Self { + let rhs_post_order = RhsPostOrder::new(rhs); + let rhs_span_to_id = Default::default(); + Self { + rhs_post_order, + rhs_span_to_id, + } + } + + /// Get the `linear::RhsId` for the given right-hand side. + /// + /// ## Panics + /// + /// Panics if we haven't already emitted the action for building this RHS's + /// instruction. + fn get_rhs_id(&self, rhs: &Rhs) -> linear::RhsId { + self.rhs_span_to_id[&rhs.span()] + } + + /// Create actions for building up this right-hand side of an optimization. + /// + /// Because we are walking the right-hand side with a post-order traversal, + /// we know that we already created an instruction's operands that are + /// defined in the right-hand side, before we get to the parent instruction. 
+ fn add_rhs_build_actions( + &mut self, + integers: &mut IntegerInterner, + lhs_id_to_path: &LhsIdToPath, + actions: &mut Vec, + ) { + while let Some(rhs) = self.rhs_post_order.next() { + actions.push(self.rhs_to_linear_action(integers, lhs_id_to_path, rhs)); + let id = linear::RhsId(self.rhs_span_to_id.len().try_into().unwrap()); + self.rhs_span_to_id.insert(rhs.span(), id); + } + } + + fn rhs_to_linear_action( + &self, + integers: &mut IntegerInterner, + lhs_id_to_path: &LhsIdToPath, + rhs: &Rhs, + ) -> linear::Action { + match rhs { + Rhs::ValueLiteral(ValueLiteral::Integer(i)) => linear::Action::MakeIntegerConst { + value: integers.intern(i.value as u64), + bit_width: i + .bit_width + .get() + .expect("should be initialized after type checking"), + }, + Rhs::ValueLiteral(ValueLiteral::Boolean(b)) => linear::Action::MakeBooleanConst { + value: b.value, + bit_width: b + .bit_width + .get() + .expect("should be initialized after type checking"), + }, + Rhs::ValueLiteral(ValueLiteral::ConditionCode(ConditionCode { cc, .. })) => { + linear::Action::MakeConditionCode { cc: *cc } + } + Rhs::Variable(Variable { id, .. }) | Rhs::Constant(Constant { id, .. 
}) => { + let path = lhs_id_to_path.unwrap_first_occurrence(id); + linear::Action::GetLhs { path } + } + Rhs::Unquote(unq) => match unq.operands.len() { + 1 => linear::Action::UnaryUnquote { + operator: unq.operator, + operand: self.get_rhs_id(&unq.operands[0]), + }, + 2 => linear::Action::BinaryUnquote { + operator: unq.operator, + operands: [ + self.get_rhs_id(&unq.operands[0]), + self.get_rhs_id(&unq.operands[1]), + ], + }, + n => unreachable!("no unquote operators of arity {}", n), + }, + Rhs::Operation(op) => match op.operands.len() { + 1 => linear::Action::MakeUnaryInst { + operator: op.operator, + r#type: op + .r#type + .get() + .expect("should be initialized after type checking"), + operand: self.get_rhs_id(&op.operands[0]), + }, + 2 => linear::Action::MakeBinaryInst { + operator: op.operator, + r#type: op + .r#type + .get() + .expect("should be initialized after type checking"), + operands: [ + self.get_rhs_id(&op.operands[0]), + self.get_rhs_id(&op.operands[1]), + ], + }, + 3 => linear::Action::MakeTernaryInst { + operator: op.operator, + r#type: op + .r#type + .get() + .expect("should be initialized after type checking"), + operands: [ + self.get_rhs_id(&op.operands[0]), + self.get_rhs_id(&op.operands[1]), + self.get_rhs_id(&op.operands[2]), + ], + }, + n => unreachable!("no instructions of arity {}", n), + }, + } + } +} + +impl Precondition<'_> { + /// Convert this precondition into a `linear::Increment`. + fn to_linear_increment(&self, lhs_id_to_path: &LhsIdToPath) -> linear::Increment { + match self.constraint { + Constraint::IsPowerOfTwo => { + let id = match &self.operands[0] { + ConstraintOperand::Constant(Constant { id, .. 
}) => id, + _ => unreachable!("checked in verification"), + }; + let path = lhs_id_to_path.unwrap_first_occurrence(&id); + linear::Increment { + operation: linear::MatchOp::IsPowerOfTwo { path }, + expected: linear::bool_to_match_result(true), + actions: vec![], + } + } + Constraint::BitWidth => { + let id = match &self.operands[0] { + ConstraintOperand::Constant(Constant { id, .. }) + | ConstraintOperand::Variable(Variable { id, .. }) => id, + _ => unreachable!("checked in verification"), + }; + let path = lhs_id_to_path.unwrap_first_occurrence(&id); + + let width = match &self.operands[1] { + ConstraintOperand::ValueLiteral(ValueLiteral::Integer(Integer { + value, + .. + })) => *value, + _ => unreachable!("checked in verification"), + }; + + assert!(0 < width && width <= 128); + assert!((width as u8).is_power_of_two()); + let expected = Ok(unsafe { NonZeroU32::new_unchecked(width as u32) }); + + linear::Increment { + operation: linear::MatchOp::BitWidth { path }, + expected, + actions: vec![], + } + } + Constraint::FitsInNativeWord => { + let id = match &self.operands[0] { + ConstraintOperand::Constant(Constant { id, .. }) + | ConstraintOperand::Variable(Variable { id, .. }) => id, + _ => unreachable!("checked in verification"), + }; + let path = lhs_id_to_path.unwrap_first_occurrence(&id); + linear::Increment { + operation: linear::MatchOp::FitsInNativeWord { path }, + expected: linear::bool_to_match_result(true), + actions: vec![], + } + } + } + } +} + +impl Pattern<'_> { + /// Convert this pattern into its linear match operation and the expected + /// result of that operation. + /// + /// NB: these mappings to expected values need to stay sync'd with the + /// runtime! + fn to_linear_match_op( + &self, + integers: &mut IntegerInterner, + lhs_id_to_path: &LhsIdToPath, + path: PathId, + ) -> (linear::MatchOp, linear::MatchResult) { + match self { + Pattern::ValueLiteral(ValueLiteral::Integer(Integer { value, .. 
})) => ( + linear::MatchOp::IntegerValue { path }, + Ok(integers.intern(*value as u64).into()), + ), + Pattern::ValueLiteral(ValueLiteral::Boolean(Boolean { value, .. })) => ( + linear::MatchOp::BooleanValue { path }, + linear::bool_to_match_result(*value), + ), + Pattern::ValueLiteral(ValueLiteral::ConditionCode(ConditionCode { cc, .. })) => { + let cc = *cc as u32; + debug_assert!(cc != 0, "no `ConditionCode` variants are zero"); + let expected = Ok(unsafe { NonZeroU32::new_unchecked(cc) }); + (linear::MatchOp::ConditionCode { path }, expected) + } + Pattern::Constant(Constant { id, .. }) => { + if let Some(path_b) = lhs_id_to_path.get_first_occurrence(id) { + debug_assert!(path != path_b); + ( + linear::MatchOp::Eq { + path_a: path, + path_b, + }, + linear::bool_to_match_result(true), + ) + } else { + ( + linear::MatchOp::IsConst { path }, + linear::bool_to_match_result(true), + ) + } + } + Pattern::Variable(Variable { id, .. }) => { + if let Some(path_b) = lhs_id_to_path.get_first_occurrence(id) { + debug_assert!(path != path_b); + ( + linear::MatchOp::Eq { + path_a: path, + path_b, + }, + linear::bool_to_match_result(true), + ) + } else { + (linear::MatchOp::Nop, Err(linear::Else)) + } + } + Pattern::Operation(op) => { + let op = op.operator as u32; + debug_assert!(op != 0, "no `Operator` variants are zero"); + let expected = Ok(unsafe { NonZeroU32::new_unchecked(op) }); + (linear::MatchOp::Opcode { path }, expected) + } + } + } +} + +#[cfg(test)] +mod tests { + use super::*; + use peepmatic_runtime::{ + integer_interner::IntegerId, + linear::{bool_to_match_result, Action::*, Else, MatchOp::*}, + operator::Operator, + r#type::{BitWidth, Kind, Type}, + }; + + macro_rules! 
linearizes_to { + ($name:ident, $source:expr, $make_expected:expr $(,)* ) => { + #[test] + fn $name() { + let buf = wast::parser::ParseBuffer::new($source).expect("should lex OK"); + + let opts = match wast::parser::parse::(&buf) { + Ok(opts) => opts, + Err(mut e) => { + e.set_path(std::path::Path::new(stringify!($name))); + e.set_text($source); + eprintln!("{}", e); + panic!("should parse OK") + } + }; + + assert_eq!( + opts.optimizations.len(), + 1, + "`linearizes_to!` only supports a single optimization; split the big test into \ + multiple small tests" + ); + + if let Err(mut e) = crate::verify(&opts) { + e.set_path(std::path::Path::new(stringify!($name))); + e.set_text($source); + eprintln!("{}", e); + panic!("should verify OK") + } + + let mut paths = PathInterner::new(); + let mut p = |p: &[u8]| paths.intern(Path::new(&p)); + + let mut integers = IntegerInterner::new(); + let mut i = |i: u64| integers.intern(i); + + #[allow(unused_variables)] + let make_expected: fn( + &mut dyn FnMut(&[u8]) -> PathId, + &mut dyn FnMut(u64) -> IntegerId, + ) -> Vec = $make_expected; + let expected = make_expected(&mut p, &mut i); + dbg!(&expected); + + let actual = linearize_optimization(&mut paths, &mut integers, &opts.optimizations[0]); + dbg!(&actual.increments); + + assert_eq!(expected, actual.increments); + } + }; + } + + linearizes_to!( + mul_by_pow2_into_shift, + " +(=> (when (imul $x $C) + (is-power-of-two $C)) + (ishl $x $C)) + ", + |p, i| vec![ + linear::Increment { + operation: Opcode { path: p(&[0]) }, + expected: Ok(NonZeroU32::new(Operator::Imul as _).unwrap()), + actions: vec![ + GetLhs { path: p(&[0, 0]) }, + GetLhs { path: p(&[0, 1]) }, + MakeBinaryInst { + operator: Operator::Ishl, + r#type: Type { + kind: Kind::Int, + bit_width: BitWidth::Polymorphic, + }, + operands: [linear::RhsId(0), linear::RhsId(1)], + }, + ], + }, + linear::Increment { + operation: Nop, + expected: Err(Else), + actions: vec![], + }, + linear::Increment { + operation: IsConst { path: 
p(&[0, 1]) }, + expected: bool_to_match_result(true), + actions: vec![], + }, + linear::Increment { + operation: IsPowerOfTwo { path: p(&[0, 1]) }, + expected: bool_to_match_result(true), + actions: vec![], + }, + ], + ); + + linearizes_to!(variable_pattern_id_optimization, "(=> $x $x)", |p, i| vec![ + linear::Increment { + operation: Nop, + expected: Err(Else), + actions: vec![GetLhs { path: p(&[0]) }], + } + ]); + + linearizes_to!(constant_pattern_id_optimization, "(=> $C $C)", |p, i| vec![ + linear::Increment { + operation: IsConst { path: p(&[0]) }, + expected: bool_to_match_result(true), + actions: vec![GetLhs { path: p(&[0]) }], + } + ]); + + linearizes_to!( + boolean_literal_id_optimization, + "(=> true true)", + |p, i| vec![linear::Increment { + operation: BooleanValue { path: p(&[0]) }, + expected: bool_to_match_result(true), + actions: vec![MakeBooleanConst { + value: true, + bit_width: BitWidth::Polymorphic, + }], + }] + ); + + linearizes_to!(number_literal_id_optimization, "(=> 5 5)", |p, i| vec![ + linear::Increment { + operation: IntegerValue { path: p(&[0]) }, + expected: Ok(i(5).into()), + actions: vec![MakeIntegerConst { + value: i(5), + bit_width: BitWidth::Polymorphic, + }], + } + ]); + + linearizes_to!( + operation_id_optimization, + "(=> (iconst $C) (iconst $C))", + |p, i| vec![ + linear::Increment { + operation: Opcode { path: p(&[0]) }, + expected: Ok(NonZeroU32::new(Operator::Iconst as _).unwrap()), + actions: vec![ + GetLhs { path: p(&[0, 0]) }, + MakeUnaryInst { + operator: Operator::Iconst, + r#type: Type { + kind: Kind::Int, + bit_width: BitWidth::Polymorphic, + }, + operand: linear::RhsId(0), + }, + ], + }, + linear::Increment { + operation: IsConst { path: p(&[0, 0]) }, + expected: bool_to_match_result(true), + actions: vec![], + }, + ] + ); + + linearizes_to!( + redundant_bor, + "(=> (bor $x (bor $x $y)) (bor $x $y))", + |p, i| vec![ + linear::Increment { + operation: Opcode { path: p(&[0]) }, + expected: 
Ok(NonZeroU32::new(Operator::Bor as _).unwrap()), + actions: vec![ + GetLhs { path: p(&[0, 0]) }, + GetLhs { + path: p(&[0, 1, 1]), + }, + MakeBinaryInst { + operator: Operator::Bor, + r#type: Type { + kind: Kind::Int, + bit_width: BitWidth::Polymorphic, + }, + operands: [linear::RhsId(0), linear::RhsId(1)], + }, + ], + }, + linear::Increment { + operation: Nop, + expected: Err(Else), + actions: vec![], + }, + linear::Increment { + operation: Opcode { path: p(&[0, 1]) }, + expected: Ok(NonZeroU32::new(Operator::Bor as _).unwrap()), + actions: vec![], + }, + linear::Increment { + operation: Eq { + path_a: p(&[0, 1, 0]), + path_b: p(&[0, 0]), + }, + expected: bool_to_match_result(true), + actions: vec![], + }, + linear::Increment { + operation: Nop, + expected: Err(Else), + actions: vec![], + }, + ] + ); + + linearizes_to!( + large_integers, + // u64::MAX + "(=> 18446744073709551615 0)", + |p, i| vec![linear::Increment { + operation: IntegerValue { path: p(&[0]) }, + expected: Ok(i(std::u64::MAX).into()), + actions: vec![MakeIntegerConst { + value: i(0), + bit_width: BitWidth::Polymorphic, + }], + }] + ); + + linearizes_to!( + ireduce_with_type_ascription, + "(=> (ireduce{i32} $x) 0)", + |p, i| vec![ + linear::Increment { + operation: Opcode { path: p(&[0]) }, + expected: Ok(NonZeroU32::new(Operator::Ireduce as _).unwrap()), + actions: vec![MakeIntegerConst { + value: i(0), + bit_width: BitWidth::ThirtyTwo, + }], + }, + linear::Increment { + operation: linear::MatchOp::BitWidth { path: p(&[0]) }, + expected: Ok(NonZeroU32::new(32).unwrap()), + actions: vec![], + }, + linear::Increment { + operation: Nop, + expected: Err(Else), + actions: vec![], + }, + ] + ); +} diff --git a/cranelift/peepmatic/src/parser.rs b/cranelift/peepmatic/src/parser.rs new file mode 100644 index 0000000000..19ad49017c --- /dev/null +++ b/cranelift/peepmatic/src/parser.rs @@ -0,0 +1,932 @@ +/*! + +This module implements parsing the DSL text format. 
It implements the +`wast::Parse` trait for all of our AST types. + +The grammar for the DSL is given below: + +```ebnf + ::= * + + ::= '(' '=>' ')' + + ::= + | '(' 'when' * ')' + + ::= + | + | > + | + + ::= + | + + ::= 'true' | 'false' + +> ::= '(' [] * ')' + + ::= '(' * ')' + + ::= + | + | + + ::= + | + | + | + | > + + ::= '$' '(' * ')' + + ::= + | +``` + + */ + +use crate::ast::*; +use peepmatic_runtime::r#type::Type; +use std::cell::Cell; +use std::marker::PhantomData; +use wast::{ + parser::{Cursor, Parse, Parser, Peek, Result as ParseResult}, + Id, LParen, +}; + +mod tok { + use wast::{custom_keyword, custom_reserved}; + + custom_keyword!(bit_width = "bit-width"); + custom_reserved!(dollar = "$"); + custom_keyword!(r#false = "false"); + custom_keyword!(fits_in_native_word = "fits-in-native-word"); + custom_keyword!(is_power_of_two = "is-power-of-two"); + custom_reserved!(left_curly = "{"); + custom_keyword!(log2); + custom_keyword!(neg); + custom_reserved!(replace = "=>"); + custom_reserved!(right_curly = "}"); + custom_keyword!(r#true = "true"); + custom_keyword!(when); + + custom_keyword!(eq); + custom_keyword!(ne); + custom_keyword!(slt); + custom_keyword!(ult); + custom_keyword!(sge); + custom_keyword!(uge); + custom_keyword!(sgt); + custom_keyword!(ugt); + custom_keyword!(sle); + custom_keyword!(ule); + custom_keyword!(of); + custom_keyword!(nof); +} + +impl<'a> Parse<'a> for Optimizations<'a> { + fn parse(p: Parser<'a>) -> ParseResult { + let span = p.cur_span(); + let mut optimizations = vec![]; + while !p.is_empty() { + optimizations.push(p.parse()?); + } + Ok(Optimizations { + span, + optimizations, + }) + } +} + +impl<'a> Parse<'a> for Optimization<'a> { + fn parse(p: Parser<'a>) -> ParseResult { + let span = p.cur_span(); + p.parens(|p| { + p.parse::()?; + let lhs = p.parse()?; + let rhs = p.parse()?; + Ok(Optimization { span, lhs, rhs }) + }) + } +} + +impl<'a> Parse<'a> for Lhs<'a> { + fn parse(p: Parser<'a>) -> ParseResult { + let span = 
p.cur_span(); + let mut preconditions = vec![]; + if p.peek::() && p.peek2::() { + p.parens(|p| { + p.parse::()?; + let pattern = p.parse()?; + while p.peek::() { + preconditions.push(p.parse()?); + } + Ok(Lhs { + span, + pattern, + preconditions, + }) + }) + } else { + let span = p.cur_span(); + let pattern = p.parse()?; + Ok(Lhs { + span, + pattern, + preconditions, + }) + } + } +} + +impl<'a> Parse<'a> for Pattern<'a> { + fn parse(p: Parser<'a>) -> ParseResult { + if p.peek::() { + return Ok(Pattern::ValueLiteral(p.parse()?)); + } + if p.peek::() { + return Ok(Pattern::Constant(p.parse()?)); + } + if p.peek::>() { + return Ok(Pattern::Operation(p.parse()?)); + } + if p.peek::() { + return Ok(Pattern::Variable(p.parse()?)); + } + Err(p.error("expected a left-hand side pattern")) + } +} + +impl<'a> Peek for Pattern<'a> { + fn peek(c: Cursor) -> bool { + ValueLiteral::peek(c) + || Constant::peek(c) + || Variable::peek(c) + || Operation::::peek(c) + } + + fn display() -> &'static str { + "left-hand side pattern" + } +} + +impl<'a> Parse<'a> for ValueLiteral<'a> { + fn parse(p: Parser<'a>) -> ParseResult { + if let Ok(b) = p.parse::() { + return Ok(ValueLiteral::Boolean(b)); + } + if let Ok(i) = p.parse::() { + return Ok(ValueLiteral::Integer(i)); + } + if let Ok(cc) = p.parse::() { + return Ok(ValueLiteral::ConditionCode(cc)); + } + Err(p.error("expected an integer or boolean or condition code literal")) + } +} + +impl<'a> Peek for ValueLiteral<'a> { + fn peek(c: Cursor) -> bool { + c.integer().is_some() || Boolean::peek(c) || ConditionCode::peek(c) + } + + fn display() -> &'static str { + "value literal" + } +} + +impl<'a> Parse<'a> for Integer<'a> { + fn parse(p: Parser<'a>) -> ParseResult { + let span = p.cur_span(); + p.step(|c| { + if let Some((i, rest)) = c.integer() { + let (s, base) = i.val(); + let val = i64::from_str_radix(s, base) + .or_else(|_| u128::from_str_radix(s, base).map(|i| i as i64)); + return match val { + Ok(value) => Ok(( + Integer { + span, 
+ value, + bit_width: Default::default(), + marker: PhantomData, + }, + rest, + )), + Err(_) => Err(c.error("invalid integer: out of range")), + }; + } + Err(c.error("expected an integer")) + }) + } +} + +impl<'a> Parse<'a> for Boolean<'a> { + fn parse(p: Parser<'a>) -> ParseResult { + let span = p.cur_span(); + if p.parse::().is_ok() { + return Ok(Boolean { + span, + value: true, + bit_width: Default::default(), + marker: PhantomData, + }); + } + if p.parse::().is_ok() { + return Ok(Boolean { + span, + value: false, + bit_width: Default::default(), + marker: PhantomData, + }); + } + Err(p.error("expected `true` or `false`")) + } +} + +impl<'a> Peek for Boolean<'a> { + fn peek(c: Cursor) -> bool { + ::peek(c) || ::peek(c) + } + + fn display() -> &'static str { + "boolean `true` or `false`" + } +} + +impl<'a> Parse<'a> for ConditionCode<'a> { + fn parse(p: Parser<'a>) -> ParseResult { + let span = p.cur_span(); + + macro_rules! parse_cc { + ( $( $token:ident => $cc:ident, )* ) => { + $( + if p.peek::() { + p.parse::()?; + return Ok(Self { + span, + cc: peepmatic_runtime::cc::ConditionCode::$cc, + marker: PhantomData, + }); + } + )* + } + } + + parse_cc! { + eq => Eq, + ne => Ne, + slt => Slt, + ult => Ult, + sge => Sge, + uge => Uge, + sgt => Sgt, + ugt => Ugt, + sle => Sle, + ule => Ule, + of => Of, + nof => Nof, + } + + Err(p.error("expected a condition code")) + } +} + +impl<'a> Peek for ConditionCode<'a> { + fn peek(c: Cursor) -> bool { + macro_rules! peek_cc { + ( $( $token:ident, )* ) => { + false $( || ::peek(c) )* + } + } + + peek_cc! 
{ + eq, + ne, + slt, + ult, + sge, + uge, + sgt, + ugt, + sle, + ule, + of, + nof, + } + } + + fn display() -> &'static str { + "condition code" + } +} + +impl<'a> Parse<'a> for Constant<'a> { + fn parse(p: Parser<'a>) -> ParseResult { + let span = p.cur_span(); + let id = Id::parse(p)?; + if id + .name() + .chars() + .all(|c| !c.is_alphabetic() || c.is_uppercase()) + { + Ok(Constant { span, id }) + } else { + let upper = id + .name() + .chars() + .flat_map(|c| c.to_uppercase()) + .collect::(); + Err(p.error(format!( + "symbolic constants must start with an upper-case letter like ${}", + upper + ))) + } + } +} + +impl<'a> Peek for Constant<'a> { + fn peek(c: Cursor) -> bool { + if let Some((id, _rest)) = c.id() { + id.chars().all(|c| !c.is_alphabetic() || c.is_uppercase()) + } else { + false + } + } + + fn display() -> &'static str { + "symbolic constant" + } +} + +impl<'a> Parse<'a> for Variable<'a> { + fn parse(p: Parser<'a>) -> ParseResult { + let span = p.cur_span(); + let id = Id::parse(p)?; + if id + .name() + .chars() + .all(|c| !c.is_alphabetic() || c.is_lowercase()) + { + Ok(Variable { span, id }) + } else { + let lower = id + .name() + .chars() + .flat_map(|c| c.to_lowercase()) + .collect::(); + Err(p.error(format!( + "variables must start with an lower-case letter like ${}", + lower + ))) + } + } +} + +impl<'a> Peek for Variable<'a> { + fn peek(c: Cursor) -> bool { + if let Some((id, _rest)) = c.id() { + id.chars().all(|c| !c.is_alphabetic() || c.is_lowercase()) + } else { + false + } + } + + fn display() -> &'static str { + "variable" + } +} + +impl<'a, T> Parse<'a> for Operation<'a, T> +where + T: 'a + Ast<'a> + Peek + Parse<'a>, + DynAstRef<'a>: From<&'a T>, +{ + fn parse(p: Parser<'a>) -> ParseResult { + let span = p.cur_span(); + p.parens(|p| { + let operator = p.parse()?; + + let r#type = Cell::new(if p.peek::() { + p.parse::()?; + let ty = p.parse::()?; + p.parse::()?; + Some(ty) + } else { + None + }); + + let mut operands = vec![]; + while 
p.peek::() { + operands.push(p.parse()?); + } + Ok(Operation { + span, + operator, + r#type, + operands, + marker: PhantomData, + }) + }) + } +} + +impl<'a, T> Peek for Operation<'a, T> +where + T: 'a + Ast<'a>, + DynAstRef<'a>: From<&'a T>, +{ + fn peek(c: Cursor) -> bool { + wast::LParen::peek(c) + } + + fn display() -> &'static str { + "operation" + } +} + +impl<'a> Parse<'a> for Precondition<'a> { + fn parse(p: Parser<'a>) -> ParseResult { + let span = p.cur_span(); + p.parens(|p| { + let constraint = p.parse()?; + let mut operands = vec![]; + while p.peek::() { + operands.push(p.parse()?); + } + Ok(Precondition { + span, + constraint, + operands, + }) + }) + } +} + +impl<'a> Parse<'a> for Constraint { + fn parse(p: Parser<'a>) -> ParseResult { + if p.peek::() { + p.parse::()?; + return Ok(Constraint::IsPowerOfTwo); + } + if p.peek::() { + p.parse::()?; + return Ok(Constraint::BitWidth); + } + if p.peek::() { + p.parse::()?; + return Ok(Constraint::FitsInNativeWord); + } + Err(p.error("expected a precondition constraint")) + } +} + +impl<'a> Parse<'a> for ConstraintOperand<'a> { + fn parse(p: Parser<'a>) -> ParseResult { + if p.peek::() { + return Ok(ConstraintOperand::ValueLiteral(p.parse()?)); + } + if p.peek::() { + return Ok(ConstraintOperand::Constant(p.parse()?)); + } + if p.peek::() { + return Ok(ConstraintOperand::Variable(p.parse()?)); + } + Err(p.error("expected an operand for precondition constraint")) + } +} + +impl<'a> Peek for ConstraintOperand<'a> { + fn peek(c: Cursor) -> bool { + ValueLiteral::peek(c) || Constant::peek(c) || Variable::peek(c) + } + + fn display() -> &'static str { + "operand for a precondition constraint" + } +} + +impl<'a> Parse<'a> for Rhs<'a> { + fn parse(p: Parser<'a>) -> ParseResult { + if p.peek::() { + return Ok(Rhs::ValueLiteral(p.parse()?)); + } + if p.peek::() { + return Ok(Rhs::Constant(p.parse()?)); + } + if p.peek::() { + return Ok(Rhs::Variable(p.parse()?)); + } + if p.peek::() { + return 
Ok(Rhs::Unquote(p.parse()?)); + } + if p.peek::>() { + return Ok(Rhs::Operation(p.parse()?)); + } + Err(p.error("expected a right-hand side replacement")) + } +} + +impl<'a> Peek for Rhs<'a> { + fn peek(c: Cursor) -> bool { + ValueLiteral::peek(c) + || Constant::peek(c) + || Variable::peek(c) + || Unquote::peek(c) + || Operation::::peek(c) + } + + fn display() -> &'static str { + "right-hand side replacement" + } +} + +impl<'a> Parse<'a> for Unquote<'a> { + fn parse(p: Parser<'a>) -> ParseResult { + let span = p.cur_span(); + p.parse::()?; + p.parens(|p| { + let operator = p.parse()?; + let mut operands = vec![]; + while p.peek::() { + operands.push(p.parse()?); + } + Ok(Unquote { + span, + operator, + operands, + }) + }) + } +} + +impl<'a> Peek for Unquote<'a> { + fn peek(c: Cursor) -> bool { + tok::dollar::peek(c) + } + + fn display() -> &'static str { + "unquote expression" + } +} + +#[cfg(test)] +mod test { + use super::*; + use peepmatic_runtime::operator::Operator; + + macro_rules! test_parse { + ( + $( + $name:ident < $ast:ty > { + $( ok { $( $ok:expr , )* } )* + $( err { $( $err:expr , )* } )* + } + )* + ) => { + $( + #[test] + #[allow(non_snake_case)] + fn $name() { + $( + $({ + let input = $ok; + let buf = wast::parser::ParseBuffer::new(input).unwrap_or_else(|e| { + panic!("should lex OK, got error:\n\n{}\n\nInput:\n\n{}", e, input) + }); + if let Err(e) = wast::parser::parse::<$ast>(&buf) { + panic!( + "expected to parse OK, got error:\n\n{}\n\nInput:\n\n{}", + e, input + ); + } + })* + )* + + $( + $({ + let input = $err; + let buf = wast::parser::ParseBuffer::new(input).unwrap_or_else(|e| { + panic!("should lex OK, got error:\n\n{}\n\nInput:\n\n{}", e, input) + }); + if let Ok(ast) = wast::parser::parse::<$ast>(&buf) { + panic!( + "expected a parse error, got:\n\n{:?}\n\nInput:\n\n{}", + ast, input + ); + } + })* + )* + } + )* + } + } + + test_parse! 
{ + parse_boolean { + ok { + "true", + "false", + } + err { + "", + "t", + "tr", + "tru", + "truezzz", + "f", + "fa", + "fal", + "fals", + "falsezzz", + } + } + parse_cc { + ok { + "eq", + "ne", + "slt", + "ult", + "sge", + "uge", + "sgt", + "ugt", + "sle", + "ule", + "of", + "nof", + } + err { + "", + "neq", + } + } + parse_constant { + ok { + "$C", + "$C1", + "$C2", + "$X", + "$Y", + "$SOME-CONSTANT", + "$SOME_CONSTANT", + } + err { + "", + "zzz", + "$", + "$variable", + "$Some-Constant", + "$Some_Constant", + "$Some_constant", + } + } + parse_constraint { + ok { + "is-power-of-two", + "bit-width", + "fits-in-native-word", + } + err { + "", + "iadd", + "imul", + } + } + parse_constraint_operand { + ok { + "1234", + "true", + "$CONSTANT", + "$variable", + } + err { + "", + "is-power-of-two", + "(is-power-of-two $C)", + "(iadd 1 2)", + } + } + parse_integer { + ok { + "0", + "1", + "12", + "123", + "1234", + "12345", + "123456", + "1234567", + "12345678", + "123456789", + "1234567890", + "0x0", + "0x1", + "0x12", + "0x123", + "0x1234", + "0x12345", + "0x123456", + "0x1234567", + "0x12345678", + "0x123456789", + "0x123456789a", + "0x123456789ab", + "0x123456789abc", + "0x123456789abcd", + "0x123456789abcde", + "0x123456789abcdef", + "0xffff_ffff_ffff_ffff", + } + err { + "", + "abcdef", + "01234567890abcdef", + "0xgggg", + "0xfffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffff", + } + } + parse_lhs { + ok { + "(when (imul $C1 $C2) (is-power-of-two $C1) (is-power-of-two $C2))", + "(when (imul $x $C) (is-power-of-two $C))", + "(imul $x $y)", + "(imul $x)", + "(imul)", + "$C", + "$x", + } + err { + "", + "()", + "abc", + } + } + parse_operation_pattern> { + ok { + "(iadd)", + "(iadd 1)", + "(iadd 1 2)", + "(iadd $x $C)", + "(iadd{i32} $x $y)", + "(icmp eq $x $y)", + } + err { + "", + "()", + "$var", + "$CONST", + "(ishl $x $(log2 $C))", + } + } + parse_operation_rhs> { + ok { + "(iadd)", + "(iadd 1)", + "(iadd 1 2)", + "(ishl $x $(log2 $C))", + } + err { + 
"", + "()", + "$var", + "$CONST", + } + } + parse_operator { + ok { + "bor", + "iadd", + "iadd_imm", + "iconst", + "imul", + "imul_imm", + "ishl", + "sdiv", + "sdiv_imm", + "sshr", + } + err { + "", + "iadd.i32", + "iadd{i32}", + } + } + parse_optimization { + ok { + "(=> (when (iadd $x $C) (is-power-of-two $C) (is-power-of-two $C)) (iadd $C $x))", + "(=> (when (iadd $x $C)) (iadd $C $x))", + "(=> (iadd $x $C) (iadd $C $x))", + } + err { + "", + "()", + "(=>)", + "(=> () ())", + } + } + parse_optimizations { + ok { + "", + r#" + ;; Canonicalize `a + (b + c)` into `(a + b) + c`. + (=> (iadd $a (iadd $b $c)) + (iadd (iadd $a $b) $c)) + + ;; Combine a `const` and an `iadd` into a `iadd_imm`. + (=> (iadd (iconst $C) $x) + (iadd_imm $C $x)) + + ;; When `C` is a power of two, replace `x * C` with `x << log2(C)`. + (=> (when (imul $x $C) + (is-power-of-two $C)) + (ishl $x $(log2 $C))) + "#, + } + } + parse_pattern { + ok { + "1234", + "$C", + "$x", + "(iadd $x $y)", + } + err { + "", + "()", + "abc", + } + } + parse_precondition { + ok { + "(is-power-of-two)", + "(is-power-of-two $C)", + "(is-power-of-two $C1 $C2)", + } + err { + "", + "1234", + "()", + "$var", + "$CONST", + } + } + parse_rhs { + ok { + "5", + "$C", + "$x", + "$(log2 $C)", + "(iadd $x 1)", + } + err { + "", + "()", + } + } + parse_unquote { + ok { + "$(log2)", + "$(log2 $C)", + "$(log2 $C1 1)", + "$(neg)", + "$(neg $C)", + "$(neg $C 1)", + } + err { + "", + "(log2 $C)", + "$()", + } + } + parse_value_literal { + ok { + "12345", + "true", + } + err { + "", + "'c'", + "\"hello\"", + "12.34", + } + } + parse_variable { + ok { + "$v", + "$v1", + "$v2", + "$x", + "$y", + "$some-var", + "$another_var", + } + err { + "zzz", + "$", + "$CONSTANT", + "$fooBar", + } + } + } +} diff --git a/cranelift/peepmatic/src/traversals.rs b/cranelift/peepmatic/src/traversals.rs new file mode 100644 index 0000000000..5eb4101c37 --- /dev/null +++ b/cranelift/peepmatic/src/traversals.rs @@ -0,0 +1,278 @@ +//! 
Traversals over the AST. + +use crate::ast::*; + +/// A low-level DFS traversal event: either entering or exiting the traversal of +/// an AST node. +#[derive(Clone, Copy, Debug, PartialEq, Eq)] +pub enum TraversalEvent { + /// Entering traversal of an AST node. + /// + /// Processing an AST node upon this event corresponds to a pre-order + /// DFS traversal. + Enter, + + /// Exiting traversal of an AST node. + /// + /// Processing an AST node upon this event corresponds to a post-order DFS + /// traversal. + Exit, +} + +/// A depth-first traversal of an AST. +/// +/// This is a fairly low-level traversal type, and is intended to be used as a +/// building block for making specific pre-order or post-order traversals for +/// whatever problem is at hand. +/// +/// This implementation is not recursive, and exposes an `Iterator` interface +/// that yields pairs of `(TraversalEvent, DynAstRef)` items. +/// +/// The traversal can walk a whole set of `Optimization`s or just a subtree of +/// the AST, because the `new` constructor takes anything that can convert into +/// a `DynAstRef`. +#[derive(Debug, Clone)] +pub struct Dfs<'a> { + stack: Vec<(TraversalEvent, DynAstRef<'a>)>, +} + +impl<'a> Dfs<'a> { + /// Construct a new `Dfs` traversal starting at the given `start` AST node. + pub fn new(start: impl Into>) -> Self { + let start = start.into(); + Dfs { + stack: vec![ + (TraversalEvent::Exit, start), + (TraversalEvent::Enter, start), + ], + } + } + + /// Peek at the next traversal event and AST node pair, if any. 
+ pub fn peek(&self) -> Option<(TraversalEvent, DynAstRef<'a>)> { + self.stack.last().cloned() + } +} + +impl<'a> Iterator for Dfs<'a> { + type Item = (TraversalEvent, DynAstRef<'a>); + + fn next(&mut self) -> Option<(TraversalEvent, DynAstRef<'a>)> { + let (event, node) = self.stack.pop()?; + if let TraversalEvent::Enter = event { + let mut enqueue_children = EnqueueChildren(self); + node.child_nodes(&mut enqueue_children) + } + return Some((event, node)); + + struct EnqueueChildren<'a, 'b>(&'b mut Dfs<'a>) + where + 'a: 'b; + + impl<'a, 'b> Extend> for EnqueueChildren<'a, 'b> + where + 'a: 'b, + { + fn extend>>(&mut self, iter: T) { + let iter = iter.into_iter(); + + let (min, max) = iter.size_hint(); + self.0.stack.reserve(max.unwrap_or(min) * 2); + + let start = self.0.stack.len(); + + for node in iter { + self.0.stack.push((TraversalEvent::Enter, node)); + self.0.stack.push((TraversalEvent::Exit, node)); + } + + // Reverse to make it so that we visit children in order + // (e.g. operands are visited in order). 
+ self.0.stack[start..].reverse(); + } + } + } +} + +#[cfg(test)] +mod tests { + use super::*; + use DynAstRef::*; + + #[test] + fn test_dfs_traversal() { + let input = " +(=> (when (imul $x $C) + (is-power-of-two $C)) + (ishl $x $(log2 $C))) +"; + let buf = wast::parser::ParseBuffer::new(input).expect("input should lex OK"); + let ast = match wast::parser::parse::(&buf) { + Ok(ast) => ast, + Err(e) => panic!("expected to parse OK, got error:\n\n{}", e), + }; + + let mut dfs = Dfs::new(&ast); + assert!(matches!( + dbg!(dfs.next()), + Some((TraversalEvent::Enter, Optimizations(..))) + )); + assert!(matches!( + dbg!(dfs.next()), + Some((TraversalEvent::Enter, Optimization(..))) + )); + assert!(matches!( + dbg!(dfs.next()), + Some((TraversalEvent::Enter, Lhs(..))) + )); + assert!(matches!( + dbg!(dfs.next()), + Some((TraversalEvent::Enter, Pattern(..))) + )); + assert!(matches!( + dbg!(dfs.next()), + Some((TraversalEvent::Enter, PatternOperation(..))) + )); + assert!(matches!( + dbg!(dfs.next()), + Some((TraversalEvent::Enter, Pattern(..))) + )); + assert!(matches!( + dbg!(dfs.next()), + Some((TraversalEvent::Enter, Variable(..))) + )); + assert!(matches!( + dbg!(dfs.next()), + Some((TraversalEvent::Exit, Variable(..))) + )); + assert!(matches!( + dbg!(dfs.next()), + Some((TraversalEvent::Exit, Pattern(..))) + )); + assert!(matches!( + dbg!(dfs.next()), + Some((TraversalEvent::Enter, Pattern(..))) + )); + assert!(matches!( + dbg!(dfs.next()), + Some((TraversalEvent::Enter, Constant(..))) + )); + assert!(matches!( + dbg!(dfs.next()), + Some((TraversalEvent::Exit, Constant(..))) + )); + assert!(matches!( + dbg!(dfs.next()), + Some((TraversalEvent::Exit, Pattern(..))) + )); + assert!(matches!( + dbg!(dfs.next()), + Some((TraversalEvent::Exit, PatternOperation(..))) + )); + assert!(matches!( + dbg!(dfs.next()), + Some((TraversalEvent::Exit, Pattern(..))) + )); + assert!(matches!( + dbg!(dfs.next()), + Some((TraversalEvent::Enter, Precondition(..))) + )); + 
assert!(matches!( + dbg!(dfs.next()), + Some((TraversalEvent::Enter, ConstraintOperand(..))) + )); + assert!(matches!( + dbg!(dfs.next()), + Some((TraversalEvent::Enter, Constant(..))) + )); + assert!(matches!( + dbg!(dfs.next()), + Some((TraversalEvent::Exit, Constant(..))) + )); + assert!(matches!( + dbg!(dfs.next()), + Some((TraversalEvent::Exit, ConstraintOperand(..))) + )); + assert!(matches!( + dbg!(dfs.next()), + Some((TraversalEvent::Exit, Precondition(..))) + )); + assert!(matches!( + dbg!(dfs.next()), + Some((TraversalEvent::Exit, Lhs(..))) + )); + assert!(matches!( + dbg!(dfs.next()), + Some((TraversalEvent::Enter, Rhs(..))) + )); + assert!(matches!( + dbg!(dfs.next()), + Some((TraversalEvent::Enter, RhsOperation(..))) + )); + assert!(matches!( + dbg!(dfs.next()), + Some((TraversalEvent::Enter, Rhs(..))) + )); + assert!(matches!( + dbg!(dfs.next()), + Some((TraversalEvent::Enter, Variable(..))) + )); + assert!(matches!( + dbg!(dfs.next()), + Some((TraversalEvent::Exit, Variable(..))) + )); + assert!(matches!( + dbg!(dfs.next()), + Some((TraversalEvent::Exit, Rhs(..))) + )); + assert!(matches!( + dbg!(dfs.next()), + Some((TraversalEvent::Enter, Rhs(..))) + )); + assert!(matches!( + dbg!(dfs.next()), + Some((TraversalEvent::Enter, Unquote(..))) + )); + assert!(matches!( + dbg!(dfs.next()), + Some((TraversalEvent::Enter, Rhs(..))) + )); + assert!(matches!( + dbg!(dfs.next()), + Some((TraversalEvent::Enter, Constant(..))) + )); + assert!(matches!( + dbg!(dfs.next()), + Some((TraversalEvent::Exit, Constant(..))) + )); + assert!(matches!( + dbg!(dfs.next()), + Some((TraversalEvent::Exit, Rhs(..))) + )); + assert!(matches!( + dbg!(dfs.next()), + Some((TraversalEvent::Exit, Unquote(..))) + )); + assert!(matches!( + dbg!(dfs.next()), + Some((TraversalEvent::Exit, Rhs(..))) + )); + assert!(matches!( + dbg!(dfs.next()), + Some((TraversalEvent::Exit, RhsOperation(..))) + )); + assert!(matches!( + dbg!(dfs.next()), + Some((TraversalEvent::Exit, Rhs(..))) + )); + 
assert!(matches!( + dbg!(dfs.next()), + Some((TraversalEvent::Exit, Optimization(..))) + )); + assert!(matches!( + dbg!(dfs.next()), + Some((TraversalEvent::Exit, Optimizations(..))) + )); + assert!(dfs.next().is_none()); + } +} diff --git a/cranelift/peepmatic/src/verify.rs b/cranelift/peepmatic/src/verify.rs new file mode 100644 index 0000000000..03865458ca --- /dev/null +++ b/cranelift/peepmatic/src/verify.rs @@ -0,0 +1,1433 @@ +//! Verification and type checking of optimizations. +//! +//! For type checking, we compile the AST's type constraints down into Z3 +//! variables and assertions. If Z3 finds the assertions satisfiable, then we're +//! done! If it finds them unsatisfiable, we use the `get_unsat_core` method to +//! get the minimal subset of assertions that are in conflict, and report a +//! best-effort type error message with them. These messages aren't perfect, but +//! they're Good Enough when embedded in the source text via our tracking of +//! `wast::Span`s. +//! +//! Verifying that there aren't any counter-examples (inputs for which the LHS +//! and RHS produce different results) for a particular optimization is not +//! implemented yet. + +use crate::ast::{Span as _, *}; +use crate::traversals::{Dfs, TraversalEvent}; +use peepmatic_runtime::{ + operator::{Operator, TypingContext as TypingContextTrait}, + r#type::{BitWidth, Kind, Type}, +}; +use std::borrow::Cow; +use std::collections::HashMap; +use std::convert::{TryFrom, TryInto}; +use std::fmt; +use std::hash::Hash; +use std::iter; +use std::mem; +use std::ops::{Deref, DerefMut}; +use std::path::Path; +use wast::{Error as WastError, Id, Span}; +use z3::ast::Ast; + +/// A verification or type checking error. 
+#[derive(Debug)] +pub struct VerifyError { + errors: Vec, +} + +impl fmt::Display for VerifyError { + fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result { + for e in &self.errors { + writeln!(f, "{}\n", e)?; + } + Ok(()) + } +} + +impl std::error::Error for VerifyError {} + +impl From for VerifyError { + fn from(e: WastError) -> Self { + VerifyError { + errors: vec![e.into()], + } + } +} + +impl From for VerifyError { + fn from(e: anyhow::Error) -> Self { + VerifyError { errors: vec![e] } + } +} + +impl VerifyError { + /// To provide a more useful error this function can be used to extract + /// relevant textual information about this error into the error itself. + /// + /// The `contents` here should be the full text of the original file being + /// parsed, and this will extract a sub-slice as necessary to render in the + /// `Display` implementation later on. + pub fn set_text(&mut self, contents: &str) { + for e in &mut self.errors { + if let Some(e) = e.downcast_mut::() { + e.set_text(contents); + } + } + } + + /// To provide a more useful error this function can be used to set + /// the file name that this error is associated with. + /// + /// The `path` here will be stored in this error and later rendered in the + /// `Display` implementation. + pub fn set_path(&mut self, path: &Path) { + for e in &mut self.errors { + if let Some(e) = e.downcast_mut::() { + e.set_path(path); + } + } + } +} + +/// Either `Ok(T)` or `Err(VerifyError)`. +pub type VerifyResult = Result; + +/// Verify and type check a set of optimizations. +pub fn verify(opts: &Optimizations) -> VerifyResult<()> { + if opts.optimizations.is_empty() { + return Err(anyhow::anyhow!("no optimizations").into()); + } + + verify_unique_left_hand_sides(opts)?; + + let z3 = &z3::Context::new(&z3::Config::new()); + for opt in &opts.optimizations { + verify_optimization(z3, opt)?; + } + Ok(()) +} + +/// Check that every LHS in the given optimizations is unique. 
+/// +/// If there were duplicates, then it would be nondeterministic which one we +/// applied and would make automata construction more difficult. It is better to +/// check for duplicates and reject them if found. +fn verify_unique_left_hand_sides(opts: &Optimizations) -> VerifyResult<()> { + let mut lefts = HashMap::new(); + for opt in &opts.optimizations { + let canon_lhs = canonicalized_lhs_key(&opt.lhs); + let existing = lefts.insert(canon_lhs, opt.lhs.span()); + if let Some(span) = existing { + return Err(VerifyError { + errors: vec![ + anyhow::anyhow!("error: two optimizations cannot have the same left-hand side"), + WastError::new(span, "note: first use of this left-hand side".into()).into(), + WastError::new( + opt.lhs.span(), + "note: second use of this left-hand side".into(), + ) + .into(), + ], + }); + } + } + Ok(()) +} + +/// When checking for duplicate left-hand sides, we need to consider patterns +/// that are duplicates up to renaming identifiers. For example, these LHSes +/// should be considered duplicates of each other: +/// +/// ```lisp +/// (=> (iadd $x $y) ...) +/// (=> (iadd $a $b) ...) +/// ``` +/// +/// This function creates an opaque, canonicalized hash key for left-hand sides +/// that sees through identifier renaming. 
+fn canonicalized_lhs_key(lhs: &Lhs) -> impl Hash + Eq { + let mut var_to_canon = HashMap::new(); + let mut const_to_canon = HashMap::new(); + let mut canonicalized = vec![]; + + for (event, ast) in Dfs::new(lhs) { + if event != TraversalEvent::Enter { + continue; + } + use CanonicalBit::*; + canonicalized.push(match ast { + DynAstRef::Lhs(_) => Other("Lhs"), + DynAstRef::Pattern(_) => Other("Pattern"), + DynAstRef::ValueLiteral(_) => Other("ValueLiteral"), + DynAstRef::Integer(i) => Integer(i.value), + DynAstRef::Boolean(b) => Boolean(b.value), + DynAstRef::ConditionCode(cc) => ConditionCode(cc.cc), + DynAstRef::PatternOperation(o) => Operation(o.operator, o.r#type.get()), + DynAstRef::Precondition(p) => Precondition(p.constraint), + DynAstRef::ConstraintOperand(_) => Other("ConstraintOperand"), + DynAstRef::Variable(Variable { id, .. }) => { + let new_id = var_to_canon.len() as u32; + let canon_id = var_to_canon.entry(id).or_insert(new_id); + Var(*canon_id) + } + DynAstRef::Constant(Constant { id, .. }) => { + let new_id = const_to_canon.len() as u32; + let canon_id = const_to_canon.entry(id).or_insert(new_id); + Const(*canon_id) + } + other => unreachable!("unreachable ast node: {:?}", other), + }); + } + + return canonicalized; + + #[derive(Hash, PartialEq, Eq)] + enum CanonicalBit { + Var(u32), + Const(u32), + Integer(i64), + Boolean(bool), + ConditionCode(peepmatic_runtime::cc::ConditionCode), + Operation(Operator, Option), + Precondition(Constraint), + Other(&'static str), + } +} + +pub(crate) struct TypingContext<'a> { + z3: &'a z3::Context, + type_kind_sort: z3::DatatypeSort<'a>, + solver: z3::Solver<'a>, + + // The type of the root of the optimization. Initialized when collecting + // type constraints. + root_ty: Option>, + + // See the comments above `enter_operation_scope`. + operation_scope: HashMap<&'static str, TypeVar<'a>>, + + // A map from identifiers to the type variable describing its type. 
+ id_to_type_var: HashMap, TypeVar<'a>>, + + // A list of type constraints, the span of the AST node where the constraint + // originates from, and an optional message to be displayed if the + // constraint is not satisfied. + constraints: Vec<(z3::ast::Bool<'a>, Span, Option>)>, + + // Keep track of AST nodes that need to have their types assigned to + // them. For these AST nodes, we know what bit width to use when + // interpreting peephole optimization actions. + boolean_literals: Vec<(&'a Boolean<'a>, TypeVar<'a>)>, + integer_literals: Vec<(&'a Integer<'a>, TypeVar<'a>)>, + rhs_operations: Vec<(&'a Operation<'a, Rhs<'a>>, TypeVar<'a>)>, +} + +impl<'a> TypingContext<'a> { + fn new(z3: &'a z3::Context) -> Self { + let type_kind_sort = z3::DatatypeBuilder::new(z3) + .variant("int", &[]) + .variant("bool", &[]) + .variant("cpu_flags", &[]) + .variant("cc", &[]) + .variant("void", &[]) + .finish("TypeKind"); + TypingContext { + z3, + solver: z3::Solver::new(z3), + root_ty: None, + operation_scope: Default::default(), + id_to_type_var: Default::default(), + type_kind_sort, + constraints: vec![], + boolean_literals: Default::default(), + integer_literals: Default::default(), + rhs_operations: Default::default(), + } + } + + fn init_root_type(&mut self, span: Span, root_ty: TypeVar<'a>) { + assert!(self.root_ty.is_none()); + + // Make sure the root is a valid kind, i.e. not a condition code. 
+ let is_int = self.is_int(&root_ty); + let is_bool = self.is_bool(&root_ty); + let is_void = self.is_void(&root_ty); + let is_cpu_flags = self.is_cpu_flags(&root_ty); + self.constraints.push(( + is_int.or(&[&is_bool, &is_void, &is_cpu_flags]), + span, + Some( + "the root of an optimization must be an integer, a boolean, void, or CPU flags" + .into(), + ), + )); + + self.root_ty = Some(root_ty); + } + + fn new_type_var(&self) -> TypeVar<'a> { + let kind = + z3::ast::Datatype::fresh_const(self.z3, "type-var-kind", &self.type_kind_sort.sort); + let width = z3::ast::BV::fresh_const(self.z3, "type-var-width", 8); + TypeVar { kind, width } + } + + fn get_or_create_type_var_for_id(&mut self, id: Id<'a>) -> TypeVar<'a> { + if let Some(ty) = self.id_to_type_var.get(&id) { + ty.clone() + } else { + // Note: can't use the entry API because we reborrow `self` here. + let ty = self.new_type_var(); + self.id_to_type_var.insert(id, ty.clone()); + ty + } + } + + fn get_type_var_for_id(&mut self, id: Id<'a>) -> VerifyResult> { + if let Some(ty) = self.id_to_type_var.get(&id) { + Ok(ty.clone()) + } else { + Err(WastError::new(id.span(), format!("unknown identifier: ${}", id.name())).into()) + } + } + + // The `#[peepmatic]` macro for operations allows defining operations' types + // like `(iNN, iNN) -> iNN` where `iNN` all refer to the same integer type + // variable that must have the same bit width. But other operations might + // *also* have that type signature but be instantiated at a different bit + // width. We don't want to mix up which `iNN` variables are and aren't the + // same. We use this method to track scopes within which all uses of `iNN` + // and similar refer to the same type variables. 
+ fn enter_operation_scope<'b>( + &'b mut self, + ) -> impl DerefMut> + Drop + 'b { + assert!(self.operation_scope.is_empty()); + return Scope(self); + + struct Scope<'a, 'b>(&'b mut TypingContext<'a>) + where + 'a: 'b; + + impl<'a, 'b> Deref for Scope<'a, 'b> + where + 'a: 'b, + { + type Target = TypingContext<'a>; + fn deref(&self) -> &TypingContext<'a> { + self.0 + } + } + + impl<'a, 'b> DerefMut for Scope<'a, 'b> + where + 'a: 'b, + { + fn deref_mut(&mut self) -> &mut TypingContext<'a> { + self.0 + } + } + + impl Drop for Scope<'_, '_> { + fn drop(&mut self) { + self.0.operation_scope.clear(); + } + } + } + + fn remember_boolean_literal(&mut self, b: &'a Boolean<'a>, ty: TypeVar<'a>) { + self.assert_is_bool(b.span, &ty); + self.boolean_literals.push((b, ty)); + } + + fn remember_integer_literal(&mut self, i: &'a Integer<'a>, ty: TypeVar<'a>) { + self.assert_is_integer(i.span, &ty); + self.integer_literals.push((i, ty)); + } + + fn remember_rhs_operation(&mut self, op: &'a Operation<'a, Rhs<'a>>, ty: TypeVar<'a>) { + self.rhs_operations.push((op, ty)); + } + + fn is_int(&self, ty: &TypeVar<'a>) -> z3::ast::Bool<'a> { + self.type_kind_sort.variants[0] + .tester + .apply(&[&ty.kind.clone().into()]) + .as_bool() + .unwrap() + } + + fn is_bool(&self, ty: &TypeVar<'a>) -> z3::ast::Bool<'a> { + self.type_kind_sort.variants[1] + .tester + .apply(&[&ty.kind.clone().into()]) + .as_bool() + .unwrap() + } + + fn is_cpu_flags(&self, ty: &TypeVar<'a>) -> z3::ast::Bool<'a> { + self.type_kind_sort.variants[2] + .tester + .apply(&[&ty.kind.clone().into()]) + .as_bool() + .unwrap() + } + + fn is_condition_code(&self, ty: &TypeVar<'a>) -> z3::ast::Bool<'a> { + self.type_kind_sort.variants[3] + .tester + .apply(&[&ty.kind.clone().into()]) + .as_bool() + .unwrap() + } + + fn is_void(&self, ty: &TypeVar<'a>) -> z3::ast::Bool<'a> { + self.type_kind_sort.variants[4] + .tester + .apply(&[&ty.kind.clone().into()]) + .as_bool() + .unwrap() + } + + fn assert_is_integer(&mut self, span: 
Span, ty: &TypeVar<'a>) { + self.constraints.push(( + self.is_int(ty), + span, + Some("type error: expected integer".into()), + )); + } + + fn assert_is_bool(&mut self, span: Span, ty: &TypeVar<'a>) { + self.constraints.push(( + self.is_bool(ty), + span, + Some("type error: expected bool".into()), + )); + } + + fn assert_is_cpu_flags(&mut self, span: Span, ty: &TypeVar<'a>) { + self.constraints.push(( + self.is_cpu_flags(ty), + span, + Some("type error: expected CPU flags".into()), + )); + } + + fn assert_is_cc(&mut self, span: Span, ty: &TypeVar<'a>) { + self.constraints.push(( + self.is_condition_code(ty), + span, + Some("type error: expected condition code".into()), + )); + } + + fn assert_is_void(&mut self, span: Span, ty: &TypeVar<'a>) { + self.constraints.push(( + self.is_void(ty), + span, + Some("type error: expected void".into()), + )); + } + + fn assert_bit_width(&mut self, span: Span, ty: &TypeVar<'a>, width: u8) { + debug_assert!(width == 0 || width.is_power_of_two()); + let width_var = z3::ast::BV::from_i64(self.z3, width as i64, 8); + let is_width = width_var._eq(&ty.width); + self.constraints.push(( + is_width, + span, + Some(format!("type error: expected bit width = {}", width).into()), + )); + } + + fn assert_bit_width_lt(&mut self, span: Span, a: &TypeVar<'a>, b: &TypeVar<'a>) { + self.constraints.push(( + a.width.bvult(&b.width), + span, + Some("type error: expected narrower bit width".into()), + )); + } + + fn assert_bit_width_gt(&mut self, span: Span, a: &TypeVar<'a>, b: &TypeVar<'a>) { + self.constraints.push(( + a.width.bvugt(&b.width), + span, + Some("type error: expected wider bit width".into()), + )); + } + + fn assert_type_eq( + &mut self, + span: Span, + lhs: &TypeVar<'a>, + rhs: &TypeVar<'a>, + msg: Option>, + ) { + self.constraints + .push((lhs.kind._eq(&rhs.kind), span, msg.clone())); + self.constraints + .push((lhs.width._eq(&rhs.width), span, msg)); + } + + fn type_check(&self, span: Span) -> VerifyResult<()> { + let trackers = 
iter::repeat_with(|| z3::ast::Bool::fresh_const(self.z3, "type-constraint")) + .take(self.constraints.len()) + .collect::>(); + + let mut tracker_to_diagnostics = HashMap::with_capacity(self.constraints.len()); + + for (constraint_data, tracker) in self.constraints.iter().zip(trackers) { + let (constraint, span, msg) = constraint_data; + self.solver.assert_and_track(constraint, &tracker); + tracker_to_diagnostics.insert(tracker, (*span, msg.clone())); + } + + match self.solver.check() { + z3::SatResult::Sat => Ok(()), + z3::SatResult::Unsat => { + let core = self.solver.get_unsat_core(); + if core.is_empty() { + return Err(WastError::new( + span, + "z3 determined the type constraints for this optimization are \ + unsatisfiable, meaning there is a type error, but z3 did not give us any \ + additional information" + .into(), + ) + .into()); + } + + let mut errors = core + .iter() + .map(|tracker| { + let (span, msg) = &tracker_to_diagnostics[tracker]; + ( + *span, + WastError::new( + *span, + msg.clone().unwrap_or("type error".into()).into(), + ) + .into(), + ) + }) + .collect::>(); + errors.sort_by_key(|(span, _)| *span); + let errors = errors.into_iter().map(|(_, e)| e).collect(); + + Err(VerifyError { errors }) + } + z3::SatResult::Unknown => Err(anyhow::anyhow!( + "z3 returned 'unknown' when evaluating type constraints: {}", + self.solver + .get_reason_unknown() + .unwrap_or_else(|| "".into()) + ) + .into()), + } + } + + fn assign_types(&mut self) -> VerifyResult<()> { + for (int, ty) in mem::replace(&mut self.integer_literals, vec![]) { + let width = self.ty_var_to_width(&ty)?; + int.bit_width.set(Some(width)); + } + + for (b, ty) in mem::replace(&mut self.boolean_literals, vec![]) { + let width = self.ty_var_to_width(&ty)?; + b.bit_width.set(Some(width)); + } + + for (op, ty) in mem::replace(&mut self.rhs_operations, vec![]) { + let kind = self.op_ty_var_to_kind(&ty); + let bit_width = match kind { + Kind::CpuFlags | Kind::Void => BitWidth::One, + Kind::Int | 
Kind::Bool => self.ty_var_to_width(&ty)?, + }; + debug_assert!(op.r#type.get().is_none()); + op.r#type.set(Some(Type { kind, bit_width })); + } + + Ok(()) + } + + fn ty_var_to_width(&self, ty_var: &TypeVar<'a>) -> VerifyResult { + // Doing solver push/pops apparently clears out the model, so we have to + // re-check each time to ensure that it exists, and Z3 doesn't helpfully + // abort the process for us. This should be fast, since the solver + // remembers inferences from earlier checks. + assert_eq!(self.solver.check(), z3::SatResult::Sat); + + // Check if there is more than one satisfying assignment to + // `ty_var`'s width variable. If so, then it must be polymorphic. If + // not, then it must have a fixed value. + let model = self.solver.get_model(); + let width_var = model.eval(&ty_var.width).unwrap(); + let bit_width: u8 = width_var.as_u64().unwrap().try_into().unwrap(); + + self.solver.push(); + self.solver.assert(&ty_var.width._eq(&width_var).not()); + let is_polymorphic = match self.solver.check() { + z3::SatResult::Sat => true, + z3::SatResult::Unsat => false, + z3::SatResult::Unknown => panic!("Z3 cannot determine bit width of type"), + }; + self.solver.pop(1); + + if is_polymorphic { + // If something is polymorphic over bit widths, it must be + // polymorphic over the same bit width as the whole + // optimization. + // + // TODO: We should have a better model for bit-width + // polymorphism. The current setup works for all the use cases we + // currently care about, and is relatively easy to implement when + // matching and constructing the RHS, but is a bit ad-hoc. Maybe + // allow each LHS variable a polymorphic bit width, augment the AST + // with that info, and later emit match ops as necessary to express + // their relative constraints? 
*hand waves* + self.solver.push(); + self.solver + .assert(&ty_var.width._eq(&self.root_ty.as_ref().unwrap().width)); + match self.solver.check() { + z3::SatResult::Sat => {} + z3::SatResult::Unsat => { + return Err(anyhow::anyhow!( + "AST node is bit width polymorphic, but not over the optimization's root \ + width" + ) + .into()) + } + z3::SatResult::Unknown => panic!("Z3 cannot determine bit width of type"), + }; + self.solver.pop(1); + + Ok(BitWidth::Polymorphic) + } else { + Ok(BitWidth::try_from(bit_width).unwrap()) + } + } + + fn op_ty_var_to_kind(&self, ty_var: &TypeVar<'a>) -> Kind { + for (predicate, kind) in [ + (Self::is_int as fn(_, _) -> _, Kind::Int), + (Self::is_bool, Kind::Bool), + (Self::is_cpu_flags, Kind::CpuFlags), + (Self::is_void, Kind::Void), + ] + .iter() + { + self.solver.push(); + self.solver.assert(&predicate(self, ty_var)); + match self.solver.check() { + z3::SatResult::Sat => { + self.solver.pop(1); + return *kind; + } + z3::SatResult::Unsat => { + self.solver.pop(1); + continue; + } + z3::SatResult::Unknown => panic!("Z3 cannot determine the type's kind"), + } + } + + // This would only happen if given a `TypeVar` whose kind was a + // condition code, but we only use this function for RHS operations, + // which cannot be condition codes. 
+ panic!("cannot convert type variable's kind to `peepmatic_runtime::type::Kind`") + } +} + +impl<'a> TypingContextTrait<'a> for TypingContext<'a> { + type TypeVariable = TypeVar<'a>; + + fn cc(&mut self, span: Span) -> TypeVar<'a> { + let ty = self.new_type_var(); + self.assert_is_cc(span, &ty); + ty + } + + fn bNN(&mut self, span: Span) -> TypeVar<'a> { + if let Some(ty) = self.operation_scope.get("bNN") { + return ty.clone(); + } + + let ty = self.new_type_var(); + self.assert_is_bool(span, &ty); + self.operation_scope.insert("bNN", ty.clone()); + ty + } + + fn iNN(&mut self, span: Span) -> TypeVar<'a> { + if let Some(ty) = self.operation_scope.get("iNN") { + return ty.clone(); + } + + let ty = self.new_type_var(); + self.assert_is_integer(span, &ty); + self.operation_scope.insert("iNN", ty.clone()); + ty + } + + fn iMM(&mut self, span: Span) -> TypeVar<'a> { + if let Some(ty) = self.operation_scope.get("iMM") { + return ty.clone(); + } + + let ty = self.new_type_var(); + self.assert_is_integer(span, &ty); + self.operation_scope.insert("iMM", ty.clone()); + ty + } + + fn cpu_flags(&mut self, span: Span) -> TypeVar<'a> { + if let Some(ty) = self.operation_scope.get("cpu_flags") { + return ty.clone(); + } + + let ty = self.new_type_var(); + self.assert_is_cpu_flags(span, &ty); + self.assert_bit_width(span, &ty, 1); + self.operation_scope.insert("cpu_flags", ty.clone()); + ty + } + + fn b1(&mut self, span: Span) -> TypeVar<'a> { + let b1 = self.new_type_var(); + self.assert_is_bool(span, &b1); + self.assert_bit_width(span, &b1, 1); + b1 + } + + fn void(&mut self, span: Span) -> TypeVar<'a> { + let void = self.new_type_var(); + self.assert_is_void(span, &void); + self.assert_bit_width(span, &void, 0); + void + } + + fn bool_or_int(&mut self, span: Span) -> TypeVar<'a> { + let ty = self.new_type_var(); + let is_int = self.type_kind_sort.variants[0] + .tester + .apply(&[&ty.kind.clone().into()]) + .as_bool() + .unwrap(); + let is_bool = self.type_kind_sort.variants[1] 
+ .tester + .apply(&[&ty.kind.clone().into()]) + .as_bool() + .unwrap(); + self.constraints.push(( + is_int.or(&[&is_bool]), + span, + Some("type error: must be either an int or a bool type".into()), + )); + ty + } + + fn any_t(&mut self, _span: Span) -> TypeVar<'a> { + if let Some(ty) = self.operation_scope.get("any_t") { + return ty.clone(); + } + + let ty = self.new_type_var(); + self.operation_scope.insert("any_t", ty.clone()); + ty + } +} + +#[derive(Clone)] +pub(crate) struct TypeVar<'a> { + kind: z3::ast::Datatype<'a>, + width: z3::ast::BV<'a>, +} + +fn verify_optimization(z3: &z3::Context, opt: &Optimization) -> VerifyResult<()> { + let mut context = TypingContext::new(z3); + collect_type_constraints(&mut context, opt)?; + context.type_check(opt.span)?; + context.assign_types()?; + + // TODO: add another pass here to check for counter-examples to this + // optimization, i.e. inputs where the LHS and RHS are not equivalent. + + Ok(()) +} + +fn collect_type_constraints<'a>( + context: &mut TypingContext<'a>, + opt: &'a Optimization<'a>, +) -> VerifyResult<()> { + use crate::traversals::TraversalEvent as TE; + + let lhs_ty = context.new_type_var(); + context.init_root_type(opt.lhs.span, lhs_ty.clone()); + + let rhs_ty = context.new_type_var(); + context.assert_type_eq( + opt.span, + &lhs_ty, + &rhs_ty, + Some("type error: the left-hand side and right-hand side must have the same type".into()), + ); + + // A stack of type variables that we are constraining as we traverse the + // AST. Operations push new type variables for their operands' expected + // types, and exiting a `Pattern` in the traversal pops them off. + let mut expected_types = vec![lhs_ty]; + + // Build up the type constraints for the left-hand side. 
+ for (event, node) in Dfs::new(&opt.lhs) { + match (event, node) { + (TE::Enter, DynAstRef::Pattern(Pattern::Constant(Constant { id, span }))) + | (TE::Enter, DynAstRef::Pattern(Pattern::Variable(Variable { id, span }))) => { + let id = context.get_or_create_type_var_for_id(*id); + context.assert_type_eq(*span, expected_types.last().unwrap(), &id, None); + } + (TE::Enter, DynAstRef::Pattern(Pattern::ValueLiteral(ValueLiteral::Integer(i)))) => { + let ty = expected_types.last().unwrap(); + context.remember_integer_literal(i, ty.clone()); + } + (TE::Enter, DynAstRef::Pattern(Pattern::ValueLiteral(ValueLiteral::Boolean(b)))) => { + let ty = expected_types.last().unwrap(); + context.remember_boolean_literal(b, ty.clone()); + } + ( + TE::Enter, + DynAstRef::Pattern(Pattern::ValueLiteral(ValueLiteral::ConditionCode(cc))), + ) => { + let ty = expected_types.last().unwrap(); + context.assert_is_cc(cc.span, ty); + } + (TE::Enter, DynAstRef::PatternOperation(op)) => { + let result_ty; + let mut operand_types = vec![]; + { + let mut scope = context.enter_operation_scope(); + result_ty = op.operator.result_type(&mut *scope, op.span); + op.operator + .immediate_types(&mut *scope, op.span, &mut operand_types); + op.operator + .param_types(&mut *scope, op.span, &mut operand_types); + } + + if op.operands.len() != operand_types.len() { + return Err(WastError::new( + op.span, + format!( + "Expected {} operands but found {}", + operand_types.len(), + op.operands.len() + ), + ) + .into()); + } + + for imm in op + .operands + .iter() + .take(op.operator.immediates_arity() as usize) + { + match imm { + Pattern::ValueLiteral(_) | + Pattern::Constant(_) | + Pattern::Variable(_) => continue, + Pattern::Operation(op) => return Err(WastError::new( + op.span, + "operations are invalid immediates; must be a value literal, constant, \ + or variable".into() + ).into()), + } + } + + match op.operator { + Operator::Ireduce | Operator::Uextend | Operator::Sextend => { + if 
op.r#type.get().is_none() { + return Err(WastError::new( + op.span, + "`ireduce`, `sextend`, and `uextend` require an ascribed type, \ + like `(sextend{i64} ...)`" + .into(), + ) + .into()); + } + } + _ => {} + } + + match op.operator { + Operator::Uextend | Operator::Sextend => { + context.assert_bit_width_gt(op.span, &result_ty, &operand_types[0]); + } + Operator::Ireduce => { + context.assert_bit_width_lt(op.span, &result_ty, &operand_types[0]); + } + _ => {} + } + + if let Some(ty) = op.r#type.get() { + match ty.kind { + Kind::Bool => context.assert_is_bool(op.span, &result_ty), + Kind::Int => context.assert_is_integer(op.span, &result_ty), + Kind::Void => context.assert_is_void(op.span, &result_ty), + Kind::CpuFlags => { + unreachable!("no syntax for ascribing CPU flags types right now") + } + } + if let Some(w) = ty.bit_width.fixed_width() { + context.assert_bit_width(op.span, &result_ty, w); + } + } + + context.assert_type_eq(op.span, expected_types.last().unwrap(), &result_ty, None); + + operand_types.reverse(); + expected_types.extend(operand_types); + } + (TE::Exit, DynAstRef::Pattern(..)) => { + expected_types.pop().unwrap(); + } + (TE::Enter, DynAstRef::Precondition(pre)) => { + type_constrain_precondition(context, pre)?; + } + _ => continue, + } + } + + // We should have exited exactly as many patterns as we entered: one for the + // root pattern and the initial `lhs_ty`, and then the rest for the operands + // of pattern operations. + assert!(expected_types.is_empty()); + + // Collect the type constraints for the right-hand side. 
+ expected_types.push(rhs_ty); + for (event, node) in Dfs::new(&opt.rhs) { + match (event, node) { + (TE::Enter, DynAstRef::Rhs(Rhs::ValueLiteral(ValueLiteral::Integer(i)))) => { + let ty = expected_types.last().unwrap(); + context.remember_integer_literal(i, ty.clone()); + } + (TE::Enter, DynAstRef::Rhs(Rhs::ValueLiteral(ValueLiteral::Boolean(b)))) => { + let ty = expected_types.last().unwrap(); + context.remember_boolean_literal(b, ty.clone()); + } + (TE::Enter, DynAstRef::Rhs(Rhs::ValueLiteral(ValueLiteral::ConditionCode(cc)))) => { + let ty = expected_types.last().unwrap(); + context.assert_is_cc(cc.span, ty); + } + (TE::Enter, DynAstRef::Rhs(Rhs::Constant(Constant { span, id }))) + | (TE::Enter, DynAstRef::Rhs(Rhs::Variable(Variable { span, id }))) => { + let id_ty = context.get_type_var_for_id(*id)?; + context.assert_type_eq(*span, expected_types.last().unwrap(), &id_ty, None); + } + (TE::Enter, DynAstRef::RhsOperation(op)) => { + let result_ty; + let mut operand_types = vec![]; + { + let mut scope = context.enter_operation_scope(); + result_ty = op.operator.result_type(&mut *scope, op.span); + op.operator + .immediate_types(&mut *scope, op.span, &mut operand_types); + op.operator + .param_types(&mut *scope, op.span, &mut operand_types); + } + + if op.operands.len() != operand_types.len() { + return Err(WastError::new( + op.span, + format!( + "Expected {} operands but found {}", + operand_types.len(), + op.operands.len() + ), + ) + .into()); + } + + for imm in op + .operands + .iter() + .take(op.operator.immediates_arity() as usize) + { + match imm { + Rhs::ValueLiteral(_) + | Rhs::Constant(_) + | Rhs::Variable(_) + | Rhs::Unquote(_) => continue, + Rhs::Operation(op) => return Err(WastError::new( + op.span, + "operations are invalid immediates; must be a value literal, unquote, \ + constant, or variable" + .into(), + ) + .into()), + } + } + + match op.operator { + Operator::Ireduce | Operator::Uextend | Operator::Sextend => { + if op.r#type.get().is_none() { 
+ return Err(WastError::new( + op.span, + "`ireduce`, `sextend`, and `uextend` require an ascribed type, \ + like `(sextend{i64} ...)`" + .into(), + ) + .into()); + } + } + _ => {} + } + + match op.operator { + Operator::Uextend | Operator::Sextend => { + context.assert_bit_width_gt(op.span, &result_ty, &operand_types[0]); + } + Operator::Ireduce => { + context.assert_bit_width_lt(op.span, &result_ty, &operand_types[0]); + } + _ => {} + } + + if let Some(ty) = op.r#type.get() { + match ty.kind { + Kind::Bool => context.assert_is_bool(op.span, &result_ty), + Kind::Int => context.assert_is_integer(op.span, &result_ty), + Kind::Void => context.assert_is_void(op.span, &result_ty), + Kind::CpuFlags => { + unreachable!("no syntax for ascribing CPU flags types right now") + } + } + if let Some(w) = ty.bit_width.fixed_width() { + context.assert_bit_width(op.span, &result_ty, w); + } + } + + context.assert_type_eq(op.span, expected_types.last().unwrap(), &result_ty, None); + if op.r#type.get().is_none() { + context.remember_rhs_operation(op, result_ty); + } + + operand_types.reverse(); + expected_types.extend(operand_types); + } + (TE::Enter, DynAstRef::Unquote(unq)) => { + let result_ty; + let mut operand_types = vec![]; + { + let mut scope = context.enter_operation_scope(); + result_ty = unq.operator.result_type(&mut *scope, unq.span); + unq.operator + .immediate_types(&mut *scope, unq.span, &mut operand_types); + unq.operator + .param_types(&mut *scope, unq.span, &mut operand_types); + } + + if unq.operands.len() != operand_types.len() { + return Err(WastError::new( + unq.span, + format!( + "Expected {} unquote operands but found {}", + operand_types.len(), + unq.operands.len() + ), + ) + .into()); + } + + for operand in &unq.operands { + match operand { + Rhs::ValueLiteral(_) | Rhs::Constant(_) => continue, + Rhs::Variable(_) | Rhs::Unquote(_) | Rhs::Operation(_) => { + return Err(WastError::new( + operand.span(), + "unquote operands must be value literals or 
constants".into(), + ) + .into()); + } + } + } + + context.assert_type_eq(unq.span, expected_types.last().unwrap(), &result_ty, None); + + operand_types.reverse(); + expected_types.extend(operand_types); + } + (TE::Exit, DynAstRef::Rhs(..)) => { + expected_types.pop().unwrap(); + } + _ => continue, + } + } + + // Again, we should have popped off all the expected types when exiting + // `Rhs` nodes in the traversal. + assert!(expected_types.is_empty()); + + Ok(()) +} + +fn type_constrain_precondition<'a>( + context: &mut TypingContext<'a>, + pre: &Precondition<'a>, +) -> VerifyResult<()> { + match pre.constraint { + Constraint::BitWidth => { + if pre.operands.len() != 2 { + return Err(WastError::new( + pre.span, + format!( + "the `bit-width` precondition requires exactly 2 operands, found \ + {} operands", + pre.operands.len(), + ), + ) + .into()); + } + + let id = match pre.operands[0] { + ConstraintOperand::ValueLiteral(_) => { + return Err(anyhow::anyhow!( + "the `bit-width` precondition requires a constant or variable as \ + its first operand" + ) + .into()) + } + ConstraintOperand::Constant(Constant { id, .. }) + | ConstraintOperand::Variable(Variable { id, .. }) => id, + }; + + let width = match pre.operands[1] { + ConstraintOperand::ValueLiteral(ValueLiteral::Integer(Integer { + value, .. 
+ })) if value == 1 + || value == 8 + || value == 16 + || value == 32 + || value == 64 + || value == 128 => + { + value as u8 + } + ref op => return Err(WastError::new( + op.span(), + "the `bit-width` precondition requires a bit width of 1, 8, 16, 32, 64, or \ + 128" + .into(), + ) + .into()), + }; + + let ty = context.get_type_var_for_id(id)?; + context.assert_bit_width(pre.span, &ty, width); + Ok(()) + } + Constraint::IsPowerOfTwo => { + if pre.operands.len() != 1 { + return Err(WastError::new( + pre.span, + format!( + "the `is-power-of-two` precondition requires exactly 1 operand, found \ + {} operands", + pre.operands.len(), + ), + ) + .into()); + } + match &pre.operands[0] { + ConstraintOperand::Constant(Constant { id, .. }) => { + let ty = context.get_type_var_for_id(*id)?; + context.assert_is_integer(pre.span(), &ty); + Ok(()) + } + op => Err(WastError::new( + op.span(), + "`is-power-of-two` operands must be constant bindings".into(), + ) + .into()), + } + } + Constraint::FitsInNativeWord => { + if pre.operands.len() != 1 { + return Err(WastError::new( + pre.span, + format!( + "the `fits-in-native-word` precondition requires exactly 1 operand, found \ + {} operands", + pre.operands.len(), + ), + ) + .into()); + } + + match pre.operands[0] { + ConstraintOperand::ValueLiteral(_) => { + return Err(anyhow::anyhow!( + "the `fits-in-native-word` precondition requires a constant or variable as \ + its first operand" + ) + .into()) + } + ConstraintOperand::Constant(Constant { id, .. }) + | ConstraintOperand::Variable(Variable { id, .. }) => { + context.get_type_var_for_id(id)?; + Ok(()) + } + } + } + } +} + +#[cfg(test)] +mod tests { + use super::*; + + macro_rules! 
verify_ok { + ($name:ident, $src:expr) => { + #[test] + fn $name() { + let buf = wast::parser::ParseBuffer::new($src).expect("should lex OK"); + let opts = match wast::parser::parse::(&buf) { + Ok(opts) => opts, + Err(mut e) => { + e.set_path(Path::new(stringify!($name))); + e.set_text($src); + eprintln!("{}", e); + panic!("should parse OK") + } + }; + match verify(&opts) { + Ok(_) => return, + Err(mut e) => { + e.set_path(Path::new(stringify!($name))); + e.set_text($src); + eprintln!("{}", e); + panic!("should verify OK") + } + } + } + }; + } + + macro_rules! verify_err { + ($name:ident, $src:expr) => { + #[test] + fn $name() { + let buf = wast::parser::ParseBuffer::new($src).expect("should lex OK"); + let opts = match wast::parser::parse::(&buf) { + Ok(opts) => opts, + Err(mut e) => { + e.set_path(Path::new(stringify!($name))); + e.set_text($src); + eprintln!("{}", e); + panic!("should parse OK") + } + }; + match verify(&opts) { + Ok(_) => panic!("expected a verification error, but it verified OK"), + Err(mut e) => { + e.set_path(Path::new(stringify!($name))); + e.set_text($src); + eprintln!("{}", e); + return; + } + } + } + }; + } + + verify_ok!(bool_0, "(=> true true)"); + verify_ok!(bool_1, "(=> false false)"); + verify_ok!(bool_2, "(=> true false)"); + verify_ok!(bool_3, "(=> false true)"); + + verify_err!(bool_is_not_int_0, "(=> true 42)"); + verify_err!(bool_is_not_int_1, "(=> 42 true)"); + + verify_ok!( + bit_width_0, + " +(=> (when (iadd $x $y) + (bit-width $x 32) + (bit-width $y 32)) + (iadd $x $y)) +" + ); + verify_err!( + bit_width_1, + " +(=> (when (iadd $x $y) + (bit-width $x 32) + (bit-width $y 64)) + (iadd $x $y)) +" + ); + verify_err!( + bit_width_2, + " +(=> (when (iconst $C) + (bit-width $C)) + 5) +" + ); + verify_err!( + bit_width_3, + " +(=> (when (iconst $C) + (bit-width 32 32)) + 5) +" + ); + verify_err!( + bit_width_4, + " +(=> (when (iconst $C) + (bit-width $C $C)) + 5) +" + ); + verify_err!( + bit_width_5, + " +(=> (when (iconst $C) + 
(bit-width $C2 32)) + 5) +" + ); + verify_err!( + bit_width_6, + " +(=> (when (iconst $C) + (bit-width $C2 33)) + 5) +" + ); + + verify_ok!( + is_power_of_two_0, + " +(=> (when (imul $x $C) + (is-power-of-two $C)) + (ishl $x $(log2 $C))) +" + ); + verify_err!( + is_power_of_two_1, + " +(=> (when (imul $x $C) + (is-power-of-two)) + 5) +" + ); + verify_err!( + is_power_of_two_2, + " +(=> (when (imul $x $C) + (is-power-of-two $C $C)) + 5) +" + ); + + verify_ok!(pattern_ops_0, "(=> (iadd $x $C) 5)"); + verify_err!(pattern_ops_1, "(=> (iadd $x) 5)"); + verify_err!(pattern_ops_2, "(=> (iadd $x $y $z) 5)"); + + verify_ok!(unquote_0, "(=> $C $(log2 $C))"); + verify_err!(unquote_1, "(=> (iadd $C $D) $(log2 $C $D))"); + verify_err!(unquote_2, "(=> $x $(log2))"); + verify_ok!(unquote_3, "(=> $C $(neg $C))"); + verify_err!(unquote_4, "(=> $x $(neg))"); + verify_err!(unquote_5, "(=> (iadd $x $y) $(neg $x $y))"); + verify_err!(unquote_6, "(=> $x $(neg $x))"); + + verify_ok!(rhs_0, "(=> $x (iadd $x (iconst 0)))"); + verify_err!(rhs_1, "(=> $x (iadd $x))"); + verify_err!(rhs_2, "(=> $x (iadd $x 0 0))"); + + verify_err!(no_optimizations, ""); + + verify_err!( + duplicate_left_hand_sides, + " +(=> (iadd $x $y) 0) +(=> (iadd $x $y) 1) +" + ); + verify_err!( + canonically_duplicate_left_hand_sides_0, + " +(=> (iadd $x $y) 0) +(=> (iadd $y $x) 1) +" + ); + verify_err!( + canonically_duplicate_left_hand_sides_1, + " +(=> (iadd $X $Y) 0) +(=> (iadd $Y $X) 1) +" + ); + verify_err!( + canonically_duplicate_left_hand_sides_2, + " +(=> (iadd $x $x) 0) +(=> (iadd $y $y) 1) +" + ); + + verify_ok!( + canonically_different_left_hand_sides_0, + " +(=> (iadd $x $C) 0) +(=> (iadd $C $x) 1) +" + ); + verify_ok!( + canonically_different_left_hand_sides_1, + " +(=> (iadd $x $x) 0) +(=> (iadd $x $y) 1) +" + ); + + verify_ok!( + fits_in_native_word_0, + "(=> (when (iadd $x $y) (fits-in-native-word $x)) 0)" + ); + verify_err!( + fits_in_native_word_1, + "(=> (when (iadd $x $y) (fits-in-native-word)) 0)" 
+ ); + verify_err!( + fits_in_native_word_2, + "(=> (when (iadd $x $y) (fits-in-native-word $x $y)) 0)" + ); + verify_err!( + fits_in_native_word_3, + "(=> (when (iadd $x $y) (fits-in-native-word true)) 0)" + ); + + verify_err!(reduce_extend_0, "(=> (sextend (ireduce -1)) 0)"); + verify_err!(reduce_extend_1, "(=> (uextend (ireduce -1)) 0)"); + verify_ok!(reduce_extend_2, "(=> (sextend{i64} (ireduce{i32} -1)) 0)"); + verify_ok!(reduce_extend_3, "(=> (uextend{i64} (ireduce{i32} -1)) 0)"); + verify_err!(reduce_extend_4, "(=> (sextend{i64} (ireduce{i64} -1)) 0)"); + verify_err!(reduce_extend_5, "(=> (uextend{i64} (ireduce{i64} -1)) 0)"); + verify_err!(reduce_extend_6, "(=> (sextend{i32} (ireduce{i64} -1)) 0)"); + verify_err!(reduce_extend_7, "(=> (uextend{i32} (ireduce{i64} -1)) 0)"); + + verify_err!( + using_an_operation_as_an_immediate_in_lhs, + "(=> (iadd_imm (imul $x $y) $z) 0)" + ); + verify_err!( + using_an_operation_as_an_immediate_in_rhs, + "(=> (iadd (imul $x $y) $z) (iadd_imm (imul $x $y) $z))" + ); + + verify_err!( + using_a_condition_code_as_the_root_of_an_optimization, + "(=> eq eq)" + ); +} diff --git a/fuzz/Cargo.toml b/fuzz/Cargo.toml index 38fa092d58..f6ed67ac8e 100644 --- a/fuzz/Cargo.toml +++ b/fuzz/Cargo.toml @@ -14,6 +14,7 @@ cranelift-reader = { path = "../cranelift/reader" } cranelift-wasm = { path = "../cranelift/wasm" } libfuzzer-sys = "0.3.2" target-lexicon = "0.10" +peepmatic-fuzzing = { path = "../cranelift/peepmatic/crates/fuzzing" } wasmtime = { path = "../crates/wasmtime" } wasmtime-fuzzing = { path = "../crates/fuzzing" } @@ -56,5 +57,35 @@ path = "fuzz_targets/spectests.rs" test = false doc = false +[[bin]] +name = "peepmatic_simple_automata" +path = "fuzz_targets/peepmatic_simple_automata.rs" +test = false +doc = false + +[[bin]] +name = "peepmatic_fst_differential" +path = "fuzz_targets/peepmatic_fst_differential.rs" +test = false +doc = false + +[[bin]] +name = "peepmatic_parser" +path = "fuzz_targets/peepmatic_parser.rs" +test = 
false +doc = false + +[[bin]] +name = "peepmatic_compile" +path = "fuzz_targets/peepmatic_compile.rs" +test = false +doc = false + +[[bin]] +name = "peepmatic_interp" +path = "fuzz_targets/peepmatic_interp.rs" +test = false +doc = false + [features] binaryen = ['wasmtime-fuzzing/binaryen'] diff --git a/fuzz/fuzz_targets/peepmatic_compile.rs b/fuzz/fuzz_targets/peepmatic_compile.rs new file mode 100644 index 0000000000..623d747280 --- /dev/null +++ b/fuzz/fuzz_targets/peepmatic_compile.rs @@ -0,0 +1,8 @@ +#![no_main] + +use libfuzzer_sys::fuzz_target; +use peepmatic_fuzzing::compile::compile; + +fuzz_target!(|data: &[u8]| { + compile(data); +}); diff --git a/fuzz/fuzz_targets/peepmatic_fst_differential.rs b/fuzz/fuzz_targets/peepmatic_fst_differential.rs new file mode 100644 index 0000000000..00549112db --- /dev/null +++ b/fuzz/fuzz_targets/peepmatic_fst_differential.rs @@ -0,0 +1,8 @@ +#![no_main] +use libfuzzer_sys::fuzz_target; +use peepmatic_fuzzing::automata::fst_differential; +use std::collections::HashMap; + +fuzz_target!(|map: HashMap, u64>| { + fst_differential(map); +}); diff --git a/fuzz/fuzz_targets/peepmatic_interp.rs b/fuzz/fuzz_targets/peepmatic_interp.rs new file mode 100644 index 0000000000..dd3c1732ab --- /dev/null +++ b/fuzz/fuzz_targets/peepmatic_interp.rs @@ -0,0 +1,8 @@ +#![no_main] + +use libfuzzer_sys::fuzz_target; +use peepmatic_fuzzing::interp::interp; + +fuzz_target!(|data: &[u8]| { + interp(data); +}); diff --git a/fuzz/fuzz_targets/peepmatic_parser.rs b/fuzz/fuzz_targets/peepmatic_parser.rs new file mode 100644 index 0000000000..5664dad41b --- /dev/null +++ b/fuzz/fuzz_targets/peepmatic_parser.rs @@ -0,0 +1,8 @@ +#![no_main] + +use libfuzzer_sys::fuzz_target; +use peepmatic_fuzzing::parser::parse; + +fuzz_target!(|data: &[u8]| { + parse(data); +}); diff --git a/fuzz/fuzz_targets/peepmatic_simple_automata.rs b/fuzz/fuzz_targets/peepmatic_simple_automata.rs new file mode 100644 index 0000000000..ecf2fd7850 --- /dev/null +++ 
b/fuzz/fuzz_targets/peepmatic_simple_automata.rs @@ -0,0 +1,7 @@ +#![no_main] +use libfuzzer_sys::fuzz_target; +use peepmatic_fuzzing::automata::simple_automata; + +fuzz_target!(|input_output_pairs: Vec)>>| { + simple_automata(input_output_pairs); +});