Repository: microsoft/sca-fuzzer
Branch: main
Commit: 7cc132332d6a
Files: 378
Total size: 2.7 MB

Directory structure:
gitextract_198ykafh/

├── .editorconfig
├── .github/
│   ├── CODEOWNERS
│   └── workflows/
│       ├── kmodule-build.yaml
│       └── python-lint-and-test.yaml
├── .gitignore
├── .gitmodules
├── .pylintrc
├── AUTHORS
├── CHANGELOG.md
├── CODE_OF_CONDUCT.md
├── CONTRIBUTING.md
├── LICENSE
├── README.md
├── SECURITY.md
├── demo/
│   ├── README.md
│   ├── big-fuzz.yaml
│   ├── detect-foreshadow.yaml
│   ├── detect-mds.yaml
│   ├── detect-sco.yaml
│   ├── detect-v1-store.yaml
│   ├── detect-v1-var.yaml
│   ├── detect-v1.yaml
│   ├── detect-v4.yaml
│   ├── detect-zdi.yaml
│   ├── tsa-l1d/
│   │   ├── config.yaml
│   │   └── template.asm
│   └── tsa-sq/
│       ├── config.yaml
│       └── template.asm
├── docs/
│   ├── assets/
│   │   ├── branches.drawio
│   │   ├── dr-instrumentation.drawio
│   │   ├── dr-model.drawio
│   │   ├── fuzzing-flow.drawio
│   │   ├── tsa-sq-template.drawio
│   │   └── unicorn-model-state-machine.drawio
│   ├── faq/
│   │   └── general.md
│   ├── glossary.md
│   ├── howto/
│   │   ├── ask-a-question.md
│   │   ├── choose-contract.md
│   │   ├── design-campaign.md
│   │   ├── interpret-results.md
│   │   ├── minimize.md
│   │   ├── root-cause-a-violation.md
│   │   ├── use-macros.md
│   │   └── use-templates.md
│   ├── index.md
│   ├── internals/
│   │   ├── architecture/
│   │   │   ├── analysis.md
│   │   │   ├── code.md
│   │   │   ├── data.md
│   │   │   ├── exec.md
│   │   │   ├── fuzz.md
│   │   │   ├── isa.md
│   │   │   ├── logging.md
│   │   │   ├── mini.md
│   │   │   ├── model.md
│   │   │   └── overview.md
│   │   ├── code-structure.md
│   │   ├── contributing/
│   │   │   ├── code-style.md
│   │   │   ├── general.md
│   │   │   ├── git.md
│   │   │   └── overview.md
│   │   ├── index.md
│   │   └── model-backends/
│   │       ├── model-dr.md
│   │       └── model-unicorn.md
│   ├── intro/
│   │   ├── 01-overview.md
│   │   ├── 02-install.md
│   │   ├── 03-primer.md
│   │   ├── 04-tutorials.md
│   │   ├── start-here.md
│   │   └── tutorials/
│   │       ├── 01-first-fuzz.md
│   │       ├── 02-first-vuln.md
│   │       ├── 03-faults.md
│   │       ├── 04-isolation.md
│   │       ├── 05-extending.md
│   │       └── tsa-sq.md
│   ├── ref/
│   │   ├── artifact-file-formats.md
│   │   ├── binary-formats.md
│   │   ├── cli.md
│   │   ├── config.md
│   │   ├── index.md
│   │   ├── macros.md
│   │   ├── minimization-passes.md
│   │   ├── modes.md
│   │   ├── papers.md
│   │   ├── registers.md
│   │   ├── runtime-statistic.md
│   │   └── sandbox.md
│   ├── structure.md
│   ├── stylesheets/
│   │   └── extra.css
│   └── topics/
│       ├── actors.md
│       ├── contracts.md
│       ├── models.md
│       ├── test-case-generation.md
│       └── trace-analysis.md
├── mkdocs.yml
├── pyproject.toml
├── revizor.py
├── rvzr/
│   ├── __init__.py
│   ├── analyser.py
│   ├── arch/
│   │   ├── __init__.py
│   │   ├── arm64/
│   │   │   ├── __init__.py
│   │   │   ├── asm_parser.py
│   │   │   ├── config.py
│   │   │   ├── executor.py
│   │   │   ├── fuzzer.py
│   │   │   ├── generator.py
│   │   │   ├── get_spec.py
│   │   │   └── target_desc.py
│   │   └── x86/
│   │       ├── __init__.py
│   │       ├── asm_parser.py
│   │       ├── config.py
│   │       ├── executor.py
│   │       ├── fuzzer.py
│   │       ├── generator.py
│   │       ├── get_spec.py
│   │       └── target_desc.py
│   ├── asm_parser.py
│   ├── cli.py
│   ├── code_generator.py
│   ├── config.py
│   ├── data_generator.py
│   ├── elf_parser.py
│   ├── executor.py
│   ├── executor_km/
│   │   ├── .clang-format
│   │   ├── .gitignore
│   │   ├── Makefile
│   │   ├── arm64/
│   │   │   ├── asm_snippets.h
│   │   │   ├── entry_exit_points.h
│   │   │   ├── exception.S
│   │   │   ├── fault_handler.c
│   │   │   ├── macros.c
│   │   │   ├── page_tables_guest.c
│   │   │   ├── perf_counters.c
│   │   │   ├── registers.h
│   │   │   └── special_registers.c
│   │   ├── code_loader.c
│   │   ├── data_loader.c
│   │   ├── include/
│   │   │   ├── actor.h
│   │   │   ├── asm_snippets.h
│   │   │   ├── code_loader.h
│   │   │   ├── data_loader.h
│   │   │   ├── fault_handler.h
│   │   │   ├── hardware_desc.h
│   │   │   ├── input_parser.h
│   │   │   ├── macro_expansion.h
│   │   │   ├── main.h
│   │   │   ├── measurement.h
│   │   │   ├── page_tables_common.h
│   │   │   ├── page_tables_guest.h
│   │   │   ├── page_tables_host.h
│   │   │   ├── perf_counters.h
│   │   │   ├── sandbox_constants.h
│   │   │   ├── sandbox_manager.h
│   │   │   ├── shortcuts.h
│   │   │   ├── special_registers.h
│   │   │   ├── svm.h
│   │   │   ├── svm_constants.h
│   │   │   ├── test_case_parser.h
│   │   │   ├── vmx.h
│   │   │   └── vmx_config.h
│   │   ├── input_parser.c
│   │   ├── macro_expansion.c
│   │   ├── main.c
│   │   ├── measurement.c
│   │   ├── page_tables_host.c
│   │   ├── readme.md
│   │   ├── sandbox_manager.c
│   │   ├── test_case_parser.c
│   │   └── x86/
│   │       ├── asm_snippets.h
│   │       ├── entry_exit_points.h
│   │       ├── fault_handlers.S
│   │       ├── idt.c
│   │       ├── macros.c
│   │       ├── page_tables_guest.c
│   │       ├── perf_counters.c
│   │       ├── registers.h
│   │       ├── special_registers.c
│   │       ├── svm.c
│   │       └── vmx.c
│   ├── factory.py
│   ├── fuzzer.py
│   ├── instruction_spec.py
│   ├── isa_spec.py
│   ├── logs.py
│   ├── model.py
│   ├── model_dynamorio/
│   │   ├── Makefile
│   │   ├── __init__.py
│   │   ├── adapter/
│   │   │   ├── .clang-format
│   │   │   ├── .clang-tidy
│   │   │   ├── CMakeLists.txt
│   │   │   ├── main.c
│   │   │   ├── parser.c
│   │   │   ├── parser.h
│   │   │   ├── rcbf.h
│   │   │   ├── rdbf.h
│   │   │   ├── sandbox.c
│   │   │   ├── sandbox.h
│   │   │   ├── sandbox_const.h
│   │   │   └── test_case_entry.S
│   │   ├── backend/
│   │   │   ├── .clang-format
│   │   │   ├── .clang-tidy
│   │   │   ├── CMakeLists.txt
│   │   │   ├── cli.cpp
│   │   │   ├── dispatcher.cpp
│   │   │   ├── factory.cpp
│   │   │   ├── include/
│   │   │   │   ├── cli.hpp
│   │   │   │   ├── dispatcher.hpp
│   │   │   │   ├── factory.hpp
│   │   │   │   ├── logger.hpp
│   │   │   │   ├── observables.hpp
│   │   │   │   ├── speculator_abc.hpp
│   │   │   │   ├── speculators/
│   │   │   │   │   ├── cond.hpp
│   │   │   │   │   └── seq.hpp
│   │   │   │   ├── taint_tracker.hpp
│   │   │   │   ├── tracer_abc.hpp
│   │   │   │   ├── tracers/
│   │   │   │   │   ├── ct.hpp
│   │   │   │   │   ├── ind.hpp
│   │   │   │   │   └── pc.hpp
│   │   │   │   ├── types/
│   │   │   │   │   ├── debug_trace.hpp
│   │   │   │   │   ├── decoder.hpp
│   │   │   │   │   ├── file_buffer.hpp
│   │   │   │   │   ├── input_taint.hpp
│   │   │   │   │   ├── store_log.hpp
│   │   │   │   │   └── trace.hpp
│   │   │   │   └── util.hpp
│   │   │   ├── logger.cpp
│   │   │   ├── model.cpp
│   │   │   ├── speculator_abc.cpp
│   │   │   ├── speculators/
│   │   │   │   ├── cond.cpp
│   │   │   │   └── seq.cpp
│   │   │   ├── taint_tracker.cpp
│   │   │   ├── tracer_abc.cpp
│   │   │   ├── tracers/
│   │   │   │   ├── ct.cpp
│   │   │   │   ├── ind.cpp
│   │   │   │   └── pc.cpp
│   │   │   └── util.cpp
│   │   ├── model.py
│   │   └── trace_decoder.py
│   ├── model_unicorn/
│   │   ├── __init__.py
│   │   ├── coverage.py
│   │   ├── execution_context.py
│   │   ├── interpreter.py
│   │   ├── model.py
│   │   ├── speculator_abc.py
│   │   ├── speculators_basic.py
│   │   ├── speculators_fault.py
│   │   ├── speculators_vs.py
│   │   ├── taint_tracker.py
│   │   └── tracer.py
│   ├── postprocessing/
│   │   ├── __init__.py
│   │   ├── analysis_passes.py
│   │   ├── input_passes.py
│   │   ├── instruction_passes.py
│   │   ├── minimizer.py
│   │   ├── pass_abc.py
│   │   └── progress_printer.py
│   ├── py.typed
│   ├── sandbox.py
│   ├── stats.py
│   ├── target_desc.py
│   ├── tc_components/
│   │   ├── __init__.py
│   │   ├── actor.py
│   │   ├── instruction.py
│   │   ├── test_case_binary.py
│   │   ├── test_case_code.py
│   │   └── test_case_data.py
│   ├── traces.py
│   └── unicorn.pyi
└── tests/
    ├── .coveragerc
    ├── .gitignore
    ├── __init__.py
    ├── acceptance.bats
    ├── arm64/
    │   ├── asm/
    │   │   ├── actor_switch.asm
    │   │   ├── asm_basic.asm
    │   │   ├── asm_multiactor.asm
    │   │   ├── asm_symbol.asm
    │   │   ├── calls.asm
    │   │   ├── direct_jumps.asm
    │   │   ├── fault-div-zero-speculation.asm
    │   │   ├── fault_undefined_opcode.asm
    │   │   ├── macro_fault_handler.asm
    │   │   ├── model_flags_match.asm
    │   │   ├── model_match.asm
    │   │   ├── model_match_memory.asm
    │   │   ├── model_match_xmm.asm
    │   │   └── spectre_v1.asm
    │   ├── configs/
    │   │   ├── arch-actors.yaml
    │   │   ├── arch-faults.yaml
    │   │   ├── arch.yaml
    │   │   ├── archdiff.yaml
    │   │   ├── base-and-simd-categories.yaml
    │   │   ├── common.yaml
    │   │   ├── ct-cond.yaml
    │   │   ├── ct-seq.yaml
    │   │   ├── exceptions.yaml
    │   │   └── fault-handler.yaml
    │   ├── min_arm64.json
    │   ├── model_common.py
    │   ├── unit_generators.py
    │   └── unit_isa_loader.py
    ├── kernel_module.bats
    ├── pre-release.sh
    ├── quick-test.sh
    ├── runtests.sh
    ├── scripts/
    │   ├── create_rcbf_file.py
    │   └── create_rdbf_file.py
    ├── unit_analyser.py
    ├── unit_docs.py
    ├── unit_fuzzer.py
    ├── unit_isa_loader.py
    ├── unit_stats.py
    ├── unit_tc_components.py
    ├── unit_traces.py
    └── x86_tests/
        ├── __init__.py
        ├── asm/
        │   ├── actor_switch.asm
        │   ├── asm_basic.asm
        │   ├── asm_multiactor.asm
        │   ├── asm_symbol.asm
        │   ├── calls.asm
        │   ├── direct_jumps.asm
        │   ├── fault-div-overflow-speculation.asm
        │   ├── fault-div-zero-speculation.asm
        │   ├── fault_INT1.asm
        │   ├── fault_INT3.asm
        │   ├── fault_UD.asm
        │   ├── fault_load.asm
        │   ├── fault_ooo_mem_access.asm
        │   ├── fault_rmw.asm
        │   ├── macro_fault_handler.asm
        │   ├── minimization-after.asm
        │   ├── minimization-before.asm
        │   ├── model_flags_match.asm
        │   ├── model_match.asm
        │   ├── model_match_memory.asm
        │   ├── model_match_xmm.asm
        │   ├── spectre_ret.asm
        │   ├── spectre_v1.1.asm
        │   ├── spectre_v1.asm
        │   ├── spectre_v1_arch.asm
        │   ├── spectre_v1_independent.asm
        │   ├── spectre_v1_n2.asm
        │   ├── spectre_v2.asm
        │   ├── spectre_v4.asm
        │   └── vm_switch.asm
        ├── configs/
        │   ├── arch-actors.yaml
        │   ├── arch-dr.yaml
        │   ├── arch-faults.yaml
        │   ├── arch.yaml
        │   ├── archdiff.yaml
        │   ├── base-and-simd-categories.yaml
        │   ├── base-categories.yaml
        │   ├── common.yaml
        │   ├── copy.yaml
        │   ├── ct-cond.yaml
        │   ├── ct-deh.yaml
        │   ├── ct-seq.yaml
        │   ├── div-detect.yaml
        │   ├── div-verif.yaml
        │   ├── exceptions.yaml
        │   ├── fault-handler.yaml
        │   ├── l1tf-p-verif.yaml
        │   ├── l1tf-p.yaml
        │   ├── l1tf-w-verif.yaml
        │   ├── l1tf-w.yaml
        │   ├── meltdown-verif.yaml
        │   ├── meltdown.yaml
        │   ├── mpx-verif.yaml
        │   ├── mpx.yaml
        │   ├── ssbp-detect.yaml
        │   ├── ssbp-verif.yaml
        │   └── vm-switch.yaml
        ├── min_x86.json
        ├── model_common.py
        ├── unit_dr_decoder.py
        ├── unit_fuzzer.py
        ├── unit_generators.py
        ├── unit_isa_loader.py
        ├── unit_model.py
        └── unit_taint_tracker.py

================================================
FILE CONTENTS
================================================

================================================
FILE: .editorconfig
================================================
# https://editorconfig.org/

root = true

[*]
indent_style = space
indent_size = 4
insert_final_newline = true
trim_trailing_whitespace = true
end_of_line = lf
charset = utf-8
max_line_length = 100

[*.json]
indent_size = 2
keep_blank_lines_in_code = 0
keep_indents_on_empty_lines = false
keep_line_breaks = true
space_after_colon = true
space_after_comma = true
space_before_colon = true
space_before_comma = false
spaces_within_braces = false
spaces_within_brackets = false
wrap_long_lines = false
insert_final_newline = ignore

[Makefile]
indent_style = tab

[{*.bash,*.zsh,*.sh,*.bats}]
tab_width = 4
binary_ops_start_line = false
keep_column_alignment_padding = false
minify_program = false
redirect_followed_by_space = false
switch_cases_indented = false

[{*.yml,*.yaml}]
indent_size = 2
keep_indents_on_empty_lines = false
keep_line_breaks = true


================================================
FILE: .github/CODEOWNERS
================================================
*       @OleksiiOleksenko


================================================
FILE: .github/workflows/kmodule-build.yaml
================================================
# This workflow will build the kernel module on multiple Ubuntu versions
name: Kmodule Build

on:
  push:
    branches:
      - main
      - main-fixes
      - pre-release
      - dev
  pull_request:
    branches:
      - main
      - main-fixes
      - pre-release
      - dev

jobs:
  km_build:
    permissions:
      contents: read
    strategy:
      fail-fast: false
      matrix:
        include:
          - runner: ubuntu-latest
            name: x86_latest
          - runner: ubuntu-22.04
            name: x86_backward_compatible
          - runner: ubuntu-24.04-arm
            name: arm_latest
          - runner: ubuntu-22.04-arm
            name: arm_backward_compatible
    runs-on: ${{ matrix.runner }}
    name: km_build_${{ matrix.name }}
    steps:
    - uses: actions/checkout@v4
    - name: Install kernel headers
      run: sudo apt-get update && sudo apt-get install -y linux-headers-$(uname -r) linux-headers-generic
    - name: Build kernel module
      run: |
        set -o pipefail
        cd rvzr/executor_km
        make VMBUILD=1 2>&1 | tee build.log
        if grep -q "Error" build.log; then
          echo "Build failed"
          exit 1
        fi


================================================
FILE: .github/workflows/python-lint-and-test.yaml
================================================
# This workflow will install Python dependencies, run tests and lint with a variety of Python versions
# For more information see: https://docs.github.com/en/actions/automating-builds-and-tests/building-and-testing-python

name: Python Lint and Test
permissions:
  contents: read

on:
  push:
    branches:
      - main
      - main-fixes
      - pre-release
      - dev
  pull_request:
    branches:
      - main
      - main-fixes
      - pre-release
      - dev

jobs:
  build:

    runs-on: ubuntu-latest
    strategy:
      fail-fast: false
      matrix:
        python-version: ["3.9", "3.13"]

    steps:
    - uses: actions/checkout@v4
    - name: Set up Python ${{ matrix.python-version }}
      uses: actions/setup-python@v5
      with:
        python-version: ${{ matrix.python-version }}
    - name: Install dependencies
      run: |
        python -m pip install --upgrade pip
        python -m pip install flake8 mypy pylint
        python -m pip install .
    - name: Run
      run: |
        ./tests/runtests.sh --skip-km-tests


================================================
FILE: .gitignore
================================================
cmake-build-*/
build/
.vscode/
.mypy_cache/
.lsync*
venv/
**/__pycache__/
base.json
rvzr/arch/x86/*.json
*.code-workspace
*.o
rvzr/generated.asm
generated.asm
generated
rvzr/executor_km/.cache.mk
rvzr/executor_km/measurement.o.ur-safe
dbg/
site
dist/
.cache/
.claude/


================================================
FILE: .gitmodules
================================================


================================================
FILE: .pylintrc
================================================
[MAIN]

# Analyse import fallback blocks. This can be used to support both Python 2 and
# 3 compatible code, which means that the block might have code that exists
# only in one or another interpreter, leading to false positives when analysed.
analyse-fallback-blocks=no

# Clear in-memory caches upon conclusion of linting. Useful if running pylint
# in a server-like mode.
clear-cache-post-run=no

# Load and enable all available extensions. Use --list-extensions to see a list
# of all available extensions.
#enable-all-extensions=

# In error mode, messages with a category besides ERROR or FATAL are
# suppressed, and no reports are done by default. Error mode is compatible with
# disabling specific errors.
#errors-only=

# Always return a 0 (non-error) status code, even if lint errors are found.
# This is primarily useful in continuous integration scripts.
#exit-zero=

# A comma-separated list of package or module names from where C extensions may
# be loaded. Extensions are loaded into the active Python interpreter and may
# run arbitrary code.
extension-pkg-allow-list=

# A comma-separated list of package or module names from where C extensions may
# be loaded. Extensions are loaded into the active Python interpreter and may
# run arbitrary code. (This is an alternative name to extension-pkg-allow-list
# for backward compatibility.)
extension-pkg-whitelist=

# Return non-zero exit code if any of these messages/categories are detected,
# even if score is above --fail-under value. Syntax same as enable. Messages
# specified are enabled, while categories only check already-enabled messages.
fail-on=

# Specify a score threshold under which the program will exit with error.
fail-under=10

# Interpret the stdin as a python script, whose filename needs to be passed as
# the module_or_package argument.
#from-stdin=

# Files or directories to be skipped. They should be base names, not paths.
ignore=CVS

# Add files or directories matching the regular expressions patterns to the
# ignore-list. The regex matches against paths and can be in Posix or Windows
# format. Because '\\' represents the directory delimiter on Windows systems,
# it can't be used as an escape character.
ignore-paths=

# Files or directories matching the regular expression patterns are skipped.
# The regex matches against base names, not paths. The default value ignores
# Emacs file locks
ignore-patterns=^\.#

# List of module names for which member attributes should not be checked and
# will not be imported (useful for modules/projects where namespaces are
# manipulated during runtime and thus existing member attributes cannot be
# deduced by static analysis). It supports qualified module names, as well as
# Unix pattern matching.
ignored-modules=

# Python code to execute, usually for sys.path manipulation such as
# pygtk.require().
#init-hook=

# Use multiple processes to speed up Pylint. Specifying 0 will auto-detect the
# number of processors available to use, and will cap the count on Windows to
# avoid hangs.
jobs=1

# Control the amount of potential inferred values when inferring a single
# object. This can help the performance when dealing with large functions or
# complex, nested conditions.
limit-inference-results=100

# List of plugins (as comma separated values of python module names) to load,
# usually to register additional checkers.
load-plugins=

# Pickle collected data for later comparisons.
persistent=yes

# Resolve imports to .pyi stubs if available. May reduce no-member messages and
# increase not-an-iterable messages.
prefer-stubs=no

# Minimum Python version to use for version dependent checks. Will default to
# the version used to run pylint.
py-version=3.12

# Discover python modules and packages in the file system subtree.
recursive=no

# Add paths to the list of the source roots. Supports globbing patterns. The
# source root is an absolute path or a path relative to the current working
# directory used to determine a package namespace for modules located under the
# source root.
source-roots=

# Allow loading of arbitrary C extensions. Extensions are imported into the
# active Python interpreter and may run arbitrary code.
unsafe-load-any-extension=no

# In verbose mode, extra non-checker-related info will be displayed.
#verbose=


[BASIC]

# Naming style matching correct argument names.
argument-naming-style=snake_case

# Regular expression matching correct argument names. Overrides argument-
# naming-style. If left empty, argument names will be checked with the set
# naming style.
#argument-rgx=

# Naming style matching correct attribute names.
attr-naming-style=snake_case

# Regular expression matching correct attribute names. Overrides attr-naming-
# style. If left empty, attribute names will be checked with the set naming
# style.
#attr-rgx=

# Bad variable names which should always be refused, separated by a comma.
bad-names=foo,
          bar,
          baz,
          toto,
          tutu,
          tata

# Bad variable names regexes, separated by a comma. If names match any regex,
# they will always be refused
bad-names-rgxs=

# Naming style matching correct class attribute names.
class-attribute-naming-style=any

# Regular expression matching correct class attribute names. Overrides class-
# attribute-naming-style. If left empty, class attribute names will be checked
# with the set naming style.
#class-attribute-rgx=

# Naming style matching correct class constant names.
class-const-naming-style=UPPER_CASE

# Regular expression matching correct class constant names. Overrides class-
# const-naming-style. If left empty, class constant names will be checked with
# the set naming style.
#class-const-rgx=

# Naming style matching correct class names.
class-naming-style=PascalCase

# Regular expression matching correct class names. Overrides class-naming-
# style. If left empty, class names will be checked with the set naming style.
#class-rgx=

# Naming style matching correct constant names.
const-naming-style=UPPER_CASE

# Regular expression matching correct constant names. Overrides const-naming-
# style. If left empty, constant names will be checked with the set naming
# style.
#const-rgx=

# Minimum line length for functions/classes that require docstrings, shorter
# ones are exempt.
docstring-min-length=-1

# Naming style matching correct function names.
function-naming-style=snake_case

# Regular expression matching correct function names. Overrides function-
# naming-style. If left empty, function names will be checked with the set
# naming style.
#function-rgx=

# Good variable names which should always be accepted, separated by a comma.
good-names=i,
           j,
           k,
           ex,
           Run,
           _

# Good variable names regexes, separated by a comma. If names match any regex,
# they will always be accepted
good-names-rgxs=

# Include a hint for the correct naming format with invalid-name.
include-naming-hint=no

# Naming style matching correct inline iteration names.
inlinevar-naming-style=any

# Regular expression matching correct inline iteration names. Overrides
# inlinevar-naming-style. If left empty, inline iteration names will be checked
# with the set naming style.
#inlinevar-rgx=

# Naming style matching correct method names.
method-naming-style=snake_case

# Regular expression matching correct method names. Overrides method-naming-
# style. If left empty, method names will be checked with the set naming style.
#method-rgx=

# Naming style matching correct module names.
module-naming-style=snake_case

# Regular expression matching correct module names. Overrides module-naming-
# style. If left empty, module names will be checked with the set naming style.
#module-rgx=

# Colon-delimited sets of names that determine each other's naming style when
# the name regexes allow several styles.
name-group=

# Regular expression which should only match function or class names that do
# not require a docstring.
no-docstring-rgx=^_

# List of decorators that produce properties, such as abc.abstractproperty. Add
# to this list to register other decorators that produce valid properties.
# These decorators are taken in consideration only for invalid-name.
property-classes=abc.abstractproperty

# Regular expression matching correct type alias names. If left empty, type
# alias names will be checked with the set naming style.
#typealias-rgx=

# Regular expression matching correct type variable names. If left empty, type
# variable names will be checked with the set naming style.
#typevar-rgx=

# Naming style matching correct variable names.
variable-naming-style=snake_case

# Regular expression matching correct variable names. Overrides variable-
# naming-style. If left empty, variable names will be checked with the set
# naming style.
#variable-rgx=

[CLASSES]

# Warn about protected attribute access inside special methods
check-protected-access-in-special-methods=no

# List of method names used to declare (i.e. assign) instance attributes.
defining-attr-methods=__init__,
                      __new__,
                      setUp,
                      asyncSetUp,
                      __post_init__

# List of member names, which should be excluded from the protected access
# warning.
exclude-protected=_asdict,_fields,_replace,_source,_make,os._exit

# List of valid names for the first argument in a class method.
valid-classmethod-first-arg=cls

# List of valid names for the first argument in a metaclass class method.
valid-metaclass-classmethod-first-arg=mcs


[DESIGN]

# List of regular expressions of class ancestor names to ignore when counting
# public methods (see R0903)
exclude-too-few-public-methods=

# List of qualified class names to ignore when counting class parents (see
# R0901)
ignored-parents=

# Maximum number of arguments for function / method.
max-args=9  # NOTE: non-default (5) because we rely on data classes with many attributes

# Maximum number of attributes for a class (see R0902).
max-attributes=12  # NOTE: non-default (7) because we rely on data classes with many attributes

# Maximum number of boolean expressions in an if statement (see R0916).
max-bool-expr=5

# Maximum number of branches for function / method body.
max-branches=12

# Maximum number of locals for function / method body.
max-locals=15

# Maximum number of parents for a class (see R0901).
max-parents=7

# Maximum number of public methods for a class (see R0904).
max-public-methods=20

# Maximum number of return / yield for function / method body.
max-returns=6

# Maximum number of statements in function / method body.
max-statements=50

# Minimum number of public methods for a class (see R0903).
min-public-methods=1


[EXCEPTIONS]

# Exceptions that will emit a warning when caught.
overgeneral-exceptions=builtins.BaseException,builtins.Exception


[FORMAT]

# Expected format of line ending, e.g. empty (any line ending), LF or CRLF.
expected-line-ending-format=

# Regexp for a line that is allowed to be longer than the limit.
ignore-long-lines=^\s*(# )?<?https?://\S+>?$

# Number of spaces of indent required inside a hanging or continued line.
indent-after-paren=4

# String used as indentation unit. This is usually "    " (4 spaces) or "\t" (1
# tab).
indent-string='    '

# Maximum number of characters on a single line.
max-line-length=100

# Maximum number of lines in a module.
max-module-lines=1000

# Allow the body of a class to be on the same line as the declaration if body
# contains single statement.
single-line-class-stmt=no

# Allow the body of an if to be on the same line as the test if there is no
# else.
single-line-if-stmt=no


[IMPORTS]

# List of modules that can be imported at any level, not just the top level
# one.
allow-any-import-level=

# Allow explicit reexports by alias from a package __init__.
allow-reexport-from-package=no

# Allow wildcard imports from modules that define __all__.
allow-wildcard-with-all=no

# Deprecated modules which should not be used, separated by a comma.
deprecated-modules=

# Output a graph (.gv or any supported image format) of external dependencies
# to the given file (report RP0402 must not be disabled).
ext-import-graph=

# Output a graph (.gv or any supported image format) of all (i.e. internal and
# external) dependencies to the given file (report RP0402 must not be
# disabled).
import-graph=

# Output a graph (.gv or any supported image format) of internal dependencies
# to the given file (report RP0402 must not be disabled).
int-import-graph=

# Force import order to recognize a module as part of the standard
# compatibility libraries.
known-standard-library=

# Force import order to recognize a module as part of a third party library.
known-third-party=enchant

# Couples of modules and preferred modules, separated by a comma.
preferred-modules=


[LOGGING]

# The type of string formatting that logging methods do. `old` means using %
# formatting, `new` is for `{}` formatting.
logging-format-style=old

# Logging modules to check that the string format arguments are in logging
# function parameter format.
logging-modules=logging


[MESSAGES CONTROL]

# Only show warnings with the listed confidence levels. Leave empty to show
# all. Valid levels: HIGH, CONTROL_FLOW, INFERENCE, INFERENCE_FAILURE,
# UNDEFINED.
confidence=HIGH,
           CONTROL_FLOW,
           INFERENCE,
           INFERENCE_FAILURE,
           UNDEFINED

# Disable the message, report, category or checker with the given id(s). You
# can either give multiple identifiers separated by comma (,) or put this
# option multiple times (only on the command line, not in the configuration
# file where it should appear only once). You can also use "--disable=all" to
# disable everything first and then re-enable specific checks. For example, if
# you want to run only the similarities checker, you can use "--disable=all
# --enable=similarities". If you want to run only the classes checker, but have
# no Warning level messages displayed, use "--disable=all --enable=classes
# --disable=W".
disable=W0511,  # disable warnings on FIXME tag
        # invalid-name: we actively use Final to define read-only attributes,
        # so using UPPERCASE everywhere would lead to messy code
        c0103,
        # use-yield-from: the replacement does not always produce the same result functionally
        # and it breaks the code, so we disable this warning
        r1737,
        # unspecified-encoding: Revizor runs only on Linux, so we don't need to specify encoding
        w1514,
        # too-many-positional-arguments: we use data classes with many attributes
        r0917,
        # too-few-public-methods: we use data classes with many attributes
        r0903,
        # raise-missing-from
        w0707,
        # consider-using-sys-exit: just meh
        r1722,


# Enable the message, report, category or checker with the given id(s). You can
# either give multiple identifiers separated by comma (,) or put this option
# multiple times (only on the command line, not in the configuration file where
# it should appear only once). See also the "--disable" option for examples.
enable=


[METHOD_ARGS]

# List of qualified names (i.e., library.method) which require a timeout
# parameter e.g. 'requests.api.get,requests.api.post'
timeout-methods=requests.api.delete,requests.api.get,requests.api.head,requests.api.options,requests.api.patch,requests.api.post,requests.api.put,requests.api.request


[MISCELLANEOUS]

# List of note tags to take in consideration, separated by a comma.
notes=FIXME,
      XXX,
      TODO

# Regular expression of note tags to take in consideration.
notes-rgx=


[REFACTORING]

# Maximum number of nested blocks for function / method body
max-nested-blocks=5

# Complete names of functions that never return. When checking for
# inconsistent-return-statements if a never returning function is called then
# it will be considered as an explicit return statement and no message will be
# printed.
never-returning-functions=sys.exit,argparse.parse_error

# Let 'consider-using-join' be raised when the separator to join on would be
# non-empty (resulting in expected fixes of the type: ``"- " + " -
# ".join(items)``)
suggest-join-with-non-empty-separator=yes


[REPORTS]

# Python expression which should return a score less than or equal to 10. You
# have access to the variables 'fatal', 'error', 'warning', 'refactor',
# 'convention', and 'info' which contain the number of messages in each
# category, as well as 'statement' which is the total number of statements
# analyzed. This score is used by the global evaluation report (RP0004).
evaluation=max(0, 0 if fatal else 10.0 - ((float(5 * error + warning + refactor + convention) / statement) * 10))

# Template used to display messages. This is a python new-style format string
# used to format the message information. See doc for all details.
msg-template=

# Set the output format. Available formats are: text, parseable, colorized,
# json2 (improved json format), json (old json format) and msvs (visual
# studio). You can also give a reporter class, e.g.
# mypackage.mymodule.MyReporterClass.
#output-format=

# Tells whether to display a full report or only the messages.
reports=no

# Activate the evaluation score.
score=yes


[SIMILARITIES]

# Comments are removed from the similarity computation
ignore-comments=yes

# Docstrings are removed from the similarity computation
ignore-docstrings=yes

# Imports are removed from the similarity computation
ignore-imports=yes

# Signatures are removed from the similarity computation
ignore-signatures=yes

# Minimum lines number of a similarity.
min-similarity-lines=8


[SPELLING]

# Limits count of emitted suggestions for spelling mistakes.
max-spelling-suggestions=4

# Spelling dictionary name. No available dictionaries : You need to install
# both the python package and the system dependency for enchant to work.
spelling-dict=

# List of comma separated words that should be considered directives if they
# appear at the beginning of a comment and should not be checked.
spelling-ignore-comment-directives=fmt: on,fmt: off,noqa:,noqa,nosec,isort:skip,mypy:

# List of comma separated words that should not be checked.
spelling-ignore-words=

# A path to a file that contains the private dictionary; one word per line.
spelling-private-dict-file=

# Tells whether to store unknown words to the private dictionary (see the
# --spelling-private-dict-file option) instead of raising a message.
spelling-store-unknown-words=no


[STRING]

# This flag controls whether inconsistent-quotes generates a warning when the
# character used as a quote delimiter is used inconsistently within a module.
check-quote-consistency=no

# This flag controls whether the implicit-str-concat should generate a warning
# on implicit string concatenation in sequences defined over several lines.
check-str-concat-over-line-jumps=no


[TYPECHECK]

# List of decorators that produce context managers, such as
# contextlib.contextmanager. Add to this list to register other decorators that
# produce valid context managers.
contextmanager-decorators=contextlib.contextmanager

# List of members which are set dynamically and missed by pylint inference
# system, and so shouldn't trigger E1101 when accessed. Python regular
# expressions are accepted.
generated-members=

# Tells whether to warn about missing members when the owner of the attribute
# is inferred to be None.
ignore-none=yes

# This flag controls whether pylint should warn about no-member and similar
# checks whenever an opaque object is returned when inferring. The inference
# can return multiple potential results while evaluating a Python object, but
# some branches might not be evaluated, which results in partial inference. In
# that case, it might be useful to still emit no-member and other checks for
# the rest of the inferred objects.
ignore-on-opaque-inference=yes

# List of symbolic message names to ignore for Mixin members.
ignored-checks-for-mixins=no-member,
                          not-async-context-manager,
                          not-context-manager,
                          attribute-defined-outside-init

# List of class names for which member attributes should not be checked (useful
# for classes with dynamically set attributes). This supports the use of
# qualified names.
ignored-classes=optparse.Values,thread._local,_thread._local,argparse.Namespace

# Show a hint with possible names when a member name was not found. The aspect
# of finding the hint is based on edit distance.
missing-member-hint=yes

# The minimum edit distance a name should have in order to be considered a
# similar match for a missing member name.
missing-member-hint-distance=1

# The total number of similar names that should be taken in consideration when
# showing a hint for a missing member.
missing-member-max-choices=1

# Regex pattern to define which classes are considered mixins.
mixin-class-rgx=.*[Mm]ixin

# List of decorators that change the signature of a decorated function.
signature-mutators=


[VARIABLES]

# List of additional names supposed to be defined in builtins. Remember that
# you should avoid defining new builtins when possible.
additional-builtins=

# Tells whether unused global variables should be treated as a violation.
allow-global-unused-variables=yes

# List of names allowed to shadow builtins
allowed-redefined-builtins=

# List of strings which can identify a callback function by name. A callback
# name must start or end with one of those strings.
callbacks=cb_,
          _cb

# A regular expression matching the name of dummy variables (i.e. expected to
# not be used).
dummy-variables-rgx=_+$|(_[a-zA-Z0-9_]*[a-zA-Z0-9]+?$)|dummy|^ignored_|^unused_

# Argument names that match this expression will be ignored.
ignored-argument-names=_.*|^ignored_|^unused_

# Tells whether we should check for unused import in __init__ files.
init-import=no

# List of qualified module names which can have objects that can redefine
# builtins.
redefining-builtins-modules=six.moves,past.builtins,future.builtins,builtins,io


================================================
FILE: AUTHORS
================================================
Here is an inevitably incomplete list of MUCH-APPRECIATED CONTRIBUTORS:

Oleksii Oleksenko
Boris Koepf
Emanuele Vannacci
Jana Hofmann
Connor Shugg
Marco Guarnieri
Flavien Solt
Brian Fu
Alvise de Faveri Tron


================================================
FILE: CHANGELOG.md
================================================
# Changelog

All notable changes to Revizor will be documented in this file.

The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.0.0/),
and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0.html).

## [2.0.0] - 2026-01-10

### TL;DR

This release contains a major refactoring of the codebase, including many of the core modules. This breaks compatibility with previous versions, hence the major version bump.

In addition, several significant enhancements have been made:

- ARM64 is now fully supported.
- New DynamoRIO-based model backend has been added, which vastly improves ISA coverage on x86.
- The documentation has been fully restructured and expanded.

### Added

#### ARM64 Support
- Full hardware tracing support for ARM64 CPUs (#137)
- ARM64 executor, fuzzer, and code generator implementations
- ARM64 test suite with acceptance and unit tests
- ARM64 ISA specification and target description

#### DynamoRIO Model Backend
- New DynamoRIO-based model backend added, which completely re-implements the leakage modeling functionality
- New tracers: indirect memory access (IND) tracer and poisoning of faulty loads (#133)
- Contract-based input generation for DynamoRIO backend (#138)

#### Documentation
- Complete documentation restructure with tutorials, reference guides, and topic guides
- Five comprehensive tutorials covering first fuzzing campaign, vulnerability detection, fault handling, isolation, and extending Revizor
- Detailed primer on contracts and leakage models
- In-depth guides on choosing contracts, designing campaigns, interpreting results, and root-causing violations
- Architecture overview with detailed diagrams
- DynamoRIO backend instrumentation diagrams
- Sandbox and binary format documentation
- Actor and test case generation topics
- Glossary of key terms

#### Demos and Examples
- TSA-L1D demo configuration and template
- TSA-SQ demo files
- Improved detection demos for various Spectre variants

#### Testing and Development
- Unified tests for Unicorn and DynamoRIO backends
- Unit tests for traces, stats, and test case components
- Utility scripts for generating RCBF/RDBF test files
- Interface to run individual testing stages
- Improved test coverage and CI integration

#### Misc. Features
- Special value generation option for input data (not just random values)
- More verbose configuration error messages
- Better visibility for warnings in logger output
- Support for FS/GS segment register instructions in ISA specification
- Input differential minimization for observer actors

### Changed

**WARNING**: This release contains breaking changes! The release introduces a complete refactoring of the code structure, including many of the core modules. See docs/internals/architecture/overview.md for details.

#### Code Structure
- Renamed source directory from src/ to rvzr/ for better compliance with Python packaging standards
- Encapsulated all core components into dedicated modules (sandbox.py, actor.py, etc.)
- Moved all test case components into a dedicated directory rvzr/tc_components
- Refactored fuzzer.py to isolate the multi-stage filtering logic into a dedicated class
- Isolated utility classes into dedicated modules stats.py and logs.py
- Unicorn-based backend split into logical classes: Tracer, Speculator, TaintTracker, etc. (rvzr/model_unicorn)
- Reorganized into architecture-specific subdirectories (rvzr/arch/x86, rvzr/arch/arm64)
- Minimizer refactored to encapsulate each pass into a separate class (rvzr/postprocessing)
- Executor KM is now shared between x86 and ARM to avoid code duplication
- Consistent naming conventions for generators across architectures
- Improved code style and formatting

#### Configuration Options
- Many config options have been renamed during the refactoring process
- Refer to the updated documentation (`docs/ref/config.md`) for the new option names and their usage.

#### ISA Spec Format
- Renamed several fields in the json produced by the download_spec command

#### Testing Infrastructure
- Cleaner interface for test scripts
- GitHub Actions aligned with internal test scripts

#### Documentation Structure
- Reorganized into intro/, howto/, ref/, topics/, and internals/ sections
- Split architecture documentation into per-module pages
- Updated navigation structure in MkDocs


### Deprecated

- MPX support

---

## [1.3.2] - 2024-09-12

See git history for changes in version 1.3.2 and earlier.

[2.0.0]: https://github.com/microsoft/side-channel-fuzzer/compare/v1.3.2...v2.0.0
[1.3.2]: https://github.com/microsoft/side-channel-fuzzer/releases/tag/v1.3.2


================================================
FILE: CODE_OF_CONDUCT.md
================================================
# Microsoft Open Source Code of Conduct

This project has adopted the [Microsoft Open Source Code of Conduct](https://opensource.microsoft.com/codeofconduct/).

Resources:

- [Microsoft Open Source Code of Conduct](https://opensource.microsoft.com/codeofconduct/)
- [Microsoft Code of Conduct FAQ](https://opensource.microsoft.com/codeofconduct/faq/)
- Contact [opencode@microsoft.com](mailto:opencode@microsoft.com) with questions or concerns

================================================
FILE: CONTRIBUTING.md
================================================
# Contributing

As an open source project, Revizor welcomes contributions and suggestions.

## Contributor License Agreement and Code of Conduct

Most contributions require you to agree to a
Contributor License Agreement (CLA) declaring that you have the right to, and actually do, grant us
the rights to use your contribution. For details, visit https://cla.opensource.microsoft.com.

When you submit a pull request, a CLA bot will automatically determine whether you need to provide
a CLA and decorate the PR appropriately (e.g., status check, comment). Simply follow the instructions
provided by the bot. You will only need to do this once across all repos using our CLA.

This project has adopted the [Microsoft Open Source Code of Conduct](https://opensource.microsoft.com/codeofconduct/).
For more information see the [Code of Conduct FAQ](https://opensource.microsoft.com/codeofconduct/faq/) or
contact [opencode@microsoft.com](mailto:opencode@microsoft.com) with any additional questions or comments.

## Contribution Guidelines

Please refer to the [Guide to Contributing](https://microsoft.github.io/side-channel-fuzzer/internals/contributing/overview/) for an overview of how to contribute.


================================================
FILE: LICENSE
================================================
    MIT License

    Copyright (c) Microsoft Corporation.

    Permission is hereby granted, free of charge, to any person obtaining a copy
    of this software and associated documentation files (the "Software"), to deal
    in the Software without restriction, including without limitation the rights
    to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
    copies of the Software, and to permit persons to whom the Software is
    furnished to do so, subject to the following conditions:

    The above copyright notice and this permission notice shall be included in all
    copies or substantial portions of the Software.

    THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
    IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
    FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
    AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
    LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
    OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
    SOFTWARE.


================================================
FILE: README.md
================================================
# Revizor

![GitHub](https://img.shields.io/github/license/microsoft/side-channel-fuzzer)
![GitHub all releases](https://img.shields.io/github/downloads/microsoft/side-channel-fuzzer/total)
![GitHub contributors](https://img.shields.io/github/contributors/microsoft/side-channel-fuzzer)
![PyPI](https://img.shields.io/pypi/v/revizor-fuzzer?label=PyPI)
![PyPI - Downloads](https://img.shields.io/pypi/dm/revizor-fuzzer?label=%22PyPI%20Downloads%22)

Revizor is a security-oriented fuzzer for detecting information leaks in CPUs, such as [Spectre and Meltdown](https://meltdownattack.com/).
It tests CPUs against [Leakage Contracts](https://arxiv.org/abs/2006.03841) and searches for unexpected leaks.

<!-- For more details, see our [Paper](https://dl.acm.org/doi/10.1145/3503222.3507729) (open access [here](https://arxiv.org/abs/2105.06872)), and the follow-up papers ([1](https://arxiv.org/pdf/2301.07642.pdf), [2](https://www.usenix.org/conference/usenixsecurity23/presentation/hofmann)). -->

## Getting Started and Documentation

You can find a quick start guide at [Quick Start](https://microsoft.github.io/side-channel-fuzzer/intro/start-here/).

For detailed information on how to use Revizor, see [Documentation Pages](https://microsoft.github.io/side-channel-fuzzer/structure/).

For information on how to contribute to Revizor, see [CONTRIBUTING.md](CONTRIBUTING.md).

## Need Help with Revizor?

If you find a bug in Revizor, don't hesitate to [open an issue](https://github.com/microsoft/side-channel-fuzzer/issues).

If something is confusing or you need help in using Revizor, we have a [discussion page](https://github.com/microsoft/side-channel-fuzzer/discussions).

## Citing Revizor

To cite this project, you can use any of the following references:

1. Original paper that introduced the concept of Model-based Relation Testing as well as the Revizor tool:

    Oleksii Oleksenko, Christof Fetzer, Boris Köpf, Mark Silberstein. "[Revizor: Testing Black-box CPUs against Speculation Contracts](https://www.microsoft.com/en-us/research/publication/revizor-testing-black-box-cpus-against-speculation-contracts/)" in Proceedings of the 27th ACM International Conference on Architectural Support for Programming Languages and Operating Systems (ASPLOS), 2022.

2. Theoretical foundations of leakage contract:

    Marco Guarnieri, Boris Köpf, Jan Reineke, and Pepe Vila. "[Hardware-software contracts for secure speculation](https://www.microsoft.com/en-us/research/publication/hardware-software-contracts-for-secure-speculation/)" in Proceedings of the 2021 IEEE Symposium on Security and Privacy (SP), 2021.

3. Accessible summary of the two papers above, in a journal format:

    Oleksii Oleksenko, Christof Fetzer, Boris Köpf, Mark Silberstein. "Revizor: Testing Black-box CPUs against Speculation Contracts". In IEEE Micro, 2023.

4. Paper that introduced speculation filtering, observation filtering, and contract-based input generation:

    Oleksii Oleksenko, Marco Guarnieri, Boris Köpf, and Mark Silberstein. "[Hide and Seek with Spectres: Efficient discovery of speculative information leaks with random testing](https://www.microsoft.com/en-us/research/publication/hide-and-seek-with-spectres-efficient-discovery-of-speculative-information-leaks-with-random-testing/)" in Proceedings of the 2023 IEEE Symposium on Security and Privacy (SP), 2023.

5. Paper that introduced exception-based testing (i.e., focus on Meltdown, Foreshadow) into Revizor:

    Jana Hofmann, Emanuele Vannacci, Cédric Fournet, Boris Köpf, and Oleksii Oleksenko. "[Speculation at Fault: Modeling and Testing Microarchitectural Leakage of CPU Exceptions.](https://www.usenix.org/conference/usenixsecurity23/presentation/hofmann)" in Proceedings of 32nd USENIX Security Symposium (USENIX Security), 2023.

6. Paper that introduced testing of cross-VM and user-kernel leaks in Revizor, as well as presented TSA attacks on AMD CPUs:

    Oleksii Oleksenko, Flavien Solt, Cédric Fournet, Jana Hofmann, Boris Köpf, and Stavros Volos. "[Enter, Exit, Page Fault, Leak: Testing Isolation Boundaries for Microarchitectural Leaks](https://www.microsoft.com/en-us/research/wp-content/uploads/2025/07/Enter-Exit-SP26.pdf)" (to be published) in Proceedings of the 2026 IEEE Symposium on Security and Privacy (SP), 2026.

## Trademarks

This project may contain trademarks or logos for projects, products, or services. Authorized use of Microsoft
trademarks or logos is subject to and must follow
[Microsoft's Trademark & Brand Guidelines](https://www.microsoft.com/en-us/legal/intellectualproperty/trademarks/usage/general).
Use of Microsoft trademarks or logos in modified versions of this project must not cause confusion or imply Microsoft sponsorship.
Any use of third-party trademarks or logos are subject to those third-party's policies.


================================================
FILE: SECURITY.md
================================================
<!-- BEGIN MICROSOFT SECURITY.MD V0.0.5 BLOCK -->

## Security

Microsoft takes the security of our software products and services seriously, which includes all source code repositories managed through our GitHub organizations, which include [Microsoft](https://github.com/Microsoft), [Azure](https://github.com/Azure), [DotNet](https://github.com/dotnet), [AspNet](https://github.com/aspnet), [Xamarin](https://github.com/xamarin), and [our GitHub organizations](https://opensource.microsoft.com/).

If you believe you have found a security vulnerability in any Microsoft-owned repository that meets [Microsoft's definition of a security vulnerability](https://docs.microsoft.com/en-us/previous-versions/tn-archive/cc751383(v=technet.10)), please report it to us as described below.

## Reporting Security Issues

**Please do not report security vulnerabilities through public GitHub issues.**

Instead, please report them to the Microsoft Security Response Center (MSRC) at [https://msrc.microsoft.com/create-report](https://msrc.microsoft.com/create-report).

If you prefer to submit without logging in, send email to [secure@microsoft.com](mailto:secure@microsoft.com).  If possible, encrypt your message with our PGP key; please download it from the [Microsoft Security Response Center PGP Key page](https://www.microsoft.com/en-us/msrc/pgp-key-msrc).

You should receive a response within 24 hours. If for some reason you do not, please follow up via email to ensure we received your original message. Additional information can be found at [microsoft.com/msrc](https://www.microsoft.com/msrc). 

Please include the requested information listed below (as much as you can provide) to help us better understand the nature and scope of the possible issue:

  * Type of issue (e.g. buffer overflow, SQL injection, cross-site scripting, etc.)
  * Full paths of source file(s) related to the manifestation of the issue
  * The location of the affected source code (tag/branch/commit or direct URL)
  * Any special configuration required to reproduce the issue
  * Step-by-step instructions to reproduce the issue
  * Proof-of-concept or exploit code (if possible)
  * Impact of the issue, including how an attacker might exploit the issue

This information will help us triage your report more quickly.

If you are reporting for a bug bounty, more complete reports can contribute to a higher bounty award. Please visit our [Microsoft Bug Bounty Program](https://microsoft.com/msrc/bounty) page for more details about our active programs.

## Preferred Languages

We prefer all communications to be in English.

## Policy

Microsoft follows the principle of [Coordinated Vulnerability Disclosure](https://www.microsoft.com/en-us/msrc/cvd).

<!-- END MICROSOFT SECURITY.MD BLOCK -->

================================================
FILE: demo/README.md
================================================
This directory contains a set of demo configurations for fuzzing various known CPU vulnerabilities using Revizor.
Each config here is intentionally made to detect only one type of vulnerability.

For example, if you fuzz an Intel CPU with `detect-v1.yaml`, you will likely detect an instance of Spectre V1.
(Of course, there is always a chance that you will find a new, previously unknown vulnerability with this config, but the likelihood is rather low.)

The commands below assume that the ISA spec (downloaded via `rvzr download_spec`) is stored in `base.json`.

## [Spectre V1](https://meltdownattack.com/)

```
rvzr fuzz -s base.json -c demo/detect-v1.yaml -i 50 -n 10000
```
Expected duration - several seconds.

## Spectre V1 (store variant)

```
rvzr fuzz -s base.json -c demo/detect-v1-store.yaml -i 50 -n 10000
```
Expected duration - several seconds.

## Spectre V1-Var ([description](https://dl.acm.org/doi/10.1145/3503222.3507729) and [here](https://eprint.iacr.org/2022/715.pdf))

```
rvzr fuzz -s base.json -c demo/detect-v1-var.yaml -i 50 -n 10000
```
Expected duration - several hours.

## [MDS](https://mdsattacks.com/) or [LVI-Null](https://lviattack.eu/), depending on the CPU model

Note: only Intel CPUs.

```
rvzr fuzz -s base.json -c demo/detect-mds.yaml -i 50 -n 10000
```
Expected duration - several minutes.

## Spectre V4 ([description](https://www.cyberus-technology.de/posts/2018-05-22-intel-store-load-spectre-vulnerability.html))
```
rvzr fuzz -s base.json -c demo/detect-v4.yaml -i 50 -n 10000
```
Expected duration - 5-20 minutes.

## Zero Divisor Injection (ZDI)

Note: only Intel CPUs.

```
rvzr fuzz -s base.json -c demo/detect-zdi.yaml -i 50 -n 10000
```
Expected duration - several minutes.

## String Comparison Overrun (SCO)

```
rvzr fuzz -s base.json -c demo/detect-sco.yaml -i 50 -n 10000
```
Expected duration - several minutes.

## Foreshadow (simplified version)

Note: only Intel CPUs.

```
rvzr fuzz -s base.json -c demo/detect-foreshadow.yaml -i 50 -n 10000
```
Expected duration - several minutes.

## Transient Scheduler Attack, Store Queue variant (TSA-SQ)

Note: only AMD CPUs vulnerable to TSA.

```
rvzr tfuzz -s base.json -c demo/tsa-sq/config.yaml -t demo/tsa-sq/template.asm -i 50 -n 10000
```
Expected duration - several minutes.

## Transient Scheduler Attack, L1D Cache variant (TSA-L1D)

Note: only AMD CPUs vulnerable to TSA.

```
rvzr tfuzz -s base.json -c demo/tsa-l1d/config.yaml -t demo/tsa-l1d/template.asm -i 50 -n 10000
```
Expected duration - several minutes.


================================================
FILE: demo/big-fuzz.yaml
================================================
instruction_set: x86-64

# Model
contract_observation_clause: ct
contract_execution_clause:
  - seq

# Actors
actors:
  - main:
    - data_properties:
      - present: true

# Executor
executor_mode: P+P
x86_executor_enable_ssbp_patch: true

# Program generator
program_size: 64
avg_mem_accesses: 16
max_bb_per_function: 1  # straight-line code only
min_bb_per_function: 1
min_successors_per_bb: 1
max_successors_per_bb: 1

instruction_categories:
  - BASE-BINARY
  - BASE-BITBYTE
  - BASE-CMOV
  - BASE-COND_BR
  - BASE-CONVERT
  - BASE-DATAXFER
  - BASE-FLAGOP
  - BASE-LOGICAL
  - BASE-MISC
  - BASE-NOP
  - BASE-WIDENOP
  - BASE-POP
  - BASE-PUSH
  - BASE-SEMAPHORE
  - BASE-SETCC
  # - BASE-STRINGOP  # commented out as it triggers a known information leak
  - LONGMODE-CONVERT
  - LONGMODE-DATAXFER
  - LONGMODE-SEMAPHORE
  # - LONGMODE-STRINGOP  # commented out as it triggers a known information leak
  - SSE-DATAXFER
  - SSE-LOGICAL_FP
  - SSE-MISC
  - SSE-SSE

# Input generator
data_generator_entropy_bits: 24
inputs_per_class: 2

# Fuzzer
enable_speculation_filter: true
enable_observation_filter: true
enable_fast_path_model: true
coverage_type: model_instructions

# Output
color: true
logging_modes:
  - info
  - stat
  - dbg_generator
  # - dbg_timestamp
  # - dbg_violation
  # - dbg_dump_htraces
  # - dbg_dump_ctraces
  # - dbg_dump_traces_unlimited
  # - dbg_model
  - dbg_coverage
  # - dbg_priming
  # - dbg_executor_raw


================================================
FILE: demo/detect-foreshadow.yaml
================================================
# This demo illustrates detection of Foreshadow

# contract
contract_observation_clause: loads+stores+pc
contract_execution_clause:
  - delayed-exception-handling

# tested instructions
instruction_categories:
  - BASE-BINARY
  - BASE-BITBYTE
  - BASE-CMOV
  - BASE-CONVERT
  - BASE-DATAXFER
  - BASE-LOGICAL
  - BASE-MISC
  - BASE-NOP
  - BASE-POP
  - BASE-PUSH
  - BASE-SETCC

instruction_blocklist_append:
  - DIV
  - IDIV

actors:
  - main:
    - data_properties:
      - present: false
      - writable: false

# misc. fuzzing configuration
enable_speculation_filter: true
enable_observation_filter: true
program_size: 16
avg_mem_accesses: 8
inputs_per_class: 2
executor_warmups: 2
x86_disable_div64: false


================================================
FILE: demo/detect-mds.yaml
================================================
# contract
contract_observation_clause: ct
contract_execution_clause:
  - seq-assist

# tested instructions
instruction_categories:
  - BASE-BITBYTE
  - BASE-CMOV
  - BASE-LOGICAL

# environment
actors:
  - main:
    - data_properties:
      - accessed: False

# fuzzing configuration
enable_speculation_filter: true
enable_observation_filter: true
program_size: 20
avg_mem_accesses: 10
inputs_per_class: 2

program_generator_seed: 955240


================================================
FILE: demo/detect-sco.yaml
================================================
# contract
contract_observation_clause: ct
contract_execution_clause:
  - seq

# tested instructions
instruction_categories:
  - BASE-BITBYTE
  - BASE-CMOV
  - BASE-LOGICAL
  - BASE-STRINGOP
  - BASE-FLAGOP

# fuzzing configuration
enable_speculation_filter: true
enable_observation_filter: true
program_size: 20
avg_mem_accesses: 10
inputs_per_class: 2


program_generator_seed: 910000


================================================
FILE: demo/detect-v1-store.yaml
================================================
file: !include detect-v1.yaml

# prevent speculative stores from being observed
contract_observation_clause: ct-nonspecstore
contract_execution_clause:
  - cond


================================================
FILE: demo/detect-v1-var.yaml
================================================
file: !include detect-v1.yaml

# contract
# contract_observation_clause: ct
contract_execution_clause:
  - cond
# analyser_subsets_is_violation: false

# # tested instructions
# instruction_categories:
#   - BASE-BITBYTE
#   - BASE-COND_BR
#   - BASE-CMOV
#   - BASE-LOGICAL

# # fuzzing configuration
# enable_speculation_filter: true
# enable_observation_filter: true
# data_generator_entropy_bits: 16
# min_bb_per_function: 2
# max_bb_per_function: 2
# program_size: 20
# avg_mem_accesses: 10
# inputs_per_class: 2


================================================
FILE: demo/detect-v1.yaml
================================================
# contract
contract_observation_clause: loads+stores+pc
contract_execution_clause:
  - no_speculation

# tested instructions
instruction_categories:
  - BASE-BINARY
  - BASE-BITBYTE
  - BASE-CMOV
  - BASE-COND_BR
  - BASE-CONVERT
  - BASE-DATAXFER
  - BASE-LOGICAL
  - BASE-MISC
  - BASE-NOP
  - BASE-POP
  - BASE-PUSH
  - BASE-SETCC

# fuzzing configuration
enable_speculation_filter: true
enable_observation_filter: true
program_size: 16
avg_mem_accesses: 8
inputs_per_class: 2

program_generator_seed: 100


================================================
FILE: demo/detect-v4.yaml
================================================
# contract
contract_observation_clause: ct
contract_execution_clause:
  - seq

# tested instructions
instruction_categories:
  - BASE-BITBYTE
  - BASE-CMOV
  - BASE-LOGICAL

# environment
x86_executor_enable_ssbp_patch: false

# fuzzing configuration
enable_speculation_filter: true
enable_observation_filter: true
program_size: 20
avg_mem_accesses: 10
inputs_per_class: 2

# reduce entropy (not strictly required for detection, but makes the demo finish faster)
data_generator_entropy_bits: 10

program_generator_seed: 1000000


================================================
FILE: demo/detect-zdi.yaml
================================================
# contract
contract_observation_clause: ct
contract_execution_clause:
  - seq

# tested instructions
instruction_categories:
  - BASE-BITBYTE
  - BASE-BINARY
  - BASE-CMOV
  - BASE-LOGICAL

# fuzzing configuration
enable_speculation_filter: true
enable_observation_filter: true
program_size: 64
avg_mem_accesses: 24
inputs_per_class: 2

program_generator_seed: 252633
x86_disable_div64: false


================================================
FILE: demo/tsa-l1d/config.yaml
================================================
instruction_set: x86-64
instruction_categories:
  - BASE-BINARY
  - BASE-BITBYTE
  - BASE-CMOV
  - BASE-COND_BR
  - BASE-CONVERT
  - BASE-DATAXFER
  - BASE-FLAGOP
  - BASE-LOGICAL
  - BASE-MISC
  - BASE-NOP
  - BASE-POP
  - BASE-PUSH
  - BASE-SEMAPHORE
  - BASE-SETCC
  - BASE-WIDENOP

actors:
  - main:
    - mode: "host"
    - privilege_level: "kernel"
  - vmvictim:
    - mode: "guest"
    - privilege_level: "kernel"
  - vm:
    - mode: "guest"
    - observer: true
    - privilege_level: "kernel"
    - data_properties:
      - writable: false

contract_observation_clause: ct-ni

max_bb_per_function: 1

executor_mode: F+R
executor_sample_sizes:
  - 15
  - 40
  - 160
  - 320

executor_filtering_repetitions: 5
x86_enable_hpa_gpa_collisions: true

program_generator_seed: 20000000
data_generator_seed: 1000000
inputs_per_class: 2

analyser_stat_threshold: 0.1

# enable_speculation_filter: true
enable_observation_filter: true
enable_fast_path_model: true

# color: true
logging_modes:
  - info
  # - stat


================================================
FILE: demo/tsa-l1d/template.asm
================================================
.intel_syntax noprefix

# Test case template for the TSA-L1D demo (passed to the fuzzer together with
# the config.yaml in the same directory).
# The template defines code for three sections: main, vmvictim, and vm.
# NOTE(review): these presumably correspond to the actors of the same names
# declared in config.yaml (host, victim guest, observer guest) - confirm.
#
# Control flow as laid out by the switch targets below:
#   main_0 -> vm_0 -> main_1 -> vmvictim_0 -> main_2 -> vm_1 -> main_3
#          -> vm_2 -> main_4
# NOTE(review): the exact semantics of the macro labels are defined by the
# fuzzer, not by this file; the summary above is inferred from their names
# and arguments.

# ----------------------------- Hypervisor (Host) ----------------------------
.section .data.main
.function_main_0:
    # observer start
    .macro.set_h2g_target.vm.function_vm_0:
    .macro.set_g2h_target.main.function_main_1:
    .macro.switch_h2g.vm.0:


.function_main_1:
    .macro.landing_g2h.main_1:

    # hand control to the victim guest; it returns to main_2
    .macro.set_h2g_target.vmvictim.function_vmvictim_0:
    .macro.set_g2h_target.main.function_main_2:
    .macro.switch_h2g.vmvictim.0:

.function_main_2:
    .macro.landing_g2h.main_2:
    .macro.set_h2g_target.vm.function_vm_1:
    .macro.set_g2h_target.main.function_main_3:

    # zero rax, rbx, rcx, rdx, rsi, rdi before entering the observer guest
    xor rax, rax  # noremove
    xor rbx, rbx  # noremove
    xor rcx, rcx  # noremove
    xor rdx, rdx  # noremove
    xor rsi, rsi  # noremove
    xor rdi, rdi  # noremove
    # insert flushing patches here
.patch_placeholder:

    .macro.switch_h2g.vm.1:

.function_main_3:
    .macro.landing_g2h.main_3:

.macro.fault_handler:
.patch_placeholder_fault_handler:

    .macro.set_h2g_target.vm.function_vm_2:
    .macro.set_g2h_target.main.function_main_4:
    .macro.switch_h2g.vm.2:

.function_main_4:
    .macro.landing_g2h.main_4:
    nop

# ----------------------------- VM - Victim ----------------------------------
.section .data.vmvictim
.function_vmvictim_0:
    .macro.landing_h2g.vmvictim_0:

    # secret injection
    .macro.random_instructions.64.32.main_1:

    .macro.switch_g2h.main.vmvictim_0:
    lfence


# ----------------------------- VM - Observer --------------------------------
.section .data.vm
.function_vm_0:
    .macro.landing_h2g.vm_0:
    .macro.measurement_start:
    .macro.switch_g2h.main.vm_0:
    lfence


.function_vm_1:
    .macro.landing_h2g.vm_1:
    # load six consecutive qwords from [r14 + 0x2000 .. r14 + 0x2028]
    # into rax, rbx, rcx, rdx, rsi, rdi, then fence
    # NOTE(review): r14 presumably holds the base of this actor's data area - confirm
    xor rax, rax  # noremove
    mov rax, qword ptr [r14 + 0x2000] # noremove
    mov rbx, qword ptr [r14 + 0x2008] # noremove
    mov rcx, qword ptr [r14 + 0x2010] # noremove
    mov rdx, qword ptr [r14 + 0x2018] # noremove
    mov rsi, qword ptr [r14 + 0x2020] # noremove
    mov rdi, qword ptr [r14 + 0x2028] # noremove
    mfence # noremove

    # secret retrieval
    .macro.random_instructions.64.32.vm_1:

    # make sure the model doesn't attempt to go further than this point
    lfence  # noremove

    .macro.measurement_end.vm_1:
    .macro.switch_g2h.main.1:
    lfence


.function_vm_2:
    .macro.landing_h2g.vm_2:
    # second measurement end point, reached via main_3 (after the fault handler label)
    .macro.measurement_end.vm_2:
    .macro.switch_g2h.main.2:
    lfence


# ----------------------------- Exit -----------------------------------------
.section .data.main
.test_case_exit:


================================================
FILE: demo/tsa-sq/config.yaml
================================================
# Fuzzing campaign configuration for the tsa-sq demo.
# The actor names declared below (main, user) match the `.data.<actor>`
# sections of demo/tsa-sq/template.asm.
instruction_set: x86-64
# Instruction categories enabled for this campaign
# (presumably the pool used to expand the random-instruction macros of the
# template; confirm against the generator).
instruction_categories:
  - BASE-BINARY
  - BASE-BITBYTE
  - BASE-CMOV
  - BASE-COND_BR
  - BASE-CONVERT
  - BASE-DATAXFER
  - BASE-FLAGOP
  - BASE-LOGICAL
  - BASE-MISC
  - BASE-NOP
  - BASE-POP
  - BASE-PUSH
  - BASE-SEMAPHORE
  - BASE-SETCC
  - BASE-WIDENOP


# `user-to-kernel-access` is allowed at the top level and listed again in the
# fault_blocklist of the `main` actor below
# (presumably this leaves the fault enabled for the `user` actor only; confirm
# how the allowlist and the per-actor blocklist are combined).
faults_allowlist:
  - user-to-kernel-access

# Two host-mode actors: `main` at kernel privilege and `user` at user
# privilege. `user` is the only actor flagged as observer.
actors:
  - main:
    - mode: "host"
    - privilege_level: "kernel"
    - fault_blocklist:
      - user-to-kernel-access
  - user:
    - mode: "host"
    - observer: true
    - privilege_level: "user"
    - data_properties:
      - present: true

contract_observation_clause: ct-ni

# One basic block per function.
max_bb_per_function: 1

executor_mode: F+R
# Increasing list of sample sizes
# (presumably tried in order by the executor; confirm).
executor_sample_sizes:
  - 15
  - 40
  - 160
  - 320

executor_filtering_repetitions: 5
# NOTE(review): no guest-mode actor is declared in this file; confirm that
# this option is needed here (demo/tsa-l1d/config.yaml sets the same value).
x86_enable_hpa_gpa_collisions: true

# Fixed generator seeds (presumably so that the demo is reproducible).
program_generator_seed: 20000000
data_generator_seed: 1000000
inputs_per_class: 2

# NOTE(review): demo/tsa-l1d/config.yaml uses 0.1 for this threshold; confirm
# that the difference between the two demos is intentional.
analyser_stat_threshold: 0.2

# The speculation filter is left disabled (commented out); only the
# observation filter and the fast-path model are switched on.
# enable_speculation_filter: true
enable_observation_filter: true
enable_fast_path_model: true

# Optional settings kept for convenience: colored output and the `stat`
# logging mode are commented out, so only `info` logging is active.
# color: true
logging_modes:
  - info
  # - stat


================================================
FILE: demo/tsa-sq/template.asm
================================================
# Test-case template for the tsa-sq demo.
#
# Sections map to the actors `main` (kernel) and `user`. Going by the targets
# named in the set_*_target / switch_* macros below, control is handed over
# in this order (macro semantics are defined outside this file; confirm
# against the macro documentation):
#
#   main_0     -> user_0   observer: measurement_start
#   main_1     -> user_1   kernel runs random instructions ("secret
#                          injection") first; observer then does loads,
#                          random instructions ("secret retrieval") and
#                          measurement_end
#   main_2     -> user_2   observer: measurement_end
#   main_3     -> test_case_exit
.intel_syntax noprefix

# ----------------------------- Kernel-mode Actor (Victim) -------------------
.section .data.main
.function_main_0:
    # observer start
    .macro.set_k2u_target.user.function_user_0:
    .macro.set_u2k_target.main.function_main_1:
    .macro.switch_k2u.user.0:


.function_main_1:
    .macro.landing_u2k.main_1:

    # secret injection
    .macro.random_instructions.64.32.main_1:

    # hand over to the observer; it is set up to return to function_main_2
    .macro.set_k2u_target.user.function_user_1:
    .macro.set_u2k_target.main.function_main_2:
    .macro.switch_k2u.user.1:

.function_main_2:
    .macro.landing_u2k.main_2:

# The fault handler label sits directly after the main_2 landing, so the
# code below is shared by the regular return from user_1 and (presumably) by
# the fault path.
.macro.fault_handler:
    .macro.set_k2u_target.user.function_user_2:
    .macro.set_u2k_target.main.function_main_3:
    .macro.switch_k2u.user.2:

.function_main_3:
    .macro.landing_u2k.main_3:
    nop

# ----------------------------- User-mode Actor ------------------------------
.section .data.user
.function_user_0:
    .macro.landing_k2u.user_0:
    .macro.measurement_start:
    .macro.switch_u2k.main.user_0:
    lfence


.function_user_1:
    .macro.landing_k2u.user_1:
    # load six consecutive qwords from r14 + 0x2000 .. r14 + 0x2028 into
    # rax, rbx, rcx, rdx, rsi and rdi, followed by a fence
    # NOTE(review): the `xor rax, rax` result is overwritten by the very next
    # load; presumably kept on purpose (it is marked noremove) - confirm.
    # NOTE(review): the `lfence` closing this sequence carries no `# noremove`
    # marker, whereas the matching `mfence` in demo/tsa-l1d/template.asm does;
    # confirm whether the marker was omitted on purpose.
    xor rax, rax  # noremove
    mov rax, qword ptr [r14 + 0x2000] # noremove
    mov rbx, qword ptr [r14 + 0x2008] # noremove
    mov rcx, qword ptr [r14 + 0x2010] # noremove
    mov rdx, qword ptr [r14 + 0x2018] # noremove
    mov rsi, qword ptr [r14 + 0x2020] # noremove
    mov rdi, qword ptr [r14 + 0x2028] # noremove
    lfence

    # secret retrieval
    .macro.random_instructions.64.32.user_1:

    # make sure the model doesn't attempt to go further than this point
    lfence  # noremove

    .macro.measurement_end.user_1:
    .macro.switch_u2k.main.1:
    lfence


# Reached through the switch that follows the fault handler label in main_2;
# it only ends the measurement and returns to the kernel.
.function_user_2:
    .macro.landing_k2u.user_2:
    .macro.measurement_end.user_2:
    .macro.switch_u2k.main.2:
    lfence


# ----------------------------- Exit -----------------------------------------
.section .data.main
.test_case_exit:


================================================
FILE: docs/assets/branches.drawio
================================================
<mxfile host="Electron" modified="2024-07-30T08:53:34.216Z" agent="5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) draw.io/16.5.1 Chrome/96.0.4664.110 Electron/16.0.7 Safari/537.36" etag="Hyny0YfqRxkr2HCByzIt" version="16.5.1" type="device"><diagram id="RTthD5nFo_tmHNPfYv7S" name="Page-1">3VlZj5swEP41kdpKWQVzJPvYPdqqdxVVbR6d4IBXgFNjNqS/vkMYMARytJtC2pfEHt8z830zNgPzNkxfS7ryPwiXBQMyctOBeTcgxHIM+M0Em1wwGdu5wJPczUWGFkz5T4bCEUoT7rK41lEJESi+qgsXIorYQtVkVEqxrndbiqC+6op6rCGYLmjQlH7jrvJR6tiWbnjDuOfj0sQ0nbwlpEVvPErsU1esKyLzfmDeSiFUXgrTWxZkyisUk497tae13JlkkTplwHRKPw4d/vbNbDE22dcv3rvw8xBneaRBgiceECeA+W6WAqaFXasN6sL5kYiiYRhvLfUSOhjjVaoboeTh/3aWeSEIKY8KIexxvtsRZPmKO+NlIXkWKzqHrZBbWFSygNGYuc9RteUmiRRJ5LLsyAYMWvtcsemKLrLWNXgoyHwVBtjcVGGhDyYVSysiVOlrJkKm5Aa6YKtpoXnRwc0R1tcVdylcwK94ygRlFD3UK6fWNoQCmvE3THrd0AlzwaexKqTyhSciGtxr6Y3W2ghqus97IVaoqwem1AYBShMl6poEBcrN92z8FbGL+qzaeJfi7Hltg7W9JohFIhfswDkJ0gGVHlPHXTxTwkGDgk9RxR/rwD+7dUgTcSGPhGw6PPp4qzXf0znwbM0CNOBeBOUFKJJJEGQ+zIHJXmJDyF03NzYD9G6xlJtgJXiktue0bwb2HUIcTW2MW410yPMa4CnpGRetEWAbqIajK9MgSKQn2wWn+5wdpzIXMWsALevFFGK5jMGBdg1b7uokW8/u0iEXE/fTw718HKbfflzbaeF5HSMx5ep7pTzbgtLGmkZhVilAqNFbhS6OOgBel8Z+ybWtMPu70DZ7RXKXoXO45CnkQQcCqCaOPSH1WRLnARTQGIYcEJ/lUvATsVRtExbAzZUOrr2HVuLUQ6tF+g6tRVbaW2wddxRbzX8ztjYhGdKH/yO2Fq53luBKRrtB0ThLrCXXHYTaQw7bQsYNonwaO68kG5bec+LVpY2229h4mbmqpuOt5xZs3P9Np6Tfy6HjXhKsP2dV63fSmothVasraLns8WmQikS2+jIJgkw7isUK7JwBaq1h1j+O7ItLawqa7ueioi8ns0rLkYtKmfrkFxVy7KZyPOqeCmL7RBBbFwViey+Iz3xZWTKqEoiRL5722Jf5lsxzm1jJZKG4iEoo4xrlBQaIo39YO9c7D4FW77Du57bSCuvRQVjvonMfzMfHYP7nsHb6gnV7Jm1N6t7kjHa8JN8ojjp/Pu10xRfzxPtLXIEvJhdMEXbv3wqMSZ8U0cUT5fkC//hEhiAXFfjHXQHZFwoQp7F8OFff+0Z5Apazh8r+wWwY3aXxUNXfiXOK11/bzftf</diagram></mxfile>

================================================
FILE: docs/assets/dr-instrumentation.drawio
================================================
<mxfile host="Electron" agent="Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) draw.io/27.0.9 Chrome/134.0.6998.205 Electron/35.4.0 Safari/537.36" version="27.0.9">
  <diagram name="Page-1" id="Q5S100K9i7V5bAyz_BIk">
    <mxGraphModel dx="1376" dy="1102" grid="1" gridSize="10" guides="1" tooltips="1" connect="1" arrows="1" fold="1" page="1" pageScale="1" pageWidth="827" pageHeight="1169" math="0" shadow="0">
      <root>
        <mxCell id="0" />
        <mxCell id="1" parent="0" />
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-28" value="Dispatcher.cpp" style="rounded=1;whiteSpace=wrap;html=1;arcSize=5;verticalAlign=top;fontFamily=JetBrains Mono;fontSize=15;fontStyle=1" parent="1" vertex="1">
          <mxGeometry x="560" y="110" width="380" height="290" as="geometry" />
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-5" value="Model.cpp" style="rounded=1;whiteSpace=wrap;html=1;arcSize=5;verticalAlign=top;fontFamily=JetBrains Mono;fontSize=15;fontStyle=1" parent="1" vertex="1">
          <mxGeometry x="40" y="110" width="470" height="290" as="geometry" />
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-7" value="namespace dr_model" style="rounded=1;whiteSpace=wrap;html=1;arcSize=7;verticalAlign=top;fontFamily=JetBrains Mono;fontStyle=1;fillColor=#FFF2CC;" parent="1" vertex="1">
          <mxGeometry x="70" y="180" width="430" height="160" as="geometry" />
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-27" style="edgeStyle=orthogonalEdgeStyle;rounded=1;orthogonalLoop=1;jettySize=auto;html=1;entryX=0;entryY=0.5;entryDx=0;entryDy=0;exitX=0.5;exitY=1;exitDx=0;exitDy=0;endArrow=none;endFill=1;fontFamily=JetBrains Mono;curved=0;dashed=1;dashPattern=1 1;strokeColor=#666666;startArrow=blockThin;startFill=0;" parent="1" source="VMTqDSAsTNkDB5RHAwfX-10" target="VMTqDSAsTNkDB5RHAwfX-19" edge="1">
          <mxGeometry relative="1" as="geometry">
            <Array as="points">
              <mxPoint x="160" y="276" />
            </Array>
          </mxGeometry>
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-72" value="reads" style="edgeLabel;html=1;align=center;verticalAlign=middle;resizable=0;points=[];fontStyle=2;fontFamily=JetBrains Mono;fontSize=8;" parent="VMTqDSAsTNkDB5RHAwfX-27" vertex="1" connectable="0">
          <mxGeometry x="0.1613" relative="1" as="geometry">
            <mxPoint as="offset" />
          </mxGeometry>
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-10" value="&lt;div&gt;instrumented_func.exit_pc&lt;/div&gt;" style="rounded=1;whiteSpace=wrap;html=1;align=center;fontFamily=JetBrains Mono;fontSize=9;fontStyle=2" parent="1" vertex="1">
          <mxGeometry x="80" y="235" width="160" height="20" as="geometry" />
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-23" style="edgeStyle=orthogonalEdgeStyle;rounded=0;orthogonalLoop=1;jettySize=auto;html=1;entryX=0;entryY=0.5;entryDx=0;entryDy=0;endArrow=none;endFill=1;fontFamily=JetBrains Mono;dashed=1;dashPattern=1 1;strokeColor=#666666;startArrow=blockThin;startFill=0;" parent="1" source="VMTqDSAsTNkDB5RHAwfX-11" target="VMTqDSAsTNkDB5RHAwfX-18" edge="1">
          <mxGeometry relative="1" as="geometry" />
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-68" value="reads" style="edgeLabel;html=1;align=center;verticalAlign=middle;resizable=0;points=[];fontStyle=2;fontFamily=JetBrains Mono;fontSize=8;" parent="VMTqDSAsTNkDB5RHAwfX-23" vertex="1" connectable="0">
          <mxGeometry x="-0.4408" relative="1" as="geometry">
            <mxPoint x="11" as="offset" />
          </mxGeometry>
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-11" value="&lt;div&gt;instrumented_func.name&lt;/div&gt;" style="rounded=1;whiteSpace=wrap;html=1;align=center;fontFamily=JetBrains Mono;fontSize=9;fontStyle=2" parent="1" vertex="1">
          <mxGeometry x="80" y="215" width="160" height="20" as="geometry" />
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-12" value="&lt;div&gt;glob_dispatcher&lt;/div&gt;" style="rounded=1;whiteSpace=wrap;html=1;align=center;fontFamily=JetBrains Mono;fontSize=9;fontStyle=2" parent="1" vertex="1">
          <mxGeometry x="80" y="150" width="160" height="20" as="geometry" />
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-14" style="edgeStyle=orthogonalEdgeStyle;rounded=0;orthogonalLoop=1;jettySize=auto;html=1;exitX=0;exitY=0.5;exitDx=0;exitDy=0;entryX=0;entryY=0.5;entryDx=0;entryDy=0;endArrow=blockThin;endFill=1;fontFamily=JetBrains Mono;dashed=1;" parent="1" source="VMTqDSAsTNkDB5RHAwfX-13" target="VMTqDSAsTNkDB5RHAwfX-12" edge="1">
          <mxGeometry relative="1" as="geometry" />
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-16" style="edgeStyle=orthogonalEdgeStyle;rounded=0;orthogonalLoop=1;jettySize=auto;html=1;exitX=0;exitY=0.5;exitDx=0;exitDy=0;entryX=0;entryY=0.5;entryDx=0;entryDy=0;endArrow=blockThin;endFill=1;fontFamily=JetBrains Mono;dashed=1;" parent="1" source="VMTqDSAsTNkDB5RHAwfX-13" target="VMTqDSAsTNkDB5RHAwfX-11" edge="1">
          <mxGeometry relative="1" as="geometry" />
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-17" value="initializes" style="edgeLabel;html=1;align=center;verticalAlign=middle;resizable=0;points=[];fontFamily=JetBrains Mono;fontStyle=2;fontSize=9;" parent="VMTqDSAsTNkDB5RHAwfX-16" vertex="1" connectable="0">
          <mxGeometry x="-0.3834" y="-2" relative="1" as="geometry">
            <mxPoint x="31" y="11" as="offset" />
          </mxGeometry>
        </mxCell>
        <mxCell id="jZhf56UUiF3wu5g5-CzG-26" style="edgeStyle=orthogonalEdgeStyle;rounded=0;orthogonalLoop=1;jettySize=auto;html=1;entryX=0.75;entryY=1;entryDx=0;entryDy=0;exitX=1;exitY=0.5;exitDx=0;exitDy=0;endArrow=blockThin;endFill=1;dashed=1;" edge="1" parent="1" source="VMTqDSAsTNkDB5RHAwfX-13" target="VMTqDSAsTNkDB5RHAwfX-7">
          <mxGeometry relative="1" as="geometry" />
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-13" value="&lt;div&gt;dr_client_main()&lt;/div&gt;" style="rounded=1;whiteSpace=wrap;html=1;align=center;fontFamily=JetBrains Mono;fontStyle=1" parent="1" vertex="1">
          <mxGeometry x="90" y="360" width="160" height="20" as="geometry" />
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-25" style="edgeStyle=orthogonalEdgeStyle;rounded=1;orthogonalLoop=1;jettySize=auto;html=1;exitX=1;exitY=0.5;exitDx=0;exitDy=0;entryX=1;entryY=0.5;entryDx=0;entryDy=0;endArrow=blockThin;endFill=1;fontFamily=JetBrains Mono;curved=0;dashed=1;" parent="1" source="VMTqDSAsTNkDB5RHAwfX-18" target="VMTqDSAsTNkDB5RHAwfX-20" edge="1">
          <mxGeometry relative="1" as="geometry">
            <Array as="points">
              <mxPoint x="490" y="225" />
              <mxPoint x="490" y="245" />
            </Array>
          </mxGeometry>
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-73" value="inserts" style="edgeLabel;html=1;align=center;verticalAlign=middle;resizable=0;points=[];fontStyle=2;fontFamily=JetBrains Mono;fontSize=8;" parent="VMTqDSAsTNkDB5RHAwfX-25" vertex="1" connectable="0">
          <mxGeometry x="-0.1333" y="1" relative="1" as="geometry">
            <mxPoint y="-13" as="offset" />
          </mxGeometry>
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-18" value="&lt;div&gt;event_module_load()&lt;/div&gt;" style="rounded=1;whiteSpace=wrap;html=1;align=left;fontFamily=JetBrains Mono;fontSize=9;fontStyle=1;fillColor=#FFCE9F;" parent="1" vertex="1">
          <mxGeometry x="310" y="215" width="160" height="20" as="geometry" />
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-82" style="edgeStyle=orthogonalEdgeStyle;rounded=0;orthogonalLoop=1;jettySize=auto;html=1;exitX=1;exitY=0.5;exitDx=0;exitDy=0;endArrow=blockThin;endFill=1;" parent="1" edge="1">
          <mxGeometry relative="1" as="geometry">
            <mxPoint x="578.4444444444445" y="261" as="targetPoint" />
            <Array as="points">
              <mxPoint x="470" y="276" />
              <mxPoint x="504" y="276" />
              <mxPoint x="504" y="261" />
            </Array>
            <mxPoint x="470" y="280" as="sourcePoint" />
          </mxGeometry>
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-83" style="edgeStyle=orthogonalEdgeStyle;rounded=0;orthogonalLoop=1;jettySize=auto;html=1;endArrow=blockThin;endFill=1;" parent="1" edge="1">
          <mxGeometry relative="1" as="geometry">
            <mxPoint x="577.8888888888889" y="276.33333333333337" as="targetPoint" />
            <Array as="points">
              <mxPoint x="470" y="276" />
            </Array>
            <mxPoint x="470" y="278" as="sourcePoint" />
          </mxGeometry>
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-19" value="&lt;div&gt;event_bb_instrumentation()&lt;/div&gt;" style="rounded=1;whiteSpace=wrap;html=1;align=left;fontFamily=JetBrains Mono;fontSize=9;fontStyle=1;fillColor=#FFCE9F;" parent="1" vertex="1">
          <mxGeometry x="310" y="266" width="160" height="20" as="geometry" />
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-26" style="edgeStyle=orthogonalEdgeStyle;rounded=0;orthogonalLoop=1;jettySize=auto;html=1;entryX=1;entryY=0.5;entryDx=0;entryDy=0;endArrow=blockThin;endFill=1;fontFamily=JetBrains Mono;dashed=1;dashPattern=1 1;strokeColor=#666666;" parent="1" source="VMTqDSAsTNkDB5RHAwfX-20" target="VMTqDSAsTNkDB5RHAwfX-10" edge="1">
          <mxGeometry relative="1" as="geometry" />
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-71" value="writes" style="edgeLabel;html=1;align=center;verticalAlign=middle;resizable=0;points=[];fontStyle=2;fontFamily=JetBrains Mono;fontSize=8;" parent="VMTqDSAsTNkDB5RHAwfX-26" vertex="1" connectable="0">
          <mxGeometry x="0.0599" y="-3" relative="1" as="geometry">
            <mxPoint as="offset" />
          </mxGeometry>
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-20" value="&lt;div&gt;event_instrumentation_start()&lt;/div&gt;" style="rounded=1;whiteSpace=wrap;html=1;align=left;fontFamily=JetBrains Mono;fontSize=9;fontStyle=1;fillColor=#FFD966;" parent="1" vertex="1">
          <mxGeometry x="310" y="235" width="160" height="20" as="geometry" />
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-21" value="&lt;div&gt;event_signal()&lt;/div&gt;" style="rounded=1;whiteSpace=wrap;html=1;align=left;fontFamily=JetBrains Mono;fontSize=9;fontStyle=1;fillColor=#FFCE9F;" parent="1" vertex="1">
          <mxGeometry x="310" y="286" width="160" height="20" as="geometry" />
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-22" value="&lt;div&gt;event_exit()&lt;/div&gt;" style="rounded=1;whiteSpace=wrap;html=1;align=left;fontFamily=JetBrains Mono;fontSize=9;fontStyle=1;fillColor=#FFCE9F;" parent="1" vertex="1">
          <mxGeometry x="310" y="306" width="160" height="20" as="geometry" />
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-38" value="Dispatcher" style="swimlane;fontStyle=1;align=center;verticalAlign=top;childLayout=stackLayout;horizontal=1;startSize=26;horizontalStack=0;resizeParent=1;resizeParentMax=0;resizeLast=0;collapsible=1;marginBottom=0;whiteSpace=wrap;html=1;fontFamily=JetBrains Mono;" parent="1" vertex="1">
          <mxGeometry x="572" y="151" width="160" height="190" as="geometry" />
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-39" value="+ logger&lt;div&gt;+ tracer&lt;/div&gt;&lt;div&gt;+ speculator&lt;/div&gt;" style="text;strokeColor=none;fillColor=none;align=left;verticalAlign=top;spacingLeft=4;spacingRight=4;overflow=hidden;rotatable=0;points=[[0,0.5],[1,0.5]];portConstraint=eastwest;whiteSpace=wrap;html=1;fontFamily=JetBrains Mono;fontSize=9;" parent="VMTqDSAsTNkDB5RHAwfX-38" vertex="1">
          <mxGeometry y="26" width="160" height="44" as="geometry" />
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-40" value="" style="line;strokeWidth=1;fillColor=none;align=left;verticalAlign=middle;spacingTop=-1;spacingLeft=3;spacingRight=3;rotatable=0;labelPosition=right;points=[];portConstraint=eastwest;strokeColor=inherit;fontFamily=JetBrains Mono;" parent="VMTqDSAsTNkDB5RHAwfX-38" vertex="1">
          <mxGeometry y="70" width="160" height="8" as="geometry" />
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-61" value="" style="endArrow=blockThin;html=1;rounded=0;endFill=1;fontFamily=JetBrains Mono;entryX=0;entryY=0.5;entryDx=0;entryDy=0;dashed=1;" parent="VMTqDSAsTNkDB5RHAwfX-38" target="VMTqDSAsTNkDB5RHAwfX-45" edge="1">
          <mxGeometry width="50" height="50" relative="1" as="geometry">
            <mxPoint x="110" y="125" as="sourcePoint" />
            <mxPoint x="207" y="117" as="targetPoint" />
          </mxGeometry>
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-41" value="&lt;div&gt;+ start()&lt;/div&gt;&lt;div&gt;&lt;br&gt;&lt;/div&gt;+ instrument_instruction()&lt;div&gt;+ instrument_exit()&lt;/div&gt;&lt;div&gt;&lt;br&gt;&lt;/div&gt;&lt;div&gt;+ handle_exception()&lt;/div&gt;&lt;div&gt;&lt;br&gt;&lt;/div&gt;&lt;div&gt;+ finalize()&lt;/div&gt;" style="text;strokeColor=none;fillColor=none;align=left;verticalAlign=top;spacingLeft=4;spacingRight=4;overflow=hidden;rotatable=0;points=[[0,0.5],[1,0.5]];portConstraint=eastwest;whiteSpace=wrap;html=1;fontFamily=JetBrains Mono;fontSize=9;" parent="VMTqDSAsTNkDB5RHAwfX-38" vertex="1">
          <mxGeometry y="78" width="160" height="112" as="geometry" />
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-63" style="edgeStyle=orthogonalEdgeStyle;rounded=1;orthogonalLoop=1;jettySize=auto;html=1;endArrow=blockThin;endFill=1;entryX=1.003;entryY=0.896;entryDx=0;entryDy=0;entryPerimeter=0;fontFamily=JetBrains Mono;curved=0;" parent="1" source="VMTqDSAsTNkDB5RHAwfX-44" target="VMTqDSAsTNkDB5RHAwfX-39" edge="1">
          <mxGeometry relative="1" as="geometry">
            <mxPoint x="653.5999999999999" y="198.60000000000002" as="targetPoint" />
            <Array as="points">
              <mxPoint x="860" y="217" />
              <mxPoint x="732" y="217" />
            </Array>
          </mxGeometry>
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-44" value="&lt;div&gt;dispatch_callback()&lt;/div&gt;" style="rounded=1;whiteSpace=wrap;html=1;align=center;fontFamily=JetBrains Mono;fontSize=9;fontStyle=1;fillColor=#F19C99;" parent="1" vertex="1">
          <mxGeometry x="780" y="250.5" width="120" height="20" as="geometry" />
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-62" style="edgeStyle=orthogonalEdgeStyle;rounded=1;orthogonalLoop=1;jettySize=auto;html=1;endArrow=blockThin;endFill=1;fontFamily=JetBrains Mono;curved=0;" parent="1" source="VMTqDSAsTNkDB5RHAwfX-45" edge="1">
          <mxGeometry relative="1" as="geometry">
            <mxPoint x="646" y="319" as="targetPoint" />
            <Array as="points">
              <mxPoint x="840" y="319" />
            </Array>
          </mxGeometry>
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-64" style="edgeStyle=orthogonalEdgeStyle;rounded=1;orthogonalLoop=1;jettySize=auto;html=1;entryX=1;entryY=0.5;entryDx=0;entryDy=0;fontFamily=JetBrains Mono;curved=0;endArrow=blockThin;endFill=1;" parent="1" source="VMTqDSAsTNkDB5RHAwfX-45" target="VMTqDSAsTNkDB5RHAwfX-39" edge="1">
          <mxGeometry relative="1" as="geometry">
            <mxPoint x="659.2" y="210.20000000000005" as="targetPoint" />
            <Array as="points">
              <mxPoint x="840" y="318" />
              <mxPoint x="920" y="318" />
              <mxPoint x="920" y="199" />
            </Array>
          </mxGeometry>
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-45" value="&lt;div&gt;exit_callback()&lt;/div&gt;" style="rounded=1;whiteSpace=wrap;html=1;align=center;fontFamily=JetBrains Mono;fontSize=9;fontStyle=1;fillColor=#F19C99;" parent="1" vertex="1">
          <mxGeometry x="780" y="270.5" width="120" height="20" as="geometry" />
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-59" value="" style="endArrow=blockThin;html=1;rounded=0;entryX=0;entryY=0.5;entryDx=0;entryDy=0;endFill=1;fontFamily=JetBrains Mono;dashed=1;" parent="1" target="VMTqDSAsTNkDB5RHAwfX-44" edge="1">
          <mxGeometry width="50" height="50" relative="1" as="geometry">
            <mxPoint x="721" y="264" as="sourcePoint" />
            <mxPoint x="782" y="240" as="targetPoint" />
          </mxGeometry>
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-75" value="exit_pc?" style="edgeLabel;html=1;align=center;verticalAlign=middle;resizable=0;points=[];fontStyle=2;fontFamily=JetBrains Mono;fontSize=8;" parent="1" vertex="1" connectable="0">
          <mxGeometry x="544" y="266" as="geometry">
            <mxPoint x="-7" y="10" as="offset" />
          </mxGeometry>
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-76" value="calls" style="edgeLabel;html=1;align=center;verticalAlign=middle;resizable=0;points=[];fontStyle=2;fontFamily=JetBrains Mono;fontSize=8;" parent="1" vertex="1" connectable="0">
          <mxGeometry x="543" y="250" as="geometry">
            <mxPoint x="-3" y="73" as="offset" />
          </mxGeometry>
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-77" value="&lt;font color=&quot;#ffffff&quot;&gt;3&lt;/font&gt;" style="ellipse;whiteSpace=wrap;html=1;aspect=fixed;fillColor=#000000;fontFamily=JetBrains Mono;strokeWidth=6;" parent="1" vertex="1">
          <mxGeometry x="470" y="200" width="10" height="10" as="geometry" />
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-80" value="&lt;font style=&quot;color: rgb(255, 255, 255);&quot;&gt;4&lt;/font&gt;" style="ellipse;whiteSpace=wrap;html=1;aspect=fixed;fillColor=#000000;fontFamily=JetBrains Mono;strokeWidth=6;" parent="1" vertex="1">
          <mxGeometry x="295" y="238" width="10" height="10" as="geometry" />
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-85" value="" style="endArrow=blockThin;html=1;rounded=0;endFill=1;fontFamily=JetBrains Mono;" parent="1" edge="1">
          <mxGeometry width="50" height="50" relative="1" as="geometry">
            <mxPoint x="470" y="297" as="sourcePoint" />
            <mxPoint x="575" y="296" as="targetPoint" />
          </mxGeometry>
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-88" value="&lt;font style=&quot;color: rgb(255, 255, 255);&quot;&gt;5&lt;/font&gt;" style="ellipse;whiteSpace=wrap;html=1;aspect=fixed;fillColor=#000000;fontFamily=JetBrains Mono;strokeWidth=6;" parent="1" vertex="1">
          <mxGeometry x="479" y="270" width="10" height="10" as="geometry" />
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-89" value="" style="endArrow=blockThin;html=1;rounded=0;endFill=1;fontFamily=JetBrains Mono;" parent="1" edge="1">
          <mxGeometry width="50" height="50" relative="1" as="geometry">
            <mxPoint x="470" y="317" as="sourcePoint" />
            <mxPoint x="576" y="317" as="targetPoint" />
          </mxGeometry>
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-90" value="calls" style="edgeLabel;html=1;align=center;verticalAlign=middle;resizable=0;points=[];fontStyle=2;fontFamily=JetBrains Mono;fontSize=8;" parent="1" vertex="1" connectable="0">
          <mxGeometry x="541" y="296" as="geometry">
            <mxPoint y="5" as="offset" />
          </mxGeometry>
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-91" value="inserts" style="edgeLabel;html=1;align=center;verticalAlign=middle;resizable=0;points=[];fontStyle=2;fontFamily=JetBrains Mono;fontSize=8;" parent="1" vertex="1" connectable="0">
          <mxGeometry x="750" y="237" as="geometry">
            <mxPoint x="1" y="52" as="offset" />
          </mxGeometry>
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-92" value="inserts" style="edgeLabel;html=1;align=center;verticalAlign=middle;resizable=0;points=[];fontStyle=2;fontFamily=JetBrains Mono;fontSize=8;" parent="1" vertex="1" connectable="0">
          <mxGeometry x="752" y="255" as="geometry" />
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-93" value="uses" style="edgeLabel;html=1;align=center;verticalAlign=middle;resizable=0;points=[];fontStyle=2;fontFamily=JetBrains Mono;fontSize=8;" parent="1" vertex="1" connectable="0">
          <mxGeometry x="262" y="227" as="geometry">
            <mxPoint x="555" y="-2" as="offset" />
          </mxGeometry>
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-96" value="n: finalize()" style="edgeLabel;html=1;align=center;verticalAlign=middle;resizable=0;points=[];fontStyle=2;fontFamily=JetBrains Mono;fontSize=8;" parent="1" vertex="1" connectable="0">
          <mxGeometry x="780" y="305" as="geometry">
            <mxPoint x="-8" y="11" as="offset" />
          </mxGeometry>
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-97" value="y: rollback()" style="edgeLabel;html=1;align=center;verticalAlign=middle;resizable=0;points=[];fontStyle=2;fontFamily=JetBrains Mono;fontSize=8;" parent="1" vertex="1" connectable="0">
          <mxGeometry x="900" y="306" as="geometry">
            <mxPoint x="-18" y="13" as="offset" />
          </mxGeometry>
        </mxCell>
        <mxCell id="VMTqDSAsTNkDB5RHAwfX-98" value="is speculative?" style="edgeLabel;html=1;align=center;verticalAlign=middle;resizable=0;points=[];fontStyle=2;fontFamily=JetBrains Mono;fontSize=8;" parent="1" vertex="1" connectable="0">
          <mxGeometry x="907" y="306" as="geometry">
            <mxPoint x="-48" y="-6" as="offset" />
          </mxGeometry>
        </mxCell>
        <mxCell id="jZhf56UUiF3wu5g5-CzG-1" style="edgeStyle=orthogonalEdgeStyle;rounded=0;orthogonalLoop=1;jettySize=auto;html=1;endArrow=blockThin;endFill=1;dashed=1;" edge="1" parent="1" source="VMTqDSAsTNkDB5RHAwfX-12">
          <mxGeometry relative="1" as="geometry">
            <mxPoint x="574" y="159" as="targetPoint" />
          </mxGeometry>
        </mxCell>
        <mxCell id="jZhf56UUiF3wu5g5-CzG-2" value="&lt;i&gt;points to&lt;/i&gt;" style="edgeLabel;html=1;align=center;verticalAlign=middle;resizable=0;points=[];fontFamily=JetBrains Mono;fontSize=9;" vertex="1" connectable="0" parent="jZhf56UUiF3wu5g5-CzG-1">
          <mxGeometry x="-0.5431" y="4" relative="1" as="geometry">
            <mxPoint x="23" y="-5" as="offset" />
          </mxGeometry>
        </mxCell>
        <mxCell id="jZhf56UUiF3wu5g5-CzG-3" value="&lt;font style=&quot;color: rgb(255, 255, 255);&quot;&gt;2&lt;/font&gt;" style="ellipse;whiteSpace=wrap;html=1;aspect=fixed;fillColor=#000000;fontFamily=JetBrains Mono;strokeWidth=6;" vertex="1" parent="1">
          <mxGeometry x="45" y="345" width="10" height="10" as="geometry" />
        </mxCell>
        <mxCell id="jZhf56UUiF3wu5g5-CzG-15" value="" style="endArrow=blockThin;html=1;rounded=0;endFill=1;" edge="1" parent="1">
          <mxGeometry width="50" height="50" relative="1" as="geometry">
            <mxPoint x="470" y="251" as="sourcePoint" />
            <mxPoint x="578" y="243" as="targetPoint" />
          </mxGeometry>
        </mxCell>
        <mxCell id="jZhf56UUiF3wu5g5-CzG-16" value="calls" style="edgeLabel;html=1;align=center;verticalAlign=middle;resizable=0;points=[];fontStyle=2;fontFamily=JetBrains Mono;fontSize=8;" vertex="1" connectable="0" parent="1">
          <mxGeometry x="541" y="232.5" as="geometry">
            <mxPoint y="5" as="offset" />
          </mxGeometry>
        </mxCell>
        <mxCell id="jZhf56UUiF3wu5g5-CzG-17" value="started?" style="edgeLabel;html=1;align=center;verticalAlign=middle;resizable=0;points=[];fontStyle=2;fontFamily=JetBrains Mono;fontSize=8;" vertex="1" connectable="0" parent="1">
          <mxGeometry x="544" y="250" as="geometry">
            <mxPoint x="-7" y="10" as="offset" />
          </mxGeometry>
        </mxCell>
        <mxCell id="jZhf56UUiF3wu5g5-CzG-18" value="" style="rounded=1;whiteSpace=wrap;html=1;align=left;fontFamily=JetBrains Mono;fontSize=9;fontStyle=1;fillColor=#FFCE9F;" vertex="1" parent="1">
          <mxGeometry x="70" y="430" width="20" height="20" as="geometry" />
        </mxCell>
        <mxCell id="jZhf56UUiF3wu5g5-CzG-19" value="" style="rounded=1;whiteSpace=wrap;html=1;align=left;fontFamily=JetBrains Mono;fontSize=9;fontStyle=1;fillColor=#FFD966;" vertex="1" parent="1">
          <mxGeometry x="210" y="430" width="20" height="20" as="geometry" />
        </mxCell>
        <mxCell id="jZhf56UUiF3wu5g5-CzG-20" value="" style="rounded=1;whiteSpace=wrap;html=1;align=left;fontFamily=JetBrains Mono;fontSize=9;fontStyle=1;fillColor=#F19C99;" vertex="1" parent="1">
          <mxGeometry x="360" y="430" width="20" height="20" as="geometry" />
        </mxCell>
        <mxCell id="jZhf56UUiF3wu5g5-CzG-21" value="" style="rounded=1;whiteSpace=wrap;html=1;align=left;fontFamily=JetBrains Mono;fontSize=9;fontStyle=1;fillColor=none;" vertex="1" parent="1">
          <mxGeometry x="500" y="430" width="20" height="20" as="geometry" />
        </mxCell>
        <mxCell id="jZhf56UUiF3wu5g5-CzG-22" value="initial callbacks" style="edgeLabel;html=1;align=left;verticalAlign=middle;resizable=0;points=[];fontFamily=JetBrains Mono;fontStyle=2;fontSize=9;" vertex="1" connectable="0" parent="1">
          <mxGeometry x="100" y="440" as="geometry" />
        </mxCell>
        <mxCell id="jZhf56UUiF3wu5g5-CzG-23" value="dynamically-added&lt;div&gt;callbacks&lt;/div&gt;" style="edgeLabel;html=1;align=left;verticalAlign=middle;resizable=0;points=[];fontFamily=JetBrains Mono;fontStyle=2;fontSize=9;" vertex="1" connectable="0" parent="1">
          <mxGeometry x="240" y="440" as="geometry" />
        </mxCell>
        <mxCell id="jZhf56UUiF3wu5g5-CzG-24" value="execution-time&lt;div&gt;clean calls&lt;/div&gt;" style="edgeLabel;html=1;align=left;verticalAlign=middle;resizable=0;points=[];fontFamily=JetBrains Mono;fontStyle=2;fontSize=9;" vertex="1" connectable="0" parent="1">
          <mxGeometry x="391" y="440" as="geometry" />
        </mxCell>
        <mxCell id="jZhf56UUiF3wu5g5-CzG-25" value="other components" style="edgeLabel;html=1;align=left;verticalAlign=middle;resizable=0;points=[];fontFamily=JetBrains Mono;fontStyle=2;fontSize=9;" vertex="1" connectable="0" parent="1">
          <mxGeometry x="531" y="440" as="geometry" />
        </mxCell>
        <mxCell id="jZhf56UUiF3wu5g5-CzG-27" value="installs callbacks" style="edgeLabel;html=1;align=center;verticalAlign=middle;resizable=0;points=[];fontFamily=JetBrains Mono;fontStyle=2;fontSize=9;" vertex="1" connectable="0" parent="1">
          <mxGeometry x="337" y="361" as="geometry" />
        </mxCell>
        <mxCell id="jZhf56UUiF3wu5g5-CzG-28" value="&lt;font style=&quot;color: rgb(255, 255, 255);&quot;&gt;1&lt;/font&gt;" style="ellipse;whiteSpace=wrap;html=1;aspect=fixed;fillColor=#000000;fontFamily=JetBrains Mono;strokeWidth=6;" vertex="1" parent="1">
          <mxGeometry x="270" y="356" width="10" height="10" as="geometry" />
        </mxCell>
        <mxCell id="jZhf56UUiF3wu5g5-CzG-29" value="&lt;font style=&quot;color: rgb(255, 255, 255);&quot;&gt;6&lt;/font&gt;" style="ellipse;whiteSpace=wrap;html=1;aspect=fixed;fillColor=#000000;fontFamily=JetBrains Mono;strokeWidth=6;" vertex="1" parent="1">
          <mxGeometry x="840" y="232.5" width="10" height="10" as="geometry" />
        </mxCell>
        <mxCell id="jZhf56UUiF3wu5g5-CzG-30" value="&lt;font style=&quot;color: rgb(255, 255, 255);&quot;&gt;7&lt;/font&gt;" style="ellipse;whiteSpace=wrap;html=1;aspect=fixed;fillColor=#000000;fontFamily=JetBrains Mono;strokeWidth=6;" vertex="1" parent="1">
          <mxGeometry x="804" y="295" width="10" height="10" as="geometry" />
        </mxCell>
      </root>
    </mxGraphModel>
  </diagram>
</mxfile>


================================================
FILE: docs/assets/dr-model.drawio
================================================
<mxfile host="Electron" agent="Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) draw.io/27.0.9 Chrome/134.0.6998.205 Electron/35.4.0 Safari/537.36" version="27.0.9">
  <diagram id="C5RBs43oDa-KdzZeNtuy" name="Page-1">
    <mxGraphModel dx="1678" dy="2377" grid="1" gridSize="10" guides="1" tooltips="1" connect="1" arrows="1" fold="1" page="1" pageScale="1" pageWidth="827" pageHeight="1169" math="0" shadow="0">
      <root>
        <mxCell id="WIyWlLk6GJQsqaUBKTNV-0" />
        <mxCell id="WIyWlLk6GJQsqaUBKTNV-1" parent="WIyWlLk6GJQsqaUBKTNV-0" />
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-14" value="&lt;font style=&quot;font-size: 18px&quot;&gt;DynamoRIO Tool&lt;/font&gt;" style="rounded=1;whiteSpace=wrap;html=1;fontSize=11;verticalAlign=top;arcSize=6;" parent="WIyWlLk6GJQsqaUBKTNV-1" vertex="1">
          <mxGeometry x="260" y="320" width="930" height="580" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-70" value="" style="rounded=1;whiteSpace=wrap;html=1;fontSize=15;arcSize=8;" parent="WIyWlLk6GJQsqaUBKTNV-1" vertex="1">
          <mxGeometry x="840" y="360" width="330" height="520" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-12" value="&lt;font style=&quot;font-size: 18px&quot;&gt;Python Adapter&lt;/font&gt;" style="rounded=1;whiteSpace=wrap;html=1;fontSize=11;verticalAlign=top;arcSize=11;" parent="WIyWlLk6GJQsqaUBKTNV-1" vertex="1">
          <mxGeometry x="201" y="-100" width="550" height="370" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-1" value="DynamoRIOModel" style="swimlane;fontStyle=1;align=center;verticalAlign=top;childLayout=stackLayout;horizontal=1;startSize=26;horizontalStack=0;resizeParent=1;resizeParentMax=0;resizeLast=0;collapsible=1;marginBottom=0;" parent="WIyWlLk6GJQsqaUBKTNV-1" vertex="1">
          <mxGeometry x="391" y="60" width="300" height="90" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-3" value="" style="line;strokeWidth=1;fillColor=none;align=left;verticalAlign=middle;spacingTop=-1;spacingLeft=3;spacingRight=3;rotatable=0;labelPosition=right;points=[];portConstraint=eastwest;" parent="QmN-cfn-Gxa06QFyi7zT-1" vertex="1">
          <mxGeometry y="26" width="300" height="8" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-4" value="+ configure_clauses(...)&#xa;+ load_test_case(TestCaseProgram)&#xa;+ trace_test_case(List[InputData],...) -&gt; List[CTrace]&#xa;" style="text;strokeColor=none;fillColor=none;align=left;verticalAlign=top;spacingLeft=4;spacingRight=4;overflow=hidden;rotatable=0;points=[[0,0.5],[1,0.5]];portConstraint=eastwest;" parent="QmN-cfn-Gxa06QFyi7zT-1" vertex="1">
          <mxGeometry y="34" width="300" height="56" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-10" value="&lt;b&gt;&lt;font style=&quot;font-size: 18px&quot;&gt;Fuzzer&lt;/font&gt;&lt;/b&gt;" style="text;html=1;strokeColor=none;fillColor=none;align=center;verticalAlign=middle;whiteSpace=wrap;rounded=0;" parent="WIyWlLk6GJQsqaUBKTNV-1" vertex="1">
          <mxGeometry x="241" y="-80" width="60" height="30" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-11" value="&lt;font style=&quot;font-size: 11px&quot;&gt;TestCaseProgram&lt;br&gt;List[InputData]&lt;/font&gt;" style="html=1;verticalAlign=bottom;endArrow=block;rounded=0;fontSize=25;exitX=0.5;exitY=1;exitDx=0;exitDy=0;entryX=0;entryY=0.5;entryDx=0;entryDy=0;" parent="WIyWlLk6GJQsqaUBKTNV-1" source="QmN-cfn-Gxa06QFyi7zT-10" target="QmN-cfn-Gxa06QFyi7zT-4" edge="1">
          <mxGeometry x="0.0186" y="13" width="80" relative="1" as="geometry">
            <mxPoint x="381" y="-50" as="sourcePoint" />
            <mxPoint x="461" y="-50" as="targetPoint" />
            <mxPoint as="offset" />
          </mxGeometry>
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-13" value="&lt;font style=&quot;font-size: 18px&quot;&gt;Test Case Loader&lt;/font&gt;" style="rounded=1;whiteSpace=wrap;html=1;fontSize=11;verticalAlign=top;" parent="WIyWlLk6GJQsqaUBKTNV-1" vertex="1">
          <mxGeometry x="843" y="-100" width="300" height="350" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-46" style="edgeStyle=orthogonalEdgeStyle;rounded=0;orthogonalLoop=1;jettySize=auto;html=1;entryX=0.5;entryY=1;entryDx=0;entryDy=0;fontSize=12;dashed=1;exitX=0.588;exitY=0.001;exitDx=0;exitDy=0;exitPerimeter=0;" parent="WIyWlLk6GJQsqaUBKTNV-1" target="QmN-cfn-Gxa06QFyi7zT-13" edge="1">
          <mxGeometry relative="1" as="geometry">
            <mxPoint x="869.8400000000001" y="320.62000000000035" as="sourcePoint" />
            <Array as="points">
              <mxPoint x="870" y="290" />
              <mxPoint x="993" y="290" />
            </Array>
          </mxGeometry>
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-47" value="Instrument Binary" style="edgeLabel;html=1;align=center;verticalAlign=middle;resizable=0;points=[];fontSize=12;" parent="QmN-cfn-Gxa06QFyi7zT-46" vertex="1" connectable="0">
          <mxGeometry x="0.2028" y="-2" relative="1" as="geometry">
            <mxPoint x="-22" y="-7" as="offset" />
          </mxGeometry>
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-19" value="parser.c" style="swimlane;fontStyle=1;align=center;verticalAlign=top;childLayout=stackLayout;horizontal=1;startSize=26;horizontalStack=0;resizeParent=1;resizeParentMax=0;resizeLast=0;collapsible=1;marginBottom=0;fontSize=18;" parent="WIyWlLk6GJQsqaUBKTNV-1" vertex="1">
          <mxGeometry x="873" y="-20" width="230" height="70" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-21" value="" style="line;strokeWidth=1;fillColor=none;align=left;verticalAlign=middle;spacingTop=-1;spacingLeft=3;spacingRight=3;rotatable=0;labelPosition=right;points=[];portConstraint=eastwest;fontSize=18;" parent="QmN-cfn-Gxa06QFyi7zT-19" vertex="1">
          <mxGeometry y="26" width="230" height="8" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-22" value="+ parse_rcbf(file): rcbf_t*&#xa;+ parse_rdbf(file): rdbf_t*" style="text;strokeColor=none;fillColor=none;align=left;verticalAlign=top;spacingLeft=4;spacingRight=4;overflow=hidden;rotatable=0;points=[[0,0.5],[1,0.5]];portConstraint=eastwest;fontSize=12;" parent="QmN-cfn-Gxa06QFyi7zT-19" vertex="1">
          <mxGeometry y="34" width="230" height="36" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-26" value="sandbox.c" style="swimlane;fontStyle=1;align=center;verticalAlign=top;childLayout=stackLayout;horizontal=1;startSize=26;horizontalStack=0;resizeParent=1;resizeParentMax=0;resizeLast=0;collapsible=1;marginBottom=0;fontSize=18;" parent="WIyWlLk6GJQsqaUBKTNV-1" vertex="1">
          <mxGeometry x="873" y="70" width="230" height="70" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-27" value="" style="line;strokeWidth=1;fillColor=none;align=left;verticalAlign=middle;spacingTop=-1;spacingLeft=3;spacingRight=3;rotatable=0;labelPosition=right;points=[];portConstraint=eastwest;fontSize=18;" parent="QmN-cfn-Gxa06QFyi7zT-26" vertex="1">
          <mxGeometry y="26" width="230" height="8" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-28" value="+ load_code_in_sandbox(rcbf_t*)&#xa;+ load_data_in_sandbox(rdbf_t*)" style="text;strokeColor=none;fillColor=none;align=left;verticalAlign=top;spacingLeft=4;spacingRight=4;overflow=hidden;rotatable=0;points=[[0,0.5],[1,0.5]];portConstraint=eastwest;fontSize=12;" parent="QmN-cfn-Gxa06QFyi7zT-26" vertex="1">
          <mxGeometry y="34" width="230" height="36" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-30" style="edgeStyle=orthogonalEdgeStyle;rounded=0;orthogonalLoop=1;jettySize=auto;html=1;exitX=0;exitY=0.5;exitDx=0;exitDy=0;fontSize=12;" parent="WIyWlLk6GJQsqaUBKTNV-1" source="QmN-cfn-Gxa06QFyi7zT-22" edge="1">
          <mxGeometry relative="1" as="geometry">
            <mxPoint x="873" y="110" as="targetPoint" />
            <Array as="points">
              <mxPoint x="853" y="32" />
              <mxPoint x="853" y="110" />
              <mxPoint x="873" y="110" />
            </Array>
          </mxGeometry>
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-31" value="test_case_entry.c" style="swimlane;fontStyle=1;align=center;verticalAlign=top;childLayout=stackLayout;horizontal=1;startSize=26;horizontalStack=0;resizeParent=1;resizeParentMax=0;resizeLast=0;collapsible=1;marginBottom=0;fontSize=18;" parent="WIyWlLk6GJQsqaUBKTNV-1" vertex="1">
          <mxGeometry x="873" y="160" width="230" height="60" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-32" value="" style="line;strokeWidth=1;fillColor=none;align=left;verticalAlign=middle;spacingTop=-1;spacingLeft=3;spacingRight=3;rotatable=0;labelPosition=right;points=[];portConstraint=eastwest;fontSize=18;" parent="QmN-cfn-Gxa06QFyi7zT-31" vertex="1">
          <mxGeometry y="26" width="230" height="8" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-33" value="+ test_case_entry(sandbox_t*)" style="text;strokeColor=none;fillColor=none;align=left;verticalAlign=top;spacingLeft=4;spacingRight=4;overflow=hidden;rotatable=0;points=[[0,0.5],[1,0.5]];portConstraint=eastwest;fontSize=12;" parent="QmN-cfn-Gxa06QFyi7zT-31" vertex="1">
          <mxGeometry y="34" width="230" height="26" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-38" value="&lt;b&gt;&lt;font style=&quot;font-size: 18px&quot;&gt;Postprocessor&lt;/font&gt;&lt;/b&gt;" style="text;html=1;strokeColor=none;fillColor=none;align=center;verticalAlign=middle;whiteSpace=wrap;rounded=0;" parent="WIyWlLk6GJQsqaUBKTNV-1" vertex="1">
          <mxGeometry x="241" y="200" width="60" height="30" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-39" value="&lt;font style=&quot;font-size: 11px&quot;&gt;TestCaseProgram&lt;br&gt;List[InputData]&lt;/font&gt;" style="html=1;verticalAlign=bottom;endArrow=block;rounded=0;fontSize=25;exitX=0.5;exitY=0;exitDx=0;exitDy=0;entryX=0;entryY=0.5;entryDx=0;entryDy=0;" parent="WIyWlLk6GJQsqaUBKTNV-1" source="QmN-cfn-Gxa06QFyi7zT-38" target="QmN-cfn-Gxa06QFyi7zT-4" edge="1">
          <mxGeometry x="-0.2384" y="-12" width="80" relative="1" as="geometry">
            <mxPoint x="281" y="-40" as="sourcePoint" />
            <mxPoint x="351" y="121.02400000000034" as="targetPoint" />
            <mxPoint y="-1" as="offset" />
          </mxGeometry>
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-40" style="edgeStyle=orthogonalEdgeStyle;rounded=0;orthogonalLoop=1;jettySize=auto;html=1;entryX=0;entryY=0.25;entryDx=0;entryDy=0;fontSize=12;" parent="WIyWlLk6GJQsqaUBKTNV-1" source="QmN-cfn-Gxa06QFyi7zT-4" target="QmN-cfn-Gxa06QFyi7zT-13" edge="1">
          <mxGeometry relative="1" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-42" value="RCBF File&lt;br&gt;RDBF File" style="text;html=1;strokeColor=none;fillColor=none;align=center;verticalAlign=middle;whiteSpace=wrap;rounded=0;fontSize=12;" parent="WIyWlLk6GJQsqaUBKTNV-1" vertex="1">
          <mxGeometry x="690" y="90" width="60" height="30" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-48" value="model.cpp" style="swimlane;fontStyle=1;align=center;verticalAlign=top;childLayout=stackLayout;horizontal=1;startSize=26;horizontalStack=0;resizeParent=1;resizeParentMax=0;resizeLast=0;collapsible=1;marginBottom=0;fontSize=18;" parent="WIyWlLk6GJQsqaUBKTNV-1" vertex="1">
          <mxGeometry x="934" y="405" width="200" height="110" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-49" value="" style="line;strokeWidth=1;fillColor=none;align=left;verticalAlign=middle;spacingTop=-1;spacingLeft=3;spacingRight=3;rotatable=0;labelPosition=right;points=[];portConstraint=eastwest;fontSize=18;" parent="QmN-cfn-Gxa06QFyi7zT-48" vertex="1">
          <mxGeometry y="26" width="200" height="8" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-50" value="+ event_bb_instrumentation(...)&#xa;+ event_instrumentation_start(...)&#xa;+ event_instrumentation_end(...)&#xa;+ event_signal()" style="text;strokeColor=none;fillColor=none;align=left;verticalAlign=top;spacingLeft=4;spacingRight=4;overflow=hidden;rotatable=0;points=[[0,0.5],[1,0.5]];portConstraint=eastwest;fontSize=12;" parent="QmN-cfn-Gxa06QFyi7zT-48" vertex="1">
          <mxGeometry y="34" width="200" height="76" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-52" value="Dispatcher" style="swimlane;fontStyle=1;align=center;verticalAlign=top;childLayout=stackLayout;horizontal=1;startSize=26;horizontalStack=0;resizeParent=1;resizeParentMax=0;resizeLast=0;collapsible=1;marginBottom=0;fontSize=18;" parent="WIyWlLk6GJQsqaUBKTNV-1" vertex="1">
          <mxGeometry x="934" y="565" width="200" height="110" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-53" value="" style="line;strokeWidth=1;fillColor=none;align=left;verticalAlign=middle;spacingTop=-1;spacingLeft=3;spacingRight=3;rotatable=0;labelPosition=right;points=[];portConstraint=eastwest;fontSize=18;" parent="QmN-cfn-Gxa06QFyi7zT-52" vertex="1">
          <mxGeometry y="26" width="200" height="8" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-54" value="+ instrument_instruction(...)&#xa;+ start(...)&#xa;+ finalize(...)&#xa;+ handle_exception(...)" style="text;strokeColor=none;fillColor=none;align=left;verticalAlign=top;spacingLeft=4;spacingRight=4;overflow=hidden;rotatable=0;points=[[0,0.5],[1,0.5]];portConstraint=eastwest;fontSize=12;" parent="QmN-cfn-Gxa06QFyi7zT-52" vertex="1">
          <mxGeometry y="34" width="200" height="76" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-57" value="Instrumentation Components" style="text;html=1;strokeColor=none;fillColor=none;align=center;verticalAlign=middle;whiteSpace=wrap;rounded=0;fontSize=15;" parent="WIyWlLk6GJQsqaUBKTNV-1" vertex="1">
          <mxGeometry x="907" y="360" width="210" height="30" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-61" style="edgeStyle=orthogonalEdgeStyle;rounded=0;orthogonalLoop=1;jettySize=auto;html=1;exitX=0;exitY=0.5;exitDx=0;exitDy=0;entryX=0;entryY=0.5;entryDx=0;entryDy=0;fontSize=15;" parent="WIyWlLk6GJQsqaUBKTNV-1" source="QmN-cfn-Gxa06QFyi7zT-28" target="QmN-cfn-Gxa06QFyi7zT-33" edge="1">
          <mxGeometry relative="1" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-62" style="edgeStyle=orthogonalEdgeStyle;rounded=0;orthogonalLoop=1;jettySize=auto;html=1;exitX=1;exitY=0.5;exitDx=0;exitDy=0;entryX=0.5;entryY=0;entryDx=0;entryDy=0;fontSize=15;" parent="WIyWlLk6GJQsqaUBKTNV-1" source="QmN-cfn-Gxa06QFyi7zT-50" target="QmN-cfn-Gxa06QFyi7zT-52" edge="1">
          <mxGeometry relative="1" as="geometry">
            <Array as="points">
              <mxPoint x="1150" y="467" />
              <mxPoint x="1150" y="530" />
              <mxPoint x="1034" y="530" />
            </Array>
          </mxGeometry>
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-69" value="" style="rounded=1;whiteSpace=wrap;html=1;fontSize=15;arcSize=7;" parent="WIyWlLk6GJQsqaUBKTNV-1" vertex="1">
          <mxGeometry x="280" y="360" width="550" height="520" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-63" value="Execution-time Components" style="text;html=1;strokeColor=none;fillColor=none;align=center;verticalAlign=middle;whiteSpace=wrap;rounded=0;fontSize=15;" parent="WIyWlLk6GJQsqaUBKTNV-1" vertex="1">
          <mxGeometry x="460" y="360" width="210" height="30" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-64" value="dispatcher.cpp" style="swimlane;fontStyle=1;align=center;verticalAlign=top;childLayout=stackLayout;horizontal=1;startSize=26;horizontalStack=0;resizeParent=1;resizeParentMax=0;resizeLast=0;collapsible=1;marginBottom=0;fontSize=18;" parent="WIyWlLk6GJQsqaUBKTNV-1" vertex="1">
          <mxGeometry x="633" y="390" width="170" height="100" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-65" value="" style="line;strokeWidth=1;fillColor=none;align=left;verticalAlign=middle;spacingTop=-1;spacingLeft=3;spacingRight=3;rotatable=0;labelPosition=right;points=[];portConstraint=eastwest;fontSize=18;" parent="QmN-cfn-Gxa06QFyi7zT-64" vertex="1">
          <mxGeometry y="26" width="170" height="8" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-66" value="+ dispatch_callback(...)&#xa;+ mem_access_dispatch(...)&#xa;+ instruction_dispatch(...)" style="text;strokeColor=none;fillColor=none;align=left;verticalAlign=top;spacingLeft=4;spacingRight=4;overflow=hidden;rotatable=0;points=[[0,0.5],[1,0.5]];portConstraint=eastwest;fontSize=12;" parent="QmN-cfn-Gxa06QFyi7zT-64" vertex="1">
          <mxGeometry y="34" width="170" height="66" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-68" style="edgeStyle=orthogonalEdgeStyle;rounded=0;orthogonalLoop=1;jettySize=auto;html=1;exitX=0;exitY=0.5;exitDx=0;exitDy=0;entryX=1;entryY=0.5;entryDx=0;entryDy=0;fontSize=15;dashed=1;" parent="WIyWlLk6GJQsqaUBKTNV-1" source="QmN-cfn-Gxa06QFyi7zT-54" target="QmN-cfn-Gxa06QFyi7zT-66" edge="1">
          <mxGeometry relative="1" as="geometry">
            <Array as="points">
              <mxPoint x="934" y="587" />
              <mxPoint x="850" y="587" />
              <mxPoint x="850" y="457" />
            </Array>
          </mxGeometry>
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-71" value="&lt;font style=&quot;font-size: 8px;&quot;&gt;add calls to&lt;br style=&quot;font-size: 8px;&quot;&gt;dispatch_callback()&lt;br style=&quot;font-size: 8px;&quot;&gt;for every instruction&lt;br style=&quot;font-size: 8px;&quot;&gt;&lt;/font&gt;" style="edgeLabel;html=1;align=center;verticalAlign=middle;resizable=0;points=[];fontSize=8;" parent="QmN-cfn-Gxa06QFyi7zT-68" vertex="1" connectable="0">
          <mxGeometry x="-0.6126" y="1" relative="1" as="geometry">
            <mxPoint x="-44" y="-37" as="offset" />
          </mxGeometry>
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-74" value="TracerABC" style="swimlane;fontStyle=1;align=center;verticalAlign=top;childLayout=stackLayout;horizontal=1;startSize=26;horizontalStack=0;resizeParent=1;resizeParentMax=0;resizeLast=0;collapsible=1;marginBottom=0;fontSize=18;" parent="WIyWlLk6GJQsqaUBKTNV-1" vertex="1">
          <mxGeometry x="301" y="537" width="230" height="120" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-75" value="" style="line;strokeWidth=1;fillColor=none;align=left;verticalAlign=middle;spacingTop=-1;spacingLeft=3;spacingRight=3;rotatable=0;labelPosition=right;points=[];portConstraint=eastwest;fontSize=18;" parent="QmN-cfn-Gxa06QFyi7zT-74" vertex="1">
          <mxGeometry y="26" width="230" height="8" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-76" value="+ tracing_start(...)&#xa;+ tracing_finalize(...)&#xa;+ observe_instruction(...)&#xa;+ observe_mem_access(...)&#xa;+ observe_exception(...)" style="text;strokeColor=none;fillColor=none;align=left;verticalAlign=top;spacingLeft=4;spacingRight=4;overflow=hidden;rotatable=0;points=[[0,0.5],[1,0.5]];portConstraint=eastwest;fontSize=12;" parent="QmN-cfn-Gxa06QFyi7zT-74" vertex="1">
          <mxGeometry y="34" width="230" height="86" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-77" value="SpeculatorABC" style="swimlane;fontStyle=1;align=center;verticalAlign=top;childLayout=stackLayout;horizontal=1;startSize=26;horizontalStack=0;resizeParent=1;resizeParentMax=0;resizeLast=0;collapsible=1;marginBottom=0;fontSize=18;" parent="WIyWlLk6GJQsqaUBKTNV-1" vertex="1">
          <mxGeometry x="590" y="540" width="170" height="120" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-78" value="" style="line;strokeWidth=1;fillColor=none;align=left;verticalAlign=middle;spacingTop=-1;spacingLeft=3;spacingRight=3;rotatable=0;labelPosition=right;points=[];portConstraint=eastwest;fontSize=18;" parent="QmN-cfn-Gxa06QFyi7zT-77" vertex="1">
          <mxGeometry y="26" width="170" height="8" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-79" value="+ handle_instruction(...)&#xa;+ handle_mem_access(...)&#xa;+ handle_exception(...)&#xa;- checkpoint()&#xa;- rollback()" style="text;strokeColor=none;fillColor=none;align=left;verticalAlign=top;spacingLeft=4;spacingRight=4;overflow=hidden;rotatable=0;points=[[0,0.5],[1,0.5]];portConstraint=eastwest;fontSize=12;" parent="QmN-cfn-Gxa06QFyi7zT-77" vertex="1">
          <mxGeometry y="34" width="170" height="86" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-81" value="" style="html=1;verticalAlign=bottom;endArrow=block;rounded=0;fontSize=8;exitX=0.235;exitY=1.031;exitDx=0;exitDy=0;exitPerimeter=0;entryX=0.5;entryY=0;entryDx=0;entryDy=0;curved=1;" parent="WIyWlLk6GJQsqaUBKTNV-1" source="QmN-cfn-Gxa06QFyi7zT-66" target="QmN-cfn-Gxa06QFyi7zT-74" edge="1">
          <mxGeometry width="80" relative="1" as="geometry">
            <mxPoint x="660" y="560" as="sourcePoint" />
            <mxPoint x="740" y="560" as="targetPoint" />
          </mxGeometry>
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-82" value="dispatch instruction/mem. access" style="html=1;verticalAlign=bottom;endArrow=block;rounded=0;fontSize=9;exitX=0.245;exitY=1.01;exitDx=0;exitDy=0;exitPerimeter=0;" parent="WIyWlLk6GJQsqaUBKTNV-1" source="QmN-cfn-Gxa06QFyi7zT-66" target="QmN-cfn-Gxa06QFyi7zT-77" edge="1">
          <mxGeometry x="-0.2193" y="-25" width="80" relative="1" as="geometry">
            <mxPoint x="699.94" y="512.0160000000001" as="sourcePoint" />
            <mxPoint x="445" y="550" as="targetPoint" />
            <mxPoint as="offset" />
          </mxGeometry>
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-83" value="TracerCT" style="swimlane;fontStyle=1;align=center;verticalAlign=top;childLayout=stackLayout;horizontal=1;startSize=26;horizontalStack=0;resizeParent=1;resizeParentMax=0;resizeLast=0;collapsible=1;marginBottom=0;fontSize=18;" parent="WIyWlLk6GJQsqaUBKTNV-1" vertex="1">
          <mxGeometry x="301" y="697" width="230" height="80" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-84" value="" style="line;strokeWidth=1;fillColor=none;align=left;verticalAlign=middle;spacingTop=-1;spacingLeft=3;spacingRight=3;rotatable=0;labelPosition=right;points=[];portConstraint=eastwest;fontSize=18;" parent="QmN-cfn-Gxa06QFyi7zT-83" vertex="1">
          <mxGeometry y="26" width="230" height="8" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-85" value="+ observe_instruction(...)&#xa;+ observe_mem_access(...)" style="text;strokeColor=none;fillColor=none;align=left;verticalAlign=top;spacingLeft=4;spacingRight=4;overflow=hidden;rotatable=0;points=[[0,0.5],[1,0.5]];portConstraint=eastwest;fontSize=12;" parent="QmN-cfn-Gxa06QFyi7zT-83" vertex="1">
          <mxGeometry y="34" width="230" height="46" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-86" value="" style="endArrow=block;dashed=1;endFill=0;endSize=12;html=1;rounded=0;fontSize=8;entryX=0.5;entryY=1;entryDx=0;entryDy=0;" parent="WIyWlLk6GJQsqaUBKTNV-1" source="QmN-cfn-Gxa06QFyi7zT-83" target="QmN-cfn-Gxa06QFyi7zT-74" edge="1">
          <mxGeometry width="160" relative="1" as="geometry">
            <mxPoint x="461" y="607" as="sourcePoint" />
            <mxPoint x="621" y="607" as="targetPoint" />
          </mxGeometry>
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-90" value="SpeculatorSeq" style="swimlane;fontStyle=1;align=center;verticalAlign=top;childLayout=stackLayout;horizontal=1;startSize=26;horizontalStack=0;resizeParent=1;resizeParentMax=0;resizeLast=0;collapsible=1;marginBottom=0;fontSize=18;" parent="WIyWlLk6GJQsqaUBKTNV-1" vertex="1">
          <mxGeometry x="566" y="713" width="140" height="34" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-91" value="" style="line;strokeWidth=1;fillColor=none;align=left;verticalAlign=middle;spacingTop=-1;spacingLeft=3;spacingRight=3;rotatable=0;labelPosition=right;points=[];portConstraint=eastwest;fontSize=18;" parent="QmN-cfn-Gxa06QFyi7zT-90" vertex="1">
          <mxGeometry y="26" width="140" height="8" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-93" value="SpeculatorCond" style="swimlane;fontStyle=1;align=center;verticalAlign=top;childLayout=stackLayout;horizontal=1;startSize=26;horizontalStack=0;resizeParent=1;resizeParentMax=0;resizeLast=0;collapsible=1;marginBottom=0;fontSize=18;" parent="WIyWlLk6GJQsqaUBKTNV-1" vertex="1">
          <mxGeometry x="588" y="763" width="160" height="34" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-94" value="" style="line;strokeWidth=1;fillColor=none;align=left;verticalAlign=middle;spacingTop=-1;spacingLeft=3;spacingRight=3;rotatable=0;labelPosition=right;points=[];portConstraint=eastwest;fontSize=18;" parent="QmN-cfn-Gxa06QFyi7zT-93" vertex="1">
          <mxGeometry y="26" width="160" height="8" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-95" value="SpeculatorBpas" style="swimlane;fontStyle=1;align=center;verticalAlign=top;childLayout=stackLayout;horizontal=1;startSize=26;horizontalStack=0;resizeParent=1;resizeParentMax=0;resizeLast=0;collapsible=1;marginBottom=0;fontSize=18;" parent="WIyWlLk6GJQsqaUBKTNV-1" vertex="1">
          <mxGeometry x="643" y="813" width="160" height="34" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-96" value="" style="line;strokeWidth=1;fillColor=none;align=left;verticalAlign=middle;spacingTop=-1;spacingLeft=3;spacingRight=3;rotatable=0;labelPosition=right;points=[];portConstraint=eastwest;fontSize=18;" parent="QmN-cfn-Gxa06QFyi7zT-95" vertex="1">
          <mxGeometry y="26" width="160" height="8" as="geometry" />
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-97" value="" style="endArrow=block;dashed=1;endFill=0;endSize=12;html=1;rounded=0;fontSize=8;exitX=0.5;exitY=0;exitDx=0;exitDy=0;" parent="WIyWlLk6GJQsqaUBKTNV-1" source="QmN-cfn-Gxa06QFyi7zT-90" edge="1">
          <mxGeometry width="160" relative="1" as="geometry">
            <mxPoint x="680.71" y="660" as="sourcePoint" />
            <mxPoint x="676" y="660" as="targetPoint" />
            <Array as="points">
              <mxPoint x="636" y="680" />
              <mxPoint x="676" y="680" />
            </Array>
          </mxGeometry>
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-98" value="" style="endArrow=block;dashed=1;endFill=0;endSize=12;html=1;rounded=0;fontSize=8;exitX=0.829;exitY=0.013;exitDx=0;exitDy=0;exitPerimeter=0;" parent="WIyWlLk6GJQsqaUBKTNV-1" source="QmN-cfn-Gxa06QFyi7zT-93" edge="1">
          <mxGeometry width="160" relative="1" as="geometry">
            <mxPoint x="646" y="670" as="sourcePoint" />
            <mxPoint x="676" y="660" as="targetPoint" />
            <Array as="points">
              <mxPoint x="721" y="680" />
              <mxPoint x="676" y="680" />
            </Array>
          </mxGeometry>
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-99" value="" style="endArrow=block;dashed=1;endFill=0;endSize=12;html=1;rounded=0;fontSize=8;exitX=0.75;exitY=0;exitDx=0;exitDy=0;" parent="WIyWlLk6GJQsqaUBKTNV-1" source="QmN-cfn-Gxa06QFyi7zT-95" edge="1">
          <mxGeometry width="160" relative="1" as="geometry">
            <mxPoint x="731" y="720" as="sourcePoint" />
            <mxPoint x="676" y="660" as="targetPoint" />
            <Array as="points">
              <mxPoint x="766" y="680" />
              <mxPoint x="676" y="680" />
            </Array>
          </mxGeometry>
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-100" style="edgeStyle=orthogonalEdgeStyle;rounded=0;orthogonalLoop=1;jettySize=auto;html=1;fontSize=12;dashed=1;exitX=0.004;exitY=0.379;exitDx=0;exitDy=0;exitPerimeter=0;endArrow=block;endFill=1;" parent="WIyWlLk6GJQsqaUBKTNV-1" edge="1">
          <mxGeometry relative="1" as="geometry">
            <mxPoint x="296.97999999999985" y="603.594" as="sourcePoint" />
            <mxPoint x="534.06" y="150" as="targetPoint" />
            <Array as="points">
              <mxPoint x="245.06" y="604" />
              <mxPoint x="245.06" y="297" />
              <mxPoint x="534.06" y="297" />
            </Array>
          </mxGeometry>
        </mxCell>
        <mxCell id="QmN-cfn-Gxa06QFyi7zT-101" value="&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; TRACE File&amp;nbsp;&amp;nbsp;" style="edgeLabel;html=1;align=center;verticalAlign=middle;resizable=0;points=[];fontSize=12;" parent="QmN-cfn-Gxa06QFyi7zT-100" vertex="1" connectable="0">
          <mxGeometry x="0.2028" y="-2" relative="1" as="geometry">
            <mxPoint x="66" y="-3" as="offset" />
          </mxGeometry>
        </mxCell>
        <mxCell id="uKMc0L07USMBdFAgg4Kt-20" style="edgeStyle=orthogonalEdgeStyle;rounded=0;orthogonalLoop=1;jettySize=auto;html=1;dashed=1;endArrow=none;startFill=0;strokeColor=#666666;" parent="WIyWlLk6GJQsqaUBKTNV-1" target="uKMc0L07USMBdFAgg4Kt-19" edge="1">
          <mxGeometry relative="1" as="geometry">
            <Array as="points">
              <mxPoint x="421" y="340" />
              <mxPoint x="585" y="340" />
            </Array>
            <mxPoint x="421" y="410" as="sourcePoint" />
          </mxGeometry>
        </mxCell>
        <mxCell id="uKMc0L07USMBdFAgg4Kt-3" value="Logger" style="swimlane;fontStyle=1;align=center;verticalAlign=top;childLayout=stackLayout;horizontal=1;startSize=26;horizontalStack=0;resizeParent=1;resizeParentMax=0;resizeLast=0;collapsible=1;marginBottom=0;fontSize=18;" parent="WIyWlLk6GJQsqaUBKTNV-1" vertex="1">
          <mxGeometry x="379" y="410" width="120" height="34" as="geometry" />
        </mxCell>
        <mxCell id="uKMc0L07USMBdFAgg4Kt-4" value="" style="line;strokeWidth=1;fillColor=none;align=left;verticalAlign=middle;spacingTop=-1;spacingLeft=3;spacingRight=3;rotatable=0;labelPosition=right;points=[];portConstraint=eastwest;fontSize=18;" parent="uKMc0L07USMBdFAgg4Kt-3" vertex="1">
          <mxGeometry y="26" width="120" height="8" as="geometry" />
        </mxCell>
        <mxCell id="uKMc0L07USMBdFAgg4Kt-11" style="edgeStyle=orthogonalEdgeStyle;rounded=0;orthogonalLoop=1;jettySize=auto;html=1;entryX=1;entryY=0.5;entryDx=0;entryDy=0;dashed=1;endArrow=block;endFill=1;" parent="WIyWlLk6GJQsqaUBKTNV-1" edge="1">
          <mxGeometry relative="1" as="geometry">
            <Array as="points">
              <mxPoint x="550" y="416" />
              <mxPoint x="550" y="416" />
            </Array>
            <mxPoint x="633" y="416" as="sourcePoint" />
            <mxPoint x="499" y="416" as="targetPoint" />
          </mxGeometry>
        </mxCell>
        <mxCell id="uKMc0L07USMBdFAgg4Kt-12" style="edgeStyle=orthogonalEdgeStyle;rounded=0;orthogonalLoop=1;jettySize=auto;html=1;entryX=1;entryY=0.042;entryDx=0;entryDy=0;dashed=1;endArrow=block;endFill=1;entryPerimeter=0;" parent="WIyWlLk6GJQsqaUBKTNV-1" edge="1">
          <mxGeometry relative="1" as="geometry">
            <Array as="points">
              <mxPoint x="549" y="616" />
              <mxPoint x="549" y="438" />
              <mxPoint x="499" y="438" />
            </Array>
            <mxPoint x="531" y="616" as="sourcePoint" />
            <mxPoint x="499" y="438.336" as="targetPoint" />
          </mxGeometry>
        </mxCell>
        <mxCell id="uKMc0L07USMBdFAgg4Kt-13" style="edgeStyle=orthogonalEdgeStyle;rounded=0;orthogonalLoop=1;jettySize=auto;html=1;exitX=0;exitY=0.5;exitDx=0;exitDy=0;dashed=1;endArrow=block;endFill=1;" parent="WIyWlLk6GJQsqaUBKTNV-1" edge="1">
          <mxGeometry relative="1" as="geometry">
            <mxPoint x="499" y="427" as="targetPoint" />
            <Array as="points">
              <mxPoint x="569" y="617" />
              <mxPoint x="569" y="427" />
            </Array>
            <mxPoint x="589" y="617" as="sourcePoint" />
          </mxGeometry>
        </mxCell>
        <mxCell id="uKMc0L07USMBdFAgg4Kt-15" value="&lt;font&gt;Log Events&lt;/font&gt;" style="edgeLabel;html=1;align=center;verticalAlign=middle;resizable=0;points=[];fontSize=9;" parent="uKMc0L07USMBdFAgg4Kt-13" vertex="1" connectable="0">
          <mxGeometry x="-0.4384" y="-2" relative="1" as="geometry">
            <mxPoint x="-31" y="-153" as="offset" />
          </mxGeometry>
        </mxCell>
        <mxCell id="uKMc0L07USMBdFAgg4Kt-16" value="" style="sketch=0;outlineConnect=0;fontColor=#232F3E;gradientColor=none;fillColor=#232F3D;strokeColor=none;dashed=0;verticalLabelPosition=bottom;verticalAlign=top;align=center;html=1;fontSize=12;fontStyle=0;aspect=fixed;pointerEvents=1;shape=mxgraph.aws4.document;" parent="WIyWlLk6GJQsqaUBKTNV-1" vertex="1">
          <mxGeometry x="386" y="285" width="17.54" height="24" as="geometry" />
        </mxCell>
        <mxCell id="uKMc0L07USMBdFAgg4Kt-19" value="" style="sketch=0;outlineConnect=0;fontColor=#232F3E;gradientColor=none;fillColor=#666666;strokeColor=none;dashed=0;verticalLabelPosition=bottom;verticalAlign=top;align=center;html=1;fontSize=12;fontStyle=0;aspect=fixed;pointerEvents=1;shape=mxgraph.aws4.document;" parent="WIyWlLk6GJQsqaUBKTNV-1" vertex="1">
          <mxGeometry x="578" y="285" width="16.08" height="22" as="geometry" />
        </mxCell>
        <mxCell id="uKMc0L07USMBdFAgg4Kt-21" style="edgeStyle=orthogonalEdgeStyle;rounded=0;orthogonalLoop=1;jettySize=auto;html=1;dashed=1;endArrow=block;endFill=1;strokeColor=#666666;" parent="WIyWlLk6GJQsqaUBKTNV-1" edge="1">
          <mxGeometry relative="1" as="geometry">
            <mxPoint x="585.8" y="150.5" as="targetPoint" />
            <mxPoint x="585.8" y="283.5" as="sourcePoint" />
          </mxGeometry>
        </mxCell>
        <mxCell id="uKMc0L07USMBdFAgg4Kt-22" value="&lt;span style=&quot;background-color: rgb(255, 255, 255);&quot;&gt;Debug Trace&lt;/span&gt;&lt;div&gt;&lt;span style=&quot;background-color: rgb(255, 255, 255);&quot;&gt;(optional)&lt;/span&gt;&lt;/div&gt;" style="text;html=1;align=center;verticalAlign=middle;resizable=0;points=[];autosize=1;strokeColor=none;fillColor=none;fontColor=#666666;" parent="WIyWlLk6GJQsqaUBKTNV-1" vertex="1">
          <mxGeometry x="594.08" y="276" width="90" height="40" as="geometry" />
        </mxCell>
      </root>
    </mxGraphModel>
  </diagram>
</mxfile>


================================================
FILE: docs/assets/fuzzing-flow.drawio
================================================
<mxfile host="Electron" modified="2025-02-14T10:47:35.820Z" agent="5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) draw.io/16.5.1 Chrome/96.0.4664.110 Electron/16.0.7 Safari/537.36" etag="RKLjlPN-6zBEMbTxfot0" version="16.5.1" type="device"><diagram id="C5RBs43oDa-KdzZeNtuy" name="Page-1">7V1bd+K2Fv41rJXzQJav4DwGkplOD+1JJ5mm85Sl2ALcMRa1RQLz64+EZWNL8gWwIEnd1dViIWRb37582tra6ZnjxfpzBJbz35AHg56heeueedMzDMOxHfI/2rJJWnTD1pKWWeR7rG3XcO//hKwx7bbyPRgXOmKEAuwvi40uCkPo4kIbiCL0Wuw2RUHxrkswg0LDvQsCsfXR9/A8aXWM4a79F+jP5umd9cFV8s0CpJ3Zm8Rz4KHXXJN52zPHEUI4+bRYj2FAZy+dl8cvm8dg8mPw+dc/4n/At9F/H37/s58M9mmfn2SvEMEQHzz094enyQj8sL3RYGpF3vL201pjP9FeQLBi8+UG/uVyw94Yb9JpjF/9RQBCcjWaohDfs290cg0CfxaSzy55OhiRhhcYYZ8gcM2+wGhJWt25H3gTsEEr+g4xBu6P9Go0R5H/kwwLAjYm+TrCTJiMQaHHPf0ladZIawRj0ucunRida/oNrAsdJyDGrMFFQQCWsf+cvcYCRDM/HCGM0YJ1ajjvDB/62nCdkzqGw2eIFhBHZE619FuLzTtTqvTydSeghsba5jnhHLA2wHRilo28w518YNDvIQamIAY9Y7TVAT+8+I8gDOQ18RakCP2AYxQggvpNiBLp8IOAa0oFJIBTXCoe8RK4fjibbPvcWLuWr+z9aRMiv50GWyWc+54HQwotwgCDBEcK2hL5Id5OkD0i/5IpG2uXds8mDz4m1/rumvxLu0d4jELyLuRd6X0gEZJXSAVFgn+lEtXjz/AmEt0I77Rf63gbErw5jAN/i12CcWo59YMAXhCoArhD9IECftPXBdRNEXVTgnAAnmFwh2If+4iOHyV9OeTPBa5tNAPXUYStNagHF3rER7JLMkVzNEMhCG53rWTOV6EHPTbjuz4TtAWPYvc3xHjDbDRYYUStNF6kFpzMarT5K3/xnQ52adjp9U1qnJOrDbvaupdkVH2wtxGmb9bEBPfJkxjpzDDk+ilniWAAsP9SZBAyoNjwd1Twys17RpnSIWK0ilzIfpV32fxA2qWW+8dISUs67hU3LnGaM4iFca+jCGxy3Zie7P38pY/J978q9Ccfkifgfp0+DppOY4h7vNxnmDVThWB95/cfvz0+j/94+Pb39Ffv6jp1aycW/LWP/9qKus2uvue+2Qk9vZDIvJPXHTZGpj01qiNVgea6k4hPhWnRbblOHakvhu60oy/8QLauRkH4+5iDagVxtKruRf1oS/ZFL9Anlw/E941BDO8iNIvAomcMAuoLnyPyaZZ4xaTF818KmjP4Z0XXOSNK/frM31+THluXn32bjkJvNfGJm7VHX8LlCt8Q/71lYMng5IW246e3lCjphPr4omLVrjMynrFl+6WU8EZUuBIfn61K2Vi9bC1YoA2lpqfK+9jDYdGa6634nr5V9GmWWRxBnbHVB2elGVrvYJrhnMB0ltGRI+E2D6Qa+1q8svuUWTyhfxUlaEsC0+njbB4zROOHCLgwZ4V2Ri/X65ddrw9olRIdrSTF2qBVs9Su3ZGudwTQp6ufP2FEo1jm9aftZwHMLpzVZjjLLCq77kjiWYZkCTxUFc8aCjKRxLO2OFxcXl52Ma2asIfVWAgqYloyzE1VMa0GYY8upnUguANJTEsGrrKY1llX8unnhFmmq/ralfwB0auErVVMhN40zHXsMmJwqQ9zoaehWbD
wpnZoRItzFVlIq+0QVsl9lPLPK8ECCcvtd84py3WzOtB6HIdMR7oq/kIdpXQEIF3kwacZDGEEMGLUckzaPqdNHcNUyTD7GVWsopiOxCMp2zJNQ4sd36g3EU5jvCvIpAxdVXxDFyMJyQLCjSDA8AmT139yiWFnawmtvwtmijHWbqXRqnCYVjPhaGX3XObnNQHSN0pGc/tIRmEjKYucqtlIqqexDMLasKmlhN1myWllUdO2WKhjF2kz8xFKWajMdCUBT8pDerJNHfpFP95KHt3TcZZrcUunejsnGfp8+znH0dpSJa9itUPrWF6bpR2citfqhiAbHoGSJ7YU3o7YnojY8qZoaIveTRZqqSK27HZfqeCHM/Jeu/vZxdtZRsNQLe9MQUAQDgkXGlHHFiuRVllWYsewqzW79XitMoot7tskFJsZI3jB82qpB+q4dbtiISPXTexBa+TaPie5Jl49n7SVEeo6dr0XuW4386CeaytK2uIirEKuVeOkLT5Uq4qMc67PLKYk1D6XeYoUBjHyKGYvvPMYcqnSV5Ftx3CuCmi0lC1lFAdVkixVrpQFoBf07FVCwNkxrI54KyTeA54IX4mOTxpyVBZQLktaCBDwchFHLrxIWBJxxaaeTBbtj6mlyP1AwptKqFW5kel4lVx9W49oW6rSI/QuP0IhvEOjofVQha5IHOAauqsspnPLrjqvotKrGG/Pq4hJCZ3a1ynRu9mnTAn2GTlDecJ0xxmOlK6mG53KOIMkoR6EINhk2dXX9Cru8qvVehVrWL9HYO67R3CcYIgbSZ1XqVOiY7yKFF5lXqWsHARBjqjs04uPaNSFTMuFuHAc51wDLrRKUmX+TEfqnEfbQiRxHlIhUldjQtzgCdAs3h3LmaDZrHMdp3UdsrxJqVgoO5pjiJHPznXUqdD7cR2yKNNoG6in87FzHReZ6e+OYrUuBU1tv7KzWGaD1A0Yete0vhu15wGIY9/tFTawipu6h5bEOKQax37GuHYDlk18s1xHo/5oTw5VWwJq2nbs/i53gls/dH+Xd0GZJNbs77a11WaKPISe9/5yT1Md4yV0t1iTGc0dCz8wR5KO66Jw6s+yMeWmLSfmLVm5zM+9zn0M75dgK5KvEVgKqiTdzVUQC+UFSBOphyyaYapiHuZ5ClQwA9SntZyMXj5529CHlXaorCrQvhW16KB3MPLJNFLWrMLGNc3ndhrauGMrcHGid2Wf1uTItnJzdXUSa+HH4Inan2RF9IVyhJVLGdE9zTloo1JOSk7bTv2opSypqjXOEanK/Ui5A5cufaSIWFbxF+pyPUxxb04XkQwCfxmXGfActvwBY36NnHcdPcOcOi50XcHPkG+eHduylW6GaZwWGpKw5UkdgLgXJqGlHw8IblNSt0+Ig7ROjwCD5Hj/uWGQmK5myJTCoFtc+caBJBZzShxEYmz9K3DQuFNZsu2UU+KgS9yBemL6XmpOOkoYIm8UD6/RynHNLOWj7ZqTJQ9cmr7M9a+rUWlplf0VnVUUXUFXpfKU9eBqiyQrKlNp6UWl4ZRPYZXKM9cENpqfLzn1ORE1hlbnU+JMzj42Pidi11jslgytWX3uo/a59u3PGXJFhlbkev+Ogpe1xYne88kS6RuL+6uSI3Ufj9WbvBoOJVuhJ2X1w7N6mkKkuXGZkOFbPsmYhgmUVw05Lroh7n3m0py0/30l//md7ul8SHs7rLO3A61Vc3sCgyqGbyUbSR/QoHJhEsMWzzKcNmwochiJif2AQHBVhLKqQmcD4jxn9Esq/b+1Qv8lJdaPLfTPrxpMozhE43QM/o+R8KVc21pGlTyw2r8AIKaflacYfwR/a9SenH9LBf3J5e7PZSbdd3911Lz9Pw==</diagram></mxfile>

================================================
FILE: docs/assets/tsa-sq-template.drawio
================================================
<mxfile host="Electron" modified="2025-07-21T10:25:41.035Z" agent="5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) draw.io/16.5.1 Chrome/96.0.4664.110 Electron/16.0.7 Safari/537.36" etag="BbGekvxkDWImu01GMpuU" version="16.5.1" type="device"><diagram id="VUT32xMhq3pvxhd0Flhl" name="Page-1">7Vtdc5s4FP01nmkfkjESYPvRcZJmptnZzma7m33qyCAbpoBcIcf2/vqVQHxJ2CYOJiTZvsS6EgKde+7RvYIO4CzcfqFo5f1GXBwMwNDdDuD1AADDHkH+R1h20jIEk9SypL4rbYXhwf8XZwOlde27OK4MZIQEzF9VjQ6JIuywig1RSjbVYQsSVO+6QkusGR4cFOjWv32XednCLLPouMP+0pO3BhDaaU+IstFyKbGHXLIpmeDNAM4oISz9FW5nOBDwZcCk193u6c2fjOKINblgeDe9uDccYzeZjR7t9TSOx8sLMEqneULBWi5ZPi3bZRhQso5cLGYxBvBq4/kMP6yQI3o33O3c5rEwkN0LPwhmJCA0uRYuFgvgONweM0p+4lKPa89ty+Y9+jrk0p4wZXhbMsl1fcEkxIzu+BDZC22JcUazDPNN4TMwlDav5C4zuxBJnizzuQsk+Q8J5nOAtc8LrGvhsWvWATsGc2i3BKzRP2ANDdevmEaJ7qTgATvgD3E1p/zXUvz6hBwmwJkmUelHnzVHcDRYFe0qqhGJsOICaUKBv4x40+EYY26/Etj6XD+msiP0XVfcpta9BQGGYnoSsQf5UDXR/Wzn5cqTOQ+amvPGNb6DZ4sJzXXfYw4aGIqN47Df1nzgR/GbaRz3m1EXdGdznFWjZdJbmbNEYP0YZmZ+l7zngOwNj8veUUcxsmpH63Id2yntMuygS9jrtpAUX9d/KuBNTfEKRaot94EIn33eyW11M3Bz6V63998f7hJnirRJD9gVxcIFIh9DjofTkQzrgdtTCpgqBWBDCpxtt2uQnuHInYpMVyAUoDj2nSp8Vaw5OHT3WG78IxqXVta83pY7r3eytRddhugSswNLkOKB3UqmrfughLFVA3FmozhAzH+q5ud1uMs7fCM+f+Iio1HEFRhWdYqYrKmD5VXldFqdCFrVicYKB1JgtIkSGuTLPp0ZY40Zf+JYPN8MxSLybqKMf/3bMVsI1bGyR471SLW71OqJ5o5kRzR0lawKdsk59q+1qAWTfOJiIx9aJD8RoSEKigHZTH/5DvPDpPqtzZ8oilwS8pra/bxX5jsQ5tbzWlWlJ6+t0pmmqN4/VPK9HXzzfPT18NWLvgRf+C7wtZpmGWcTL0OvzJKMEbShXklSpUrXHzf3v0+v96eSR9LSl2vnJ74RUl5gCmiihRjEfBK9K51Us1lz9OpxrBeSC7QO2A+P71SBOAp4gzBrcmm+eji3XDgag5cWjlPGkPOzYabyNmtFaL16dLVfLG599ih7xO9SqchbRaUoGlmhuK/ABCdXmGlFdmDhUlWOVqIyLHpSidpgjzw/txK1R8pEQJnozJWooZeiLfFuWOHdqCHxjM6IZzck3qRXxINQUa7hiUcg6kE1BMpE5yaeXnSfRfCaEq87xZs0JJ7RL8lTmZfvoS9lXteSl93u40me0VTzMg/1lHoQtiV6ZreiB/SzkLNQ7zTmHSOe9rXC7S3k/0RlgmIv/xaiC372672ERqvRifzUNbZjfupnSRo/s6LsHs1x8I3Evjh74V1zwhgJ91Zt5bcWHlqJycLtUnx5djlHnOSXC052b6B9K5NzbC+tnlP2mYqfBOnVwm+k88SA+ynxsq8q4EfNgoymhV92vvl/rLcc62Yf9qIXEMjoFS+AUsgbp54IqC+5ra5zFP2cV3k5zf2nMeW9vpu
2at6fdfpuGpytTu59tQKa7hD9UgJN2EfgsqV6xZy0pQW8WXy9ng4v/hcAvPkP</diagram></mxfile>

================================================
FILE: docs/assets/unicorn-model-state-machine.drawio
================================================
<mxfile host="Electron" modified="2024-11-12T17:35:30.054Z" agent="5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) draw.io/16.5.1 Chrome/96.0.4664.110 Electron/16.0.7 Safari/537.36" etag="H7DxQGuZ2p2YCU2e7pUZ" version="16.5.1" type="device"><diagram id="Uj5UJ1iNXtTnnK9jLXeE" name="Page-1">7Vxbc5s4FP41nml3phmQuD4mTtzONOtmm3S23ZeOYmSbLUZeITdxf/0KEBcDBmyMgaTuTApHEhyk7zs6R7cRHK+e31O0Xv5JLOyMgGQ9j+D1CAAgQZn/50u2oUQGqhRKFtS2hCwR3Nu/sBBG2Ta2hb2djIwQh9nrXeGMuC6esR0ZopQ87WabE2f3rWu0wDnB/Qw5eenftsWWQqqpSpLwAduLpXg1gFALU1Yoyi0+xVsiizylRPBmBMeUEBZerZ7H2PGrL6qYsNxkT2qsGcUuq1Pgr6+f7pzF9uP0++zLP9PF+8ndVnkn60I5to0+GVu8BsQtoWxJFsRFzk0ivaJk41rYf6zE75I8t4SsuVDmwn8xY1vRnGjDCBct2coRqfjZZl/94hequPuWSrl+Fk8ObrbRjcvoNiwE1Oj+WzoxKRfcRQU9RskPPCYOocEHwskE8h9PCT/d/969VSpEHtnQGS6rR4FNRBeYleTT4obnnMFkhbmmvBzFDmL2z109kMDuIs6XtC6/EA18SGOHz/2JnI140x/89o4/TJoSukL8AZrDtb96pPxq4V/5GS5dX8X7NZ7lsLKLhKelzfD9GgU19cQtwm6rI8deuPzawXMW1/5PTBl+Lq//fH2JAtAU8BXmRYm49pTiaiRbpmiqSS1VsV9+cHxqRidJmkwk6bR0AjXppHdJJ7CfTje8povJ1EcaGVFv2xsaRX7DgGgkNyIR5DTStNOSCNYkkaw0ZFFQ9JJStE1lWBPbZV7qyXe+IAGdLIFd1KlSxn/JFlDkhgUMpaIA0EBZAX4RfmUC7Li6GmD9GDMyJe47r4emxNT6ZkqUIfbIDT3cNrpkZQhdsrKfSx+QazmYDqdX1vS+UQkMr1du6ty2ESuqNZnUaayoHsmkvnZMKuwdm7TfbDoBm7SabDK7cHLVjA3X5HIPVDFBWf52HFAwxDHA4QJRlnqBRLUciZoBy/K3hERjKEjsF6L2dH1nRhSsiK5lGZYVaAlS5m9IHQMp2AtIVQzYmFlEnWW8RhoKol5Gdwl6gcTs5GrWuMEsFMEZoCjqMBWkff4yzaEzwZ5cHXnNbcdJtfx8PgezWREmLO1RU5MR62bBWXZkF3YdnCmd+sRyiuLRYOBAhw31mjTvpL8x1QzuFLW8v8nkVypmIEyzNH87RkHp1Ik+Frr6cKHbSQfVFLrQqICuVJq/Jeh26qy/Quh2MvPbGLpaOXR1rTR/O9BVO40KXiF01UFCt2L8VwOl+VuCbqfTeq8Qup0M1zWFLjArpi4MvSx/O9AVr0wHwJ9ub68uxx9zkO5/FKzD3kXBPRrqkuoahoZBsKZdgcnktIbB6LM7BjOwgxWDrno2MjjHoKswVsNC4nCB2IlzlQNihZ+vmh34+UqPVm28BpPYia+UQ2LFYIkC9LL87SDRyPk+X+6uLx9uRuEyrSbuj4MesXOFZj8WQbGdmaDJZDzuykMCet88JKD0xxwcNxkoH2oN/N+prYFZ0xoYDa1Bo7Y2c4QLlkRi17LdBb+aoI2zZ7n+Mlgy+X0e5pBc4v+1Xf7nDUemv6jSb6u3Z91/l2WwMcPFDH40eKwonYbB2S0ZmlHAYA2ek8E98iyP3B9wMIXbGPyIGrb1DQJH9ejZ5Wz6gWPI+jl8y6gKT2Bh6tqWl2FVtDpWRdEu1DPaFQUOz640ihLa2MIo191X39Eexuy
SRl2vWgOpG2UFWrIrezb+t2hXWtkG0oltkSWlf8YFDtC4NBwOa8W8gHOZl2bndoBC/k6J/9kxief7SfyC2Aj6yMbXNwjQSgRR98CCTiKI7FrzygjC7CKCKD5MoL6leBnxgNFDIyHn96bfTK/zhsNx7LWHq+u5YJTe/xVUuer/8+XEZZlxvNSi/mZmWc7Ey3ELVI3MGq3FX4M3ykfM0/hO0omNct3d6k0napqRK79d/f7h8vPDC6FX9pyzmG2dsUvNdzS3eMF7mBG8LO5Z+PV/G/+sw6vdA+eEkIve+TBb4qDBEGVhXxVktnm/LLnY5qk0zoSDw3EkZFkUe0EGkiQmUjKPhVEQuyw7wCCjZ3LYQR1FV4jNltg7vRriJKBjdMjVU0oVhj0/bYY4JSrUSM9CFOvBkzac7EErBC0WN1gwaoBSeXyDwBWhQuyK+CRJ4h/FKlU6SJk9OtR6URI/HfqyI78sPzSTey/F0ctQkXMnoTlLk2UVK+gxsvaqv7jooXu0QMFft6CI11iR+jNnRS1DMdtQN7ZTAvseduYX39NPfvM2b2Wk2KQE/Kmi1UGfUfEBxyq/o3t91fe6+8cvFeC4x6W9aEWYUNWpelwhjrPboPS1LJ+mnwU6vIjmAyNHVs53tdzNKgodgHR4b8tvkxOAwygwOUkZ3vwP</diagram></mxfile>

================================================
FILE: docs/faq/general.md
================================================
# General FAQ

## Overview

#### What is Revizor? {#what-is-revizor}

:   Revizor is a security-oriented fuzzer designed to detect microarchitectural information leaks in CPUs. It automatically generates random test programs, executes them on real hardware, and compares the observed behavior against a formal model to identify unexpected information leakage through side channels like those exploited by Spectre and Meltdown attacks.

#### Who is Revizor for? {#who-uses-revizor}

:   Revizor is primarily designed for CPU security researchers and hardware vendors interested in identifying and mitigating microarchitectural vulnerabilities. It may also be useful for system developers and security professionals who want to assess the security of the hardware platforms they work with.

#### How does Revizor differ from other hardware fuzzers (e.g., SiliFuzz)? {#how-does-revizor-differ-from-other-hardware-fuzzers}

:   Most of the existing hardware fuzzers focus on finding functional bugs, such as incorrect instruction execution or crashes. Revizor, on the other hand, is specifically designed to find security vulnerabilities related to microarchitectural side channels. It uses a model-based approach to define what information is allowed to leak and tests whether the CPU adheres to these specifications.

:   See [Revizor at a Glance](../intro/01-overview.md) for a more detailed introduction.

#### How is Revizor different from constant-time testing tools (e.g., Microwalk)? {#how-does-revizor-differ-from-ct-testing-tools}

:   Constant-time testing tools like Microwalk focus on verifying that software implementations do not leak sensitive information through timing variations. They analyze the execution of programs to ensure that their timing behavior is independent of secret data.

:   Revizor, in contrast, tests the CPU hardware itself for microarchitectural information leaks. It tests whether the CPU behaves as expected, regardless of the software running on it.

#### What CPUs does Revizor support? {#supported-cpus}

:   Revizor currently supports testing on x86-64 CPUs from Intel and AMD, as well as ARM CPUs.

#### Does Revizor detect only those leaks that are described in the contract? {#leaks-described-in-contract}

:   No! It is a common misconception that Revizor can only find leaks that are explicitly described in the contract. In reality, it is the opposite: The contract defines what Revizor should *not* report as a leak, which allows the tool to filter out the known types of leakage and focus on finding unexpected leaks that violate the contract. This is how Revizor is able to discover new vulnerabilities even in completely black-box CPUs.

---

## Installing Revizor

#### What operating system is required to run Revizor? {#required-os}

:   You will need Linux.

#### Do I need a specific Linux distribution/version? {#specific-linux-distro}

:    No, Revizor should work on any reasonably recent Linux. If you encounter issues, that's most likely a bug that we would like to hear about. Please report any problems on our [GitHub Issues page](https://github.com/microsoft/side-channel-fuzzer/issues).

#### Does Revizor require root or administrator privileges? {#requires-root}

:   Yes. Revizor's executor is implemented as a kernel module that requires loading into the kernel and accessing hardware performance counters. Both operations require root privileges. Additionally, some system configuration steps recommended for optimal performance (like disabling hyperthreading) require administrative access.

#### Can I run Revizor in a virtual machine? {#run-on-vms}

:   Unfortunately, not. Revizor requires direct access to the CPU's PMU to accurately measure side-channel leakage. Running Revizor inside a virtual machine would introduce additional layers of abstraction and interference that could distort the measurements and lead to inaccurate results. You need to run Revizor on a bare-metal installation of Linux.

---

## Running Revizor

#### Can Revizor affect system stability? {#safety}

:   Although extremely unlikely, Revizor could potentially affect the host operating system. Revizor executes randomly-generated code in kernel space, which means that a misconfiguration or bug can crash the system and potentially lead to data loss. However, it does not intentionally perform any operations that would damage hardware.

:   You should never run Revizor on production machines or systems containing important data without backups. Always use a dedicated testing machine.

#### How long does it take to find a vulnerability? {#time-to-find}

:   This varies significantly, based on the complexity of the experiment. Typical numbers range from minutes to weeks.

#### Can Revizor test my own assembly programs or does it only generate random ones? {#test-custom-programs}

:   Yes, Revizor can test custom assembly programs using the `-t` flag. You can provide your own test case program in assembly format, and Revizor will execute it with randomly-generated inputs to check for contract violations. This is useful when you want to verify specific code patterns or investigate potential vulnerabilities in particular instruction sequences.

:   See the [CLI Reference](../ref/cli.md) for details on the `-t` option.

#### How many computational resources does a typical fuzzing campaign require? {#resource-requirements}

:   Resource requirements vary significantly based on the fuzzing configuration. A typical campaign runs continuously for hours to weeks. The primary variables affecting performance are the number of inputs per test case, sample sizes for hardware measurements, and the complexity of the ISA subset being tested. Larger sample sizes increase accuracy but reduce throughput. Most campaigns run on standard server or workstation hardware without specialized requirements beyond the supported CPU architecture.

:   See [How to Design a Fuzzing Campaign](../howto/design-campaign.md) for guidance on balancing performance and detection effectiveness.

---

## Violations

#### Are false positives common? How does Revizor handle them? {#false-positives}

:   No, unless it is misconfigured. Revizor uses a multi-stage filtering pipeline to eliminate false positives caused by noise and non-deterministic hardware behavior. This removes the vast majority of spurious violations. However, if Revizor is misconfigured (e.g., insufficient sample sizes), false positives can still occur due to noise in hardware measurements. These are relatively easy to identify as they tend to be unstable and non-reproducible.

:   See [How to Interpret Violation Results](../howto/interpret-results.md#evaluating-violation-quality) for guidance on evaluating violation quality and handling false positives.

#### Can Revizor automatically generate exploits or proof-of-concept code? {#generate-exploits}

:   No. Revizor detects violations of the leakage contract by identifying test cases where hardware behavior differs from the contract's predictions. While it provides the test program and inputs that trigger the violation, it does not automatically generate working exploits. The violation artifacts serve as evidence of unexpected leakage and a starting point for manual security analysis. You can use the minimization feature to simplify the test case, making it easier to understand and potentially develop into a proof-of-concept.

:   See [How to Minimize Test Cases](../howto/minimize.md) for details on simplifying violations.

#### How do I know if a detected violation is actually exploitable? {#exploitability}

:   Determining exploitability requires manual analysis of the violation. Start by reproducing the violation to confirm it's stable, then use the minimization feature to simplify the test case. Next, analyze the minimized program to understand what information is leaking and through which side channel. Root-cause analysis involves examining the assembly code, understanding the data dependencies, and determining whether an attacker could control the leaked information to extract sensitive data. Not all violations are practically exploitable, but all indicate deviation from the specified security contract.

:   See [How to Root-Cause a Violation](../howto/root-cause-a-violation.md) for systematic analysis techniques.

#### Is Revizor deterministic? Can I reproduce results? {#reproducibility}

:   Contract traces are fully deterministic—the same program with the same inputs always produces identical contract traces. Hardware traces, however, contain inherent non-determinism due to timing variations, cache state, and other microarchitectural effects. Revizor handles this through statistical analysis of multiple samples. Violations are reproducible when the same test program and inputs consistently show the same distributional differences in hardware traces. The violation artifact includes all necessary files (program, inputs, configuration) to reproduce detected violations, and Revizor provides a dedicated reproduce mode for verification.

:   See [Execution Modes](../ref/modes.md) for details on the reproduce mode.

---

## Development and Contribution

#### Is Revizor actively maintained? {#maintenance-status}

:   Yes. Revizor is actively maintained and continues to receive updates, bug fixes, and new features. The project has an active GitHub repository with recent commits and ongoing development.

#### Can I contribute to Revizor? {#contributing}

:   Yes, we welcome contributions from the community! You can contribute by reporting issues, suggesting new features, improving documentation, or submitting code changes through pull requests. Please refer to our [Contribution Guidelines](../internals/index.md) for instructions on how to get started.


================================================
FILE: docs/glossary.md
================================================
# Glossary

This glossary defines key terms used throughout the Revizor documentation. The entries are ordered in such a way that more fundamental concepts appear first, building up to more complex ideas. So, you should be able to get a good understanding of the terminology by reading the glossary top-down.

---

####<a name="noninterference"></a>Noninterference
: A formal property that captures perfect confidentiality, stating that changes in secret data have no observable effect on public outputs. A program satisfies noninterference if variations in secret inputs cause no differences in public outputs. In Revizor's context, this property is checked with respect to side-channel observations and speculation contracts.

!!! info "Related Documentation"
    - [Primer: Information-Flow Properties](intro/03-primer.md#information-flow-properties)
    - [Primer: Noninterference Definition](intro/03-primer.md#noninterference-definition-and-examples)

---

####<a name="information-flow"></a>Information Flow
: The movement of data through a computation. Information-flow security is concerned with how data moves through a system and how it can be observed by an attacker. For example, if a program contains a data-dependent memory access `array[secret_index]`, the value of `secret_index` influences which memory location is accessed. In turn, if the attacker can observe the cache lines being accessed by this program, the execution of the array access will reveal (leak) information about `secret_index` through side channels. This creates an information flow from the secret data (`secret_index`) to the attacker's observations (cache state).

!!! info "Related Documentation"
    - [Primer: Information-Flow Properties](intro/03-primer.md#information-flow-properties)
    - [Primer: Side Channels](intro/03-primer.md#beyond-direct-outputs-side-channels)

---

####<a name="speculation-contract"></a>Speculation Contract (aka Leakage Contract)
: A formalization of how we expect the CPU to behave and what information we expect it to leak when any given program is executed. A simplified and deterministic model of CPU hardware designed to capture the information that a given program could leak over side channels when executed with given inputs. A speculation contract defines two key aspects for every instruction: an observation clause (describing what data is exposed) and an execution clause (describing how hardware optimizations like speculative execution affect the instruction). Speculation contracts intentionally overestimate possible leaks to ensure conservative and deterministic traces.

!!! info "Related Documentation"
    - [Topic: Contracts](topics/contracts.md)
    - [Primer: Speculation Contracts](intro/03-primer.md#speculation-contracts-dealing-with-the-complexity-of-modern-hardware)
    - [How-to: Choose a Contract](howto/choose-contract.md)

---

####<a name="observation-clause"></a>Observation Clause
: Part of a speculation contract that specifies what information an instruction exposes through side channels when executed. For example, an observation clause might specify that a load instruction exposes the memory address it accesses.

!!! info "Related Documentation"
    - [Topic: Contracts - Contract Structure](topics/contracts.md#contract-structure)
    - [Primer: Speculation Contracts](intro/03-primer.md#speculation-contracts-dealing-with-the-complexity-of-modern-hardware)

---

####<a name="execution-clause"></a>Execution Clause
: Part of a speculation contract that specifies how hardware optimizations (particularly speculative execution) affect an instruction's semantics. For example, an execution clause might specify that a conditional branch may mispredict its target and execute down the wrong path.

!!! info "Related Documentation"
    - [Topic: Contracts - Contract Structure](topics/contracts.md#contract-structure)
    - [Primer: Speculation Contracts](intro/03-primer.md#speculation-contracts-dealing-with-the-complexity-of-modern-hardware)

---

####<a name="leakage-model"></a>Leakage Model
: An implementation of a speculation contract. This model is used to compare the actual CPU behavior against the specification defined by the contract. It predicts what information flow is allowed through side channels for any given test case.

!!! info "Related Documentation"
    - [Topic: Leakage Models](topics/models.md)
    - [Internals: Model Architecture](internals/architecture/model.md)
    - [Internals: Unicorn Backend](internals/model-backends/model-unicorn.md)
    - [Internals: DynamoRIO Backend](internals/model-backends/model-dr.md)

---

####<a name="contract-trace"></a>Contract Trace (CTrace)
: The output of a leakage model. A CTrace is a recording of all exposed information when a given program is executed on the leakage model (e.g., a sequence of memory addresses accessed). This trace represents the expected information flow according to the contract.

!!! info "Related Documentation"
    - [Topic: Contracts - Contract Traces](topics/contracts.md#contract-traces)
    - [Topic: Leakage Models - Trace Representation](topics/models.md#trace-representation)
    - [Topic: Trace Analysis](topics/trace-analysis.md)

---

####<a name="executor"></a>Executor
: The component responsible for running programs on real hardware and collecting attacker-observable microarchitectural changes. This component acts as the counterpart to the leakage model; that is, while the model represents our expectations of the CPU behavior, the executor captures the actual behavior of the CPU under test.

!!! info "Related Documentation"
    - [Internals: Executor Architecture](internals/architecture/exec.md)
    - [Reference: Configuration Options](ref/config.md)

---

####<a name="hardware-trace"></a>Hardware Trace (HTrace)
: The output of the executor. An HTrace is a recording of microarchitectural state changes (like cache evictions, readings of the time stamp counter, etc.) observed during a program execution. These traces are used to capture the information flows on the CPU under test, both the expected and unexpected ones.

!!! info "Related Documentation"
    - [Topic: Trace Analysis](topics/trace-analysis.md)
    - [Internals: Executor Architecture](internals/architecture/exec.md)

---

####<a name="test-case-program"></a>Test Case Program
: A small assembly program, either generated automatically by Revizor or written manually by the user. Test case programs are intended to be executed on the target CPU to collect hardware traces, and on the leakage model to collect contract traces.

!!! info "Related Documentation"
    - [Topic: Test Case Generation](topics/test-case-generation.md)
    - [Internals: Code Generator Architecture](internals/architecture/code.md)
    - [Reference: Binary Formats - RCBF](ref/binary-formats.md)

---

####<a name="test-case-data"></a>Test Case Data (aka Test Case Input)
: A blob of data used to initialize memory and registers for the execution of a test case program. Test case data can be generated automatically by Revizor or provided manually by the user.

!!! info "Related Documentation"
    - [Topic: Test Case Generation](topics/test-case-generation.md)
    - [Internals: Data Generator Architecture](internals/architecture/data.md)
    - [Reference: Binary Formats - RDBF](ref/binary-formats.md)

---

####<a name="sandbox"></a>Sandbox (or Test Case Sandbox)
: An isolated execution environment where test case programs are run on the target CPU and on the model. On the technical level, a sandbox consists of a dedicated region of memory where the test case program and data are loaded, as well as a set of mechanisms to isolate the test case execution from the rest of the system (e.g., by disabling interrupts, overriding MSRs, etc.).

!!! info "Related Documentation"
    - [Reference: Sandbox](ref/sandbox.md)
    - [Reference: Registers](ref/registers.md)

---

####<a name="model-based-relational-testing"></a>Model-based Relational Testing (MRT)
: The core methodology of Revizor. It involves randomly generating test programs and inputs to them, executing them with the executor and the model, collecting the corresponding hardware and contract traces, identifying the information flows in both, and comparing them to find unexpected leaks.

!!! info "Related Documentation"
    - [Primer: Model-Based Relational Testing](intro/03-primer.md#model-based-relational-testing-and-revizor)
    - [Topic: Trace Analysis](topics/trace-analysis.md)
    - [Internals: Fuzzer Architecture](internals/architecture/fuzz.md)

---

####<a name="violation"></a>Violation
: A situation where hardware traces expose some information that is not exposed in the contract traces for the same test case. This indicates that the CPU is leaking some information not specified by the contract, which may represent a security vulnerability.

!!! info "Related Documentation"
    - [Topic: Trace Analysis](topics/trace-analysis.md)
    - [Primer: Contract Violation](intro/03-primer.md#building-and-testing-speculation-contracts)
    - [How-to: Root-Cause a Violation](howto/root-cause-a-violation.md)

---

####<a name="violation-artifact"></a>Violation Artifact (aka Contract Counterexample)
: A bundle consisting of a test case program, two inputs that trigger the violation (plus extra inputs to set the uarch state, if needed), the corresponding hardware and contract traces, and a collection of configuration files to reproduce the violation. Violation artifacts are generated automatically by Revizor when a violation is detected.

!!! info "Related Documentation"
    - [Reference: Binary Formats](ref/binary-formats.md)
    - [How-to: Root-Cause a Violation](howto/root-cause-a-violation.md)
    - [How-to: Minimize Test Cases](howto/minimize.md)

---

####<a name="minimization"></a>Minimization
: A post-processing mode that takes a violation artifact and performs transformation passes to simplify the program and data while preserving the violation. The goal is to produce a minimal artifact that is easier to understand and analyze, using program passes (instruction removal/simplification), input passes (sequence/diff minimization), and analysis passes (source analysis).

!!! info "Related Documentation"
    - [How-to: Minimize Test Cases](howto/minimize.md)
    - [Reference: Minimization Passes](ref/minimization-passes.md)
    - [Internals: Minimization Architecture](internals/architecture/mini.md)

---

####<a name="multi-stage-filtering"></a>Multi-stage Filtering
: A pipeline of validation stages applied to potential violations to rule out false positives. A violation must survive all stages to be reported.

!!! info "Related Documentation"
    - [Internals: Fuzzer Architecture](internals/architecture/fuzz.md)
    - [Reference: Configuration Options](ref/config.md)

---

####<a name="priming-test"></a>Priming Test
: One of the most important validation stages. It is motivated by the following problem: when hardware traces are collected for a sequence of many inputs, the execution of the program with earlier inputs will affect the microarchitectural state for later inputs (e.g., the branch predictor state). This can lead to false positives, where two inputs that should be indistinguishable according to the contract produce different hardware traces simply because they were executed in different microarchitectural states (e.g., one input triggered a misprediction while the other did not). These cases don't actually represent a violation because the difference in traces is not caused by the data difference, but rather by the sequence of executions.

The priming test mitigates this problem by re-executing the violating inputs in a different sequence, by swapping the order of inputs that trigger a violation. If the violation disappears when the order is swapped, it indicates that the difference in traces was due to inconsistent microarchitectural state rather than a true violation. Otherwise, we have evidence that the violation is genuine.

!!! info "Related Documentation"
    - [Reference: Configuration Options - enable_priming](ref/config.md#enable_priming)
    - [Internals: Fuzzer Architecture](internals/architecture/fuzz.md)

---

####<a name="contract-compliance"></a>Contract Compliance
: A CPU complies with a speculation contract if, for all possible programs and input pairs that produce identical contract traces, the corresponding hardware traces are also identical. This ensures that the contract captures all information that the hardware can leak. While testing all possible programs is infeasible, Revizor approximates this by randomly sampling the search space with a large number of test cases.

!!! info "Related Documentation"
    - [Topic: Trace Analysis - Contract Compliance Property](topics/trace-analysis.md#contract-compliance-property)
    - [Topic: Contracts - Contract Compliance](topics/contracts.md#contract-compliance)
    - [Primer: Contract Compliance](intro/03-primer.md#building-and-testing-speculation-contracts)

---

####<a name="contract-equivalence-class"></a>Contract Equivalence Class (ContractEqClass)
: A group of inputs that produce identical contract traces for a given test case program. According to the leakage model, these inputs should be indistinguishable when executed.

!!! info "Related Documentation"
    - [Topic: Trace Analysis - Deterministic Trace Comparison](topics/trace-analysis.md#deterministic-trace-comparison)
    - [Internals: Analyser Architecture](internals/architecture/analysis.md)

---

####<a name="hardware-equivalence-class"></a>Hardware Equivalence Class (HardwareEqClass)
: A group of inputs that produce statistically similar hardware traces for a given test case program. These inputs are actually indistinguishable on real hardware.

!!! info "Related Documentation"
    - [Topic: Trace Analysis - Statistical Trace Comparison](topics/trace-analysis.md#statistical-trace-comparison)
    - [Internals: Analyser Architecture](internals/architecture/analysis.md)

---

####<a name="boosting"></a>Boosting (aka Contract-driven Input Generation)
: A data generation optimization technique that uses taint analysis to generate inputs more likely to trigger contract violations. The boosted generator identifies which input bytes affect the contract trace and generates new inputs by mutating the non-tainted bytes. This way, we can deterministically and efficiently create any number of inputs that produce the same contract trace (i.e., form one ContractEqClass), increasing the chances of finding violations.

!!! info "Related Documentation"
    - [Internals: Data Generator Architecture](internals/architecture/data.md)
    - [Reference: Configuration Options](ref/config.md)

---

####<a name="fuzzer"></a>Fuzzer
: The main orchestrator in Revizor that manages core components (CodeGenerator, DataGenerator, Model, Executor, and Analyser) and coordinates the fuzzing loop. When a potential violation is found, the Fuzzer runs it through a multi-stage filtering pipeline to eliminate false positives.

!!! info "Related Documentation"
    - [Internals: Fuzzer Architecture](internals/architecture/fuzz.md)
    - [Reference: Configuration Options](ref/config.md)

---

####<a name="analyser"></a>Analyser
: The component that compares contract traces with hardware traces to detect violations. It uses an equivalence class approach where it groups inputs by contract traces (ContractEqClasses) and then checks if they split into multiple hardware equivalence classes (HardwareEqClasses), which would indicate a violation.

!!! info "Related Documentation"
    - [Topic: Trace Analysis](topics/trace-analysis.md)
    - [Internals: Analyser Architecture](internals/architecture/analysis.md)
    - [Reference: Configuration Options - analyser](ref/config.md)

---

####<a name="actor"></a>Actor
: A partition of the sandbox representing a distinct execution context with specific isolation properties (e.g., a VM). An actor encompasses a code region, a data region with configurable permissions, and an execution context (CPU mode, privilege level, and system configuration). Actors enable testing for information leaks across different security domains.

!!! info "Related Documentation"
    - [Topic: Actors](topics/actors.md)
    - [Reference: Sandbox](ref/sandbox.md)

---

####<a name="actor-non-interference"></a>Actor Non-Interference
: A specialized mode of testing in Revizor, where, on top of testing for standard contract violations, the tool also checks that there are no information flows between different actors in a multi-actor test case. This mode is used to verify isolation properties between security domains, ensuring that secret data in one actor does not influence observable behavior in another actor.

!!! info "Related Documentation"
    - [Topic: Actors](topics/actors.md)

---

####<a name="observer-actor"></a>Observer Actor
: An actor marked as an observer in the configuration, representing an attacker that can observe data leaks in multi-actor testing scenarios. This is used in conjunction with the Actor Non-Interference mode to check that secret data in other actors does not influence the traces in the observer actor.

!!! info "Related Documentation"
    - [Topic: Actors](topics/actors.md)
    - [Reference: Configuration Options](ref/config.md)

---

####<a name="rcbf"></a>RCBF (Revizor Code Binary Format)
: A custom binary format used to transfer test case programs between Revizor components. The format contains a header, actor table, symbol table, metadata, and code sections for each actor.

!!! info "Related Documentation"
    - [Reference: Binary Formats - RCBF](ref/binary-formats.md)

---

####<a name="rdbf"></a>RDBF (Revizor Data Binary Format)
: A custom binary format used to transfer input data between Revizor components. The format contains initialization data for sandbox memory and registers, and can combine multiple inputs into a single file for batch processing.

!!! info "Related Documentation"
    - [Reference: Binary Formats - RDBF](ref/binary-formats.md)

---

####<a name="template"></a>Template
: An assembly file that combines regular assembly instructions with placeholders to define a test case structure for the code generator. Such templates are used in a special template mode of Revizor, where the programs are generated by populating the placeholders with random instructions instead of generating programs from scratch.

!!! info "Related Documentation"
    - [How-to: Use Templates](howto/use-templates.md)
    - [Reference: Configuration Options](ref/config.md)

---

####<a name="macro"></a>Macro
: A special pseudo-instruction in test case programs that can be treated differently depending on whether the test case is executed by the model or the executor. One prominent example is VM transition macros, which handle switching between actors. A special type of macro is also used to implement the placeholders in templates.

!!! info "Related Documentation"
    - [How-to: Use Macros](howto/use-macros.md)
    - [Reference: Macro Reference](ref/macros.md)

---


================================================
FILE: docs/howto/ask-a-question.md
================================================
# Ask a Question

If you have a question about Revizor, there are several ways to reach out to us:

* For **any questions, no matter how big or small,** feel free to post them in our community [Zulip chat](https://rvzr.zulipchat.com/) where the community and developers can assist you.
* Alternatively, you can start a discussion on our [GitHub Discussions page](https://github.com/microsoft/side-channel-fuzzer/discussions) (this is preferable for longer questions that may require more in-depth answers).

Bug reports should be submitted to our [GitHub Issues page](https://github.com/microsoft/side-channel-fuzzer/issues).

For general information about Revizor, please refer to our [FAQ](../faq/general.md) page.


================================================
FILE: docs/howto/choose-contract.md
================================================
# How to Choose a Contract

This guide helps you select the appropriate [contract](../glossary.md#speculation-contract) for your fuzzing campaign. The contract determines which microarchitectural leaks Revizor will report as violations, making it a critical configuration choice that affects both what you find and how efficiently you find it.

!!! note "Prerequisites"
    Before choosing a contract, you should understand what contracts are and how they work. Read the [Contracts](../topics/contracts.md) topic guide if you need background on contract structure and purpose.


## Standard Fuzzing with CT-SEQ

Use CT-SEQ for most fuzzing campaigns. This contract assumes nothing about the target CPU except the presence of CPU caches, making it a zero-knowledge baseline for detecting unknown vulnerabilities. With CT-SEQ, Revizor reports any information leaks beyond the most trivial non-speculative cache accesses.

Configure CT-SEQ by setting the [observation clause](../glossary.md#observation-clause) to `ct` and the [execution clause](../glossary.md#execution-clause) to `seq`:

```yaml
contract_observation_clause: ct
contract_execution_clause:
  - seq
```

CT-SEQ provides the strictest security guarantees and will detect the widest range of vulnerabilities. Start with this contract unless you have specific reasons to use a different one.

## Continuing After Finding a Violation

When you find a violation with CT-SEQ and want to continue testing for additional vulnerabilities, you have two approaches.

The simpler and more efficient approach is to blocklist the instruction that triggered the violation. Use the [`instruction_blocklist_append`](../ref/config.md#instruction_blocklist_append) configuration option to exclude specific instructions from testing. For example, if a branch misprediction caused the violation, blocklist all conditional branch instructions:

```yaml
contract_observation_clause: ct
contract_execution_clause:
  - seq
instruction_blocklist_append:
  - jne
  - je
  # add other branch instructions
```

This approach lets you continue using CT-SEQ's fast and efficient detection while avoiding repeated reports of the same root cause.

Alternatively, you can incorporate the newly discovered speculation source into the contract by switching to a different execution clause. For violations caused by branch mispredictions, switch to the COND execution clause:

```yaml
contract_observation_clause: ct
contract_execution_clause:
  - cond
```

The CT-COND contract models speculative execution from branch mispredictions as expected behavior. Revizor will no longer report violations from this source, allowing you to search for other types of leaks in the same instruction set.

## Testing with Exceptions

If your fuzzing campaign includes code that may raise exceptions such as page faults or general protection faults, these exceptions will likely cause trivial violations under CT-SEQ. Modern CPUs implement out-of-order execution, which means instructions after a faulting instruction may begin executing before the CPU recognizes the exception. These subsequent instructions can leak information not predicted by CT-SEQ's strictly sequential model.

These violations typically represent known artifacts of out-of-order execution rather than genuine security issues. To suppress such trivial reports, use the CT-DEH contract instead. This contract models delayed exception handling, allowing instructions after a faulting instruction to execute transiently before the exception is handled:

```yaml
contract_observation_clause: ct
contract_execution_clause:
  - deh
```

CT-DEH remains strict about other speculation sources while accommodating the expected behavior around exceptions.

## Testing Cross-Domain Isolation

When testing isolation between security domains such as kernel versus user mode or host versus guest execution, use the Actor Non-Interference contract (CT-NI). This contract changes the security property being tested. Instead of only checking that inputs with identical [contract traces](../glossary.md#contract-trace) produce equivalent [hardware traces](../glossary.md#hardware-trace), CT-NI adds an additional requirement: the hardware traces observed by attacker actors must not depend on data from victim actors.

Configure CT-NI with the following observation clause:

```yaml
contract_observation_clause: ct-ni
```

You must also configure actors properly, designating which actors are observers (attackers) and which are victims. See [Actors](../topics/actors.md) for details on actor configuration.

## Investigating Known Vulnerabilities

When investigating variants of known vulnerabilities, use a contract that models the specific vulnerability class you are studying.

For Spectre V1 variant analysis, use the COND execution clause to model branch mispredictions as expected behavior:

```yaml
contract_observation_clause: ct
contract_execution_clause:
  - cond
```

This configuration lets you explore whether other instructions or gadget patterns can be exploited through branch misprediction without being distracted by the original Spectre V1 finding.

For other vulnerability classes, choose the execution clause that models the corresponding speculation mechanism. See the [Configuration Reference](../ref/config.md#contract_execution_clause) for a list of available execution clauses and their intended use cases.

## What's Next?

- Topic: [Contracts](../topics/contracts.md) - Understanding contract structure and behavior
- How-to: [Design a Fuzzing Campaign](design-campaign.md) - Complete campaign planning including contract selection
- Reference: [Configuration Options](../ref/config.md) - Complete list of contract and configuration parameters
- Glossary: [Contract](../glossary.md#speculation-contract), [Observation Clause](../glossary.md#observation-clause), [Execution Clause](../glossary.md#execution-clause)


================================================
FILE: docs/howto/design-campaign.md
================================================
# How to Design a Fuzzing Campaign

This guide shows you how to design and configure a fuzzing campaign for detecting speculative execution vulnerabilities. A campaign consists of three components: a configuration file (YAML), command-line arguments, and optionally a template file (ASM).

!!! note "Prerequisites"
    - Revizor installed and the executor kernel module loaded
    - Basic understanding of [contracts](../topics/contracts.md) and what you want to test

## Select Instruction Set

Choose which instruction subset to test. Smaller subsets are more effective because violations are found faster and root-cause analysis is simpler. For comprehensive ISA coverage, split testing into multiple targeted campaigns rather than running a single large campaign.

Specify instruction categories in your configuration file using `instruction_categories`:

```yaml
instruction_categories:
  - BASE-BINARY      # arithmetic instructions
  - BASE-STRINGOP    # string operations
  - BASE-LOGIC       # logical operations
```

Verify which instructions are included by enabling debug logging:

```yaml
logging_modes: ['info', 'stat', 'dbg_generator']
```

For fine-grained control over the instruction set, see the [Configuration Reference](../ref/config.md#instruction_categories).

## Configure Exception Testing

Enable exception testing using the `faults_allowlist` option:

```yaml
faults_allowlist:
  - div-by-zero              # division by zero exceptions
```

Ensure the corresponding instructions are included in your instruction set. For example, `div-by-zero` requires division instructions in the tested pool.

For testing Meltdown or Foreshadow-like vulnerabilities, configure memory access permissions through actor-specific `data_properties` and `data_ept_properties`:

```yaml
actors:
  - main:
      data_properties:
        present: false     # trigger page faults
        writable: false    # trigger write protection faults
```

See the [Sandbox Reference](../ref/sandbox.md) for details on memory permissions and the [Configuration Reference](../ref/config.md#faults_allowlist) for all exception handling options.

## Configure Actors for Multi-Domain Testing

For cross-domain leakage testing, define [actors](../glossary.md#actor) to represent different security domains:

```yaml
actors:
  - main:
      mode: host
      privilege_level: kernel
  - guest:
      mode: guest
      privilege_level: kernel
      observer: true
```

Create corresponding template files to specify transition sequences between actors. See [Actors](../topics/actors.md) for detailed instructions.

## Select Contract

Choose a [contract](../glossary.md#speculation-contract) that defines what execution behavior constitutes a violation. Contract selection depends on whether you are testing cross-domain leakage and which known vulnerabilities you want to filter out.

For detailed guidance on selecting the appropriate contract for your testing scenario, see [How to Choose a Contract](choose-contract.md).

Example configuration:

```yaml
contract_observation_clause: ct
contract_execution_clause:
  - seq
```

See the [Configuration Reference](../ref/config.md#contract_observation_clause) for all available contract options.

## Configure Noise Threshold

Adjust noise tolerance based on your system characteristics. Higher thresholds and larger sample sizes reduce false positives but may miss subtle leaks and decrease performance. Lower thresholds increase sensitivity but may produce false positives on noisy systems.

For high-noise systems:

```yaml
analyser_stat_threshold: 0.5      # conservative threshold
executor_sample_sizes: [50, 100, 500, 1000]
```

For low-noise systems:

```yaml
analyser_stat_threshold: 0.1      # sensitive threshold
executor_sample_sizes: [10, 50, 100]
```

Start with low-noise settings and increase thresholds if you encounter non-reproducible violations. See the [Trace Analysis Guide](../topics/trace-analysis.md#statistical-trace-comparison) for more information on noise handling.

## Enable Reproducibility

Set deterministic seeds to make the campaign reproducible:

```yaml
program_generator_seed: 12345     # deterministic program generation
data_generator_seed: 67890        # deterministic input generation
```

Reproducible campaigns are essential for debugging and comparing results across different runs.

## Configure Test Case Shape

Control the structure of generated test cases:

```yaml
program_size: 64                  # instructions per program
avg_mem_accesses: 32              # average memory accesses
min_bb_per_function: 1            # minimum basic blocks per function
max_bb_per_function: 2            # maximum basic blocks per function
min_successors_per_bb: 1          # minimum successors per basic block
max_successors_per_bb: 1          # maximum successors per basic block
```

Larger programs may find more complex interactions but require longer analysis time. Start with smaller programs and increase size if needed.

## Use Templates for Targeted Testing

Use templates when targeting specific microarchitectural scenarios. Templates define fixed assembly structures with random instruction insertion, allowing you to focus on specific patterns while maintaining variability.

Example template:

```asm
.section .data.main
.function_main_0:
    # Fixed initialization
    mov rax, 0

    # Random instruction sequence
    .macro.random_instructions.32.0:

    # Fixed measurement
    .macro.measurement_start:
    mov rbx, [r14]
    .macro.measurement_end:

.test_case_exit:
```

See [How to Use Templates](use-templates.md) for detailed template syntax and the [Macro Reference](../ref/macros.md) for available macros.

## Complete Example

This campaign tests whether division-by-zero exceptions cause unexpected information leakage on the target CPU. It focuses on simple arithmetic instructions to isolate exception handling behavior and answers the question: "Does division by zero on this CPU leak information through microarchitectural side channels?"

The configuration assumes a CPU with relatively low non-determinism, using moderate sample sizes and a conservative statistical threshold. The campaign uses the DEH (Delayed Exception Handling) contract to filter out trivial cases of out-of-order handling of the exception. Test cases are kept small (32 instructions, no branches) to simplify analysis and accelerate violation detection. Each campaign iteration generates 100 different inputs per test case to explore various data-dependent behaviors around division operations.

```yaml
# Instruction selection
instruction_categories:
  - BASE-BINARY

# Exception handling
faults_allowlist:
  - div-by-zero

# Contract
contract_observation_clause: ct
contract_execution_clause:
  - deh

# Noise handling
analyser_stat_threshold: 0.2
executor_sample_sizes: [10, 50, 100, 500]

# Reproducibility
program_generator_seed: 12345
data_generator_seed: 67890

# Test case shape: 32 instructions with no branches
program_size: 32
avg_mem_accesses: 16
min_bb_per_function: 1
max_bb_per_function: 1

# Single actor
actors:
  - main:
      mode: host
      privilege_level: kernel
      data_properties:  # no page faults
        present: true
        writable: true

# Debugging
logging_modes: ['info', 'stat', 'dbg_generator']
```

Launch the campaign:

```bash
rvzr fuzz -s base.json -c config.yaml -n 100000 -i 100 -w ./violations --timeout 3600
```


## What's Next?

- How-to: [Choose a Contract](choose-contract.md) - Select the appropriate contract for your testing scenario
- How-to: [Use Templates](use-templates.md) - Create targeted test cases
- How-to: [Interpret Results](interpret-results.md) - Understand fuzzing output
- Topic: [Actors](../topics/actors.md) - Configure multi-domain testing
- Topic: [Contracts](../topics/contracts.md) - Understanding leakage contracts
- Topic: [Test Case Generation](../topics/test-case-generation.md) - How test cases are generated
- Reference: [Configuration Options](../ref/config.md) - Complete configuration reference
- Reference: [CLI Reference](../ref/cli.md) - Command-line interface reference


================================================
FILE: docs/howto/interpret-results.md
================================================
# How to Interpret Violation Results

So you've run a fuzzing campaign and found a violation. Now what?

This guide will help you understand and validate violations detected by Revizor. It explains the structure of violation artifacts, how to reproduce violations, and how to interpret the output to determine whether a violation is genuine and worth investigating.

!!! info "Prerequisites"
    Before starting, ensure you have:

    - Revizor installed and functional on the target system
    - A violation directory (`violation-<timestamp>`) produced during fuzzing
    - The configuration file (`config.yaml`) used in the original fuzzing campaign
    - Access to the same hardware where the violation was detected

## Violation Message

When Revizor detects a violation during fuzzing, it prints a summary message to the console similar to this:

```plaintext
(venv-3.12) main ➜  revizor ./revizor.py fuzz -s base.json -c demo/detect-v1.yaml -n 1000 -i 100 -w ./

INFO: [prog_gen] Setting program_generator_seed to random value: 599740

INFO: [fuzzer] Starting at 15:39:42
17    ( 2%)| Stats: Cls:0/0,In:200,R:7,SF:10,OF:7,Fst:0,CN:0,CT:0,P1:0,CS:0,P2:0,V:0> Priming  27             . to 500

================================ Violations detected ==========================
Violation Details:

-----------------------------------------------------------------------------------
                             HTrace                              | ID:92  | ID:192|
-----------------------------------------------------------------------------------
^...^...................^...........^.........^................. | 497    | 0     |
^...^........................................................... | 3      | 2     |
^^..^...........................................^.........^..... | 0      | 498   |


================================ Statistics ===================================

Test Cases: 18
Inputs per test case: 200.0
Violations: 1
Effectiveness:
  Total Cls: 98.0
  Effective Cls: 98.0
Discarded Test Cases:
  Speculation Filter: 10
  Observation Filter: 7
  Fast Path: 0
  Max Nesting Check: 0
  Tainting Check: 0
  Early Priming Check: 0
  Large Sample Check: 0
  Priming Check: 0

Duration: 40.5
Finished at 15:40:23
```

Most of the output is statistics, and they are mostly irrelevant for interpreting the violation itself. You can find a detailed explanation of the runtime statistics in the [Statistics Reference](../ref/runtime-statistic.md).

The relevant part for interpreting the violation is the `Violation Details` section:

```
-----------------------------------------------------------------------------------
                             HTrace                              | ID:92  | ID:192|
-----------------------------------------------------------------------------------
^...^...................^...........^.........^................. | 497    | 0     |
^...^........................................................... | 3      | 2     |
^^..^...........................................^.........^..... | 0      | 498   |
```

This section summarizes the hardware trace samples recorded for the inputs that triggered the violation.

Let's break it down.

### Violating Inputs

```
| ID:92  | ID:192|
```

This block tells us which inputs produced the violation. In this case, it's inputs 92 and 192. You can find them in the violation artifact directory as `input_92.bin` and `input_192.bin`.

### Hardware Traces

```
^...^...................^...........^.........^.................
^...^...........................................................
^^..^...........................................^.........^.....
```

This block shows a visual representation of all observed hardware traces for these inputs. In this example, we used Revizor's default P+P (Prime+Probe) cache side channel tracer, which records the state of L1D cache after a test case execution. The `^` character indicates that a cache line was accessed (evicted by the test case program), while the `.` character indicates that the cache line was not accessed. The complete line is a bitmap of all 64 L1D cache sets available on the target machine, numbered left to right from 0 to 63.

Accordingly, the first line is interpreted as follows:

```

    Set 4 accessed                  Set 36 accessed
    |                               |         Set 46 accessed
    |                               |         |
^...^...................^...........^.........^.................
|                       |
Set 0 accessed          Set 24 accessed
```

meaning that cache sets with IDs 0, 4, 24, 36, and 46 were accessed in this hardware trace.


!!! tip "Colors!"
    Enable `color: true` in the configuration file to improve readability of hardware trace visualizations.

### Trace Distribution

```
... | 497    | 0     |
... | 3      | 2     |
... | 0      | 498   |
```

Finally, this block shows the [statistical distribution](../topics/trace-analysis.md#statistical-trace-comparison) of hardware traces for each input. For example, input 92 produced the first hardware trace 497 times (out of the total of 500 measurements), while input 192 never produced that trace. Instead, input 192 produced the third hardware trace 498 times.

### Analysis

By looking at this table, we can deduce two important facts about the violation:

1. There is a clear difference in the sample distributions for the two inputs. This indicates a genuine violation rather than random noise.
2. The dominant (most frequently observed) hardware traces for the two inputs have evicted distinct sets of cache lines. This is an indirect clue that the test case had a data-dependent memory access pattern that was not predicted by the contract (likely due to speculative execution).

## Violation Artifact

When Revizor detects a violation, it creates a directory named `violation-<timestamp>`, with the following structure:

```
violation-<timestamp>/
├── program.asm
├── input_0.bin
├── input_1.bin
├── ...
├── report.txt
├── org-config.yaml
├── reproduce.yaml
└── minimize.yaml
```

 The `program.asm` file holds the test case program that triggered the violation. The `input_*.bin` files contain the input sequence that exposed the leak. The `report.txt` file provides additional details including hardware and contract traces. The configuration files include `org-config.yaml` (the original configuration), `reproduce.yaml` (for reproducing the violation), and `minimize.yaml` (for test case minimization).

Before proceeding with analysis, locate this directory and verify that all required files are present.

## Reproducing the Violation

It is usually a good idea to first reproduce the violation outside of the fuzzing campaign. This confirms that the violation is stable and not a transient artifact of noise or a misconfiguration of the fuzzer.

```bash
rvzr reproduce -s base.json -c ./violation-<timestamp>/reproduce.yaml \
    -t ./violation-<timestamp>/program.asm -i ./violation-<timestamp>/input_*.bin
```

If Revizor prints "Violation detected" in the output, the violation reproduced successfully. The distribution of hardware traces should roughly match the original violation. Significant differences may indicate a bug or misconfiguration in the fuzzer (e.g., random seeds).

Non-reproducible violations should be rare, typically no more than one or two per machine per week of fuzzing. If your campaign produces more, adjust the configuration file to increase noise tolerance. See the [configuration options reference](../ref/config.md) for details on noise-related parameters.


## Evaluating Violation Quality

Several factors determine whether a violation is worth investigating further.

*Reproducibility* is the most important criterion. Violations that consistently reproduce across multiple runs indicate stable, genuine leaks. Sporadic violations that appear and disappear may be false positives caused by noise. In such cases, consider adjusting noise tolerance settings ([`analyser_stat_threshold`](../ref/config.md#analyser_stat_threshold) and/or [`executor_sample_sizes`](../ref/config.md#executor_sample_sizes)) in the configuration file and rerunning the fuzzing campaign.

*Trace distribution* provides additional insight. Clean violations show clear separation between inputs with consistent occurrence counts. Messy violations with overlapping traces or highly variable counts suggest non-determinism and may be harder to analyze. In such cases, consider collecting more samples per input by increasing the [`executor_sample_sizes`](../ref/config.md#executor_sample_sizes) configuration option (note: this will slow down fuzzing).

Finally, *the hardware trace pattern* can be informative as well. There is no hard rule here, but if you see lots of accessed cache sets while the configuration is supposed to limit the number of memory accesses to only a few, that may indicate that some CPU feature creates additional noise, beyond the ability of the statistical analyzer to filter it out. In practice, this is often due to prefetchers. It is typically a good idea to disable them, unless you are specifically testing for prefetcher-related leaks.

## Next Steps

Once you have confirmed that a violation is reproducible and worth investigating, proceed to minimize the violation artifacts and root-cause the leak. See the [How to Minimize Test Cases](minimize.md) and [How to Root-Cause a Violation](root-cause-a-violation.md) guides for detailed instructions.

## See Also

- [How to Root-Cause a Violation](root-cause-a-violation.md) - Systematic analysis of confirmed violations
- [How to Design a Fuzzing Campaign](design-campaign.md) - Tuning fuzzer parameters for better results
- [How to Minimize Test Cases](minimize.md) - Simplifying violation artifacts for analysis
- [Configuration Options](../ref/config.md) - Detailed configuration parameter reference
- [Execution Modes](../ref/modes.md) - Understanding reproduce mode and other execution modes
- [Trace Analysis and Violation Detection](../topics/trace-analysis.md) - How Revizor detects and analyzes violations
- [Contracts and Leakage Models](../topics/contracts.md) - Understanding contract semantics


================================================
FILE: docs/howto/minimize.md
================================================
# How to Minimize Test Cases

This guide discusses the process of test case minimization, which aims to reduce the complexity of violation artifacts by simplifying test programs and input sequences while preserving the violation. This is typically a post-processing step performed after a fuzzing campaign has detected a violation, with the goal of producing a minimal test case suitable for human analysis and root-cause investigation.

The minimization is done by using Revizor's `minimize` mode, which post-processes a violation through a series of transformation passes that simplify both the test program and input sequence.

!!! note "Related Documentation"
    For a complete list of available passes and their detailed descriptions, see the [Minimization Passes reference](../ref/minimization-passes.md).

!!! info "Prerequisites"
    Before starting, ensure you have:

    - Revizor installed and functional on the target system
    - A violation directory (`violation-<timestamp>`) produced during fuzzing
    - The configuration file (`config.yaml`) used in the original fuzzing campaign
    - Access to the same hardware where the violation was detected

## Basic Usage

Run the minimizer with the following syntax:

```bash
rvzr minimize -s <spec_file> -c <config_file> -t <program_file> -o <output_file> \
    -i <num_inputs> --input-outdir <input_outdir> --num-attempts <num_attempts> \
    [pass_options]
```

Parameters:

- `-s`: Path to ISA specification (e.g., `base.json`)
- `-c`: Path to configuration file (typically `minimize.yaml` from violation directory)
- `-t`: Path to test program (typically `program.asm` from violation directory)
- `-o`: Output path for minimized program
- `-i`: Number of inputs in the sequence (must match the original fuzzing campaign)
- `--input-outdir`: Directory to store minimized input files
- `--num-attempts`: Number of minimization iterations to perform
- `[pass_options]`: Enable specific minimization passes (see [Minimization Passes](../ref/minimization-passes.md))

Example command (assuming a violation directory named `violation-0000-0000`):

```bash
rvzr minimize -s base.json -c violation-0000-0000/minimize.yaml -t violation-0000-0000/program.asm \
    -i 25 --input-outdir ./min-inputs --num-attempts 10 --enable-instruction-pass 1 \
    -o min.asm
```

This command generates an input sequence of 25 inputs based on the seed in `violation-0000-0000/minimize.yaml`, applies the instruction removal pass 10 times to simplify `program.asm`, and writes the minimized program to `min.asm`. The simplified input sequence is stored in `./min-inputs`.

## Interpreting the Output

Each minimization pass prints progress indicators to the console as it executes. Understanding this output helps verify that minimization is progressing correctly.

### Program Pass Output

Program passes display one character per instruction to indicate success or failure:

- `.` indicates the pass succeeded on this instruction (e.g., instruction was successfully removed)
- `-` indicates the pass failed on this instruction (e.g., removing this instruction breaks the violation)

Example output when running `--enable-instruction-pass`:

```
[Pass 2] Instruction Removal Pass

.............-.....--.-------..----
```

Note that the pass iterates from the end of the program to the beginning, and the characters are printed in that order: the leftmost character corresponds to the last instruction of the program. In this example, the pass successfully removed the last 13 instructions, failed on the 14th instruction from the end, succeeded on the 15th, and so on.

### Input Pass Output

The `input-diff` pass uses a memory-map visualization to show minimization progress. Each character represents one byte in the input sequence:

- `.` indicates zeroing the byte succeeded
- `+` indicates copying the byte from the first input to the second succeeded
- `=` indicates the byte was already identical in both inputs
- `^` indicates the pass could not minimize this byte (it remains different between inputs)

Example output from `--enable-input-diff-pass`:

```
Address    +0x0     +0x40    +0x80    +0xc0    +0x100   +0x140   +0x180   +0x1c0
0x00000000 ........ ........ ........ ........ ........ ........ ........ ........
0x00000200 ........ ........ ........ ........ ........ ........ ........ ........
0x00000400 ........ ........ ........ ........ ........ ........ ........ ........
0x00000600 ........ ........ ........ ........ ........ ........ ........ ........
0x00000800 ........ ........ ........ ........ ........ ........ ........ ........
0x00000a00 ........ ........ ........ ........ ........ ........ ........ ........
0x00000c00 ........ ........ ........ ........ ........ ........ ........ ........
0x00000e00 ........ ........ ........ ........ ........ ........ ........ ........
0x00001000 ........ ........ ........ ........ ........ ........ ........ ........
0x00001200 ........ ........ ........ ........ ........ ........ ........ ........
0x00001400 ........ ........ ........ ........ ........ ........ ........ ........
0x00001600 ........ ........ ........ ........ ........ ........ ........ ........
0x00001800 ........ ........ ........ ........ ........ ........ ........ ........
0x00001a00 ........ ........ ........ ........ ........ ........ ........ ........
0x00001c00 ........ ........ ........ ........ ........ ........ ........ ........
0x00001e00 ........ ........ ........ ........ ........ ........ ........ ........
0x00002000 ====^=..
0x00002040 ........ ........ ........ ........
  > Result: Leaked 1 bytes
  > Addresses: ['0x2020']
```

This output shows that the pass successfully minimized most input differences. The byte at address `0x2020` (marked with `^`) remains different between the two inputs and likely contributes to the violation. Bytes at addresses `0x2000-0x2018` and `0x2028` (marked with `=`) were already identical.

### Comment Pass Output

Enable `--enable-comment-pass` to annotate the minimized program with analysis information. The pass inserts comments indicating which memory accesses contributed to the violation, making it easier to identify the root cause.

Comment format:

```
# mem access: [input1_id] [load_addr]-[store_addr]
  CL [cache_set_id]:[cache_line_offset] | [input2_id] [load_addr]-[store_addr]
  CL [cache_set_id]:[cache_line_offset]
```

Each comment shows the memory addresses accessed by an instruction when executed with the two inputs that triggered the violation. The comment includes both virtual addresses and their corresponding L1D cache set IDs and line offsets.

Example comment:

```asm
# mem access: [1] 0x800-0x800 CL 32:0 | [11] 0x710-0x710 CL 28:10
```

This indicates that when executed with input 1, the instruction accessed address `0x800` (cache set 32, offset 0), and when executed with input 11, it accessed address `0x710` (cache set 28, offset 10). These different cache set accesses likely contributed to the violation.

## Complete Workflow Example

This example demonstrates a typical minimization workflow. Assume a fuzzing campaign detected a violation:

```bash
rvzr fuzz -s base.json -c config.yaml -n 1000 -i 25 -w .
```

The fuzzer created a violation directory (e.g., `violation-000000-000000`) containing the test case artifacts.

### Step 1: Minimize the Program

Apply all program passes to simplify the test case while preserving the violation:

```bash
rvzr minimize -s base.json -c ./violation-000000-000000/minimize.yaml \
    -t ./violation-000000-000000/program.asm \
    -o min.asm -i 25 --num-attempts 3 \
    --enable-instruction-pass 1 \
    --enable-simplification-pass 1 \
    --enable-nop-pass 1 \
    --enable-constant-pass 1 \
    --enable-mask-pass 1 \
    --enable-label-pass 1
```

### Step 2: Verify Program Minimization

Confirm the minimized program still triggers the violation:

```bash
rvzr fuzz -s base.json -c ./violation-000000-000000/minimize.yaml -t min.asm -i 25
```

If the violation is no longer detected, reduce `--num-attempts` or disable some passes, then retry step 1.

### Step 3: Minimize Inputs and Add Annotations

Apply input passes and analysis passes to further simplify the test case and add helpful comments:

```bash
rvzr minimize -s base.json -c ./violation-000000-000000/minimize.yaml \
    -t min.asm -o commented.asm -i 25 \
    --input-outdir ./inputs \
    --enable-input-diff-pass 1 \
    --enable-input-seq-pass 1 \
    --enable-comment-pass 1
```

### Step 4: Verify Complete Minimization

Reproduce the violation with the minimized program and inputs:

```bash
rvzr reproduce -s base.json -c ./violation-000000-000000/reproduce.yaml \
    -t commented.asm -i ./inputs/min_input*.bin
```

If successful, the minimized test case in `commented.asm` and `./inputs/` is ready for detailed analysis. The annotated comments will help identify the root cause of the violation.

!!! tip "Troubleshooting Failed Minimization"
    If minimization breaks the violation, try these adjustments:

    - Reduce `--num-attempts` to perform fewer iterations
    - Disable aggressive passes like `--enable-simplification-pass`
    - Minimize the program before minimizing inputs
    - Check that `data_generator_seed` matches the original fuzzing campaign


## What's Next?

Once a violation is minimized, the next step is typically to analyze it manually to understand the root cause. The [How to Root-Cause a Violation](root-cause-a-violation.md) guide is dedicated to this topic.

## See Also

- [Minimization Passes](../ref/minimization-passes.md) - Complete list of available passes and their options
- [CLI Reference](../ref/cli.md) - Full command-line interface documentation
- [Execution Modes](../ref/modes.md) - Overview of all Revizor execution modes
- [Configuration Options](../ref/config.md) - Configuration file reference including `data_generator_seed`
- [How to Design a Fuzzing Campaign](design-campaign.md) - Set up effective fuzzing campaigns
- [How to Interpret Results](interpret-results.md) - Understand fuzzing outputs and violation reports
- [Trace Analysis and Violation Detection](../topics/trace-analysis.md) - Understanding how violations are detected


================================================
FILE: docs/howto/root-cause-a-violation.md
================================================
# How to Root-Cause a Violation

This guide discusses in detail how to identify the root cause of confirmed contract violations. It shows a typical workflow and some useful techniques for analyzing violation artifacts and isolating the specific CPU behavior that leads to information leakage.

!!! warning "Art, Not Science"
    Root-causing violations is more art than science. The techniques described here are not guaranteed to work in every situation because violations can arise from a wide variety of complex CPU behaviors. Use your intuition and knowledge of microarchitecture to guide your analysis. Experiment with different approaches and document what works best for you.

!!! info "Prerequisites"
    This guide assumes you have already finished a [fuzzing campaign](design-campaign.md) and [minimized the violation artifacts](minimize.md).

## Locate the Violation Files

We will explore the root-cause analysis through a concrete example. The example will demonstrate a CT-SEQ contract violation on an x86-64 CPU.

We will be working with:

- The violation artifact in `violation-0000-0000/` produced during fuzzing
- A minimized version of the violation program in `min.asm` produced by the minimizer
- A set of minimized input files in `./inputs/min_input_*.bin` produced by the minimizer
- The configuration file `config.yaml` used during fuzzing

## Gather Insights from Minimizer

A good starting point is to examine the output of the minimizer, especially from input minimization passes. These passes attempt to reduce the differences between inputs that trigger the violation, and thus they often highlight the specific data values that leak and that impact the violation.

Below is an example of the printed summary from the differential input minimizer:

```
[PASS 2] Differential Input Minimizer
  > Minimizing the difference between inputs 1 and 11

Address    +0x0     +0x40    +0x80    +0xc0    +0x100   +0x140   +0x180   +0x1c0
0x00000000 ........ ........ ........ ........ ........ ........ ........ ........
0x00000200 ........ =....... ........ ........ ........ ........ ........ ........
0x00000400 ........ ........ ........ ........ ........ ........ ........ ........
0x00000600 ........ ........ ........ ........ ........ ........ ........ ........
0x00000800 ........ ........ ........ ........ ........ ........ ........ ........
0x00000a00 ........ ........ ........ ........ ........ ........ ........ ........
0x00000c00 ........ ........ ........ ........ ........ ........ ........ ........
0x00000e00 ........ ........ ........ ........ ........ ........ ........ ........
0x00001000 ........ ........ ........ ........ ........ ........ ........ ........
0x00001200 ........ ........ ........ ........ ........ ........ ........ ........
0x00001400 ........ ........ ........ ........ ........ ........ ........ ........
0x00001600 ........ ........ ........ ........ ........ ........ ........ ........
0x00001800 ........ ........ ........ ........ ........ ........ ........ ........
0x00001a00 ........ ........ ........ ........ ........ ........ ........ ........
0x00001c00 ........ ........ ........ ........ ........ ........ ........ ........
0x00001e00 ........ ........ ........ ........ ........ ........ ........ ........
0x00002000 .....^..
0x00002040 ........ ........ ........ ........
  > Result: Leaked 1 bytes
  > Addresses: ['0x2028']
```

The minimizer goes through the pair of inputs that trigger the violation - inputs #1 and #11 in this case - and tries to minimize the differences between them:

* If both inputs already have identical values at a given address, the minimizer prints `=` for that address. In this example, this is the case for address `0x240`.
* Next, the pass attempts to zero out one byte at a time in both inputs. If the violation persists, then the minimizer prints `.` for that address. In this example, most of the addresses are zeroed out.
* Next, the pass attempts to copy one byte from input #1 into the same address in input #11. If the violation persists, then the minimizer prints `+` for that address. This example does not have such cases.
* If both attempts fail, the pass restores the original values at the given address, prints `^`, and moves to the next address. In this example, the minimizer restored the original value at address `0x2028`.

The interpretation of these results is case-specific, but generally, the values with `+` or `=` are those that create conditions for leakage, and the values with `^` are the addresses whose value leaks.

In this example, the minimizer found that this test case leaks one byte at address `0x2028` (used to initialize RDI). The minimizer also found that the address `0x240` must contain specific non-zero values that must be the same in both inputs. This address in the input is used to initialize the corresponding offset in the sandbox of actor 0. See [Sandbox Memory Layout](https://microsoft.github.io/side-channel-fuzzer/user/sandbox/) for more details about register and memory initialization.

!!! tip "Minimizer Behavior"
    Ideally, the minimizer should be able to reduce the leakage to a single byte. If more than a couple of bytes leak, it typically indicates that the violation is non-deterministic, and it might be a good idea to re-run the program minimizer or to change the configuration to increase the number of attempts/increase the noise threshold. If *no* bytes leak, this is a certain sign that something went wrong; re-run the minimizer.

## Add Comments to Minimized Program

Run the minimizer again with the `comment` pass enabled to annotate the minimized program with memory access information. This will help you map hardware traces to specific instructions in the program.

```bash
rvzr minimize -s base.json -c ./violation-0000-0000/minimize.yaml \
    -t min.asm -o commented.asm -i <num_inputs> \
    --enable-comment-pass 1
```

## Insert Speculation Fences

To isolate speculative behavior, add fences:

```bash
rvzr minimize -s base.json -c ./violation-0000-0000/minimize.yaml \
    -t commented.asm -o fenced.asm -i <num_inputs> \
    --enable-fence-pass 1
```

This pass will attempt to insert an `LFENCE` after every instruction in the program and check if the violation still occurs.

In the resulting file (`fenced.asm`) the region *without* fences is the one that causes the violation. The remaining instructions are just setting up the data for the violation, and are likely irrelevant.

!!! warning "Unexpected Fence Insertion Results"
    If an `LFENCE` is inserted after *every* instruction in the test case and the violation still occurs, this is most likely due to a bug in the model or the executor. If you are using a custom model, consider checking the model for correctness. If you haven't made changes to the Revizor source code, please open an issue in the [bug tracker](https://github.com/microsoft/side-channel-fuzzer/issues).

## Map Hardware Traces to Minimized Program and Data

When both the program and its inputs are minimized, you should be able to identify which instructions caused the cache accesses in the hardware traces and which data was leaked.

When we run the `reproduce` command with the minimized program and inputs, we will see the following hardware traces:

```bash
rvzr reproduce -s base.json -c ./violation-0000-0000/reproduce.yaml \
    -t commented.asm -i ./inputs/min_input*.bin

...

================================ Violations detected ==========================
-----------------------------------------------------------------------------------
                             HTrace                              | ID:1   | ID:11 |
-----------------------------------------------------------------------------------
^...............................................^............... | 420    | 0     |
^............................................................... | 80     | 0     |
^..............^................................................ | 0      | 500   |
```

!!! tip "Input IDs"
    If in your case the input IDs have changed after minimization, you can either exclude some of the inputs from the arguments of the `reproduce` command, or re-run the minimizer with fewer passes.

We see that the hardware traces have been significantly simplified compared to the original violation, and now there are at most two accessed cache sets in each trace: 0 and 48 for input #1, and 0 and 15 for input #11. This is a good sign: the minimization was successful.

We can also tell that the only difference between the two traces is the accessed cache set: 48 vs 15. This is the cache set that is causing the violation, and we should be aiming to find the instruction that does the access.

To do so, let's look at the contents of the `commented.asm` file. This file contains the minimized program with comments that show which memory addresses or cache lines are accessed by each instruction.

```assembly
; ... skipped header ...
1.  and rax, 0b1111111111111 # instrumentation
2.  lfence
3.  mov edx, dword ptr [r14 + rax]
4.  # mem access: [1] 0x0 cl 0:0 | [11] 0x0 cl 0:0
5.  or cx, 0b1000 # instrumentation
6.  and cl, 0b11111000 # instrumentation
7.  and dx, 0b11 #
8.  and rsi, 0b1111111111111 #
9.  add cl, 39 #
10. mov rbx, 0b1111111111111 #
11. bt si, dx
12. jbe .bb_0.1
13. jmp .exit_0
14. .bb_0.1:
15. mov ecx, edi
16. and rcx, 0b1111111111000 # instrumentation
17. mov byte ptr [r14 + rcx], 88
; ... skipped footer ...
```

This program contains only two memory accesses, at lines 3 and 17.

The [annotation](minimize.md#comment-pass-output) at line 4 tells us that the `mov` instruction accesses memory offset `0x0` when executed with input 1 (`[1]`) and the same offset when executed with input 11 (`[11]`). The notation `0:0` stands for cache set `0` and cache line offset `0`.

This information lets us map this instruction to the first access in the hardware trace:

```plaintext
    ^...............................................^...............
    |
  This eviction maps to `mov edx, dword ptr [r14 + rax]` at line 3
```

The second memory access (line 17) does not have an annotation, which implies that the contract model has not executed this instruction with the inputs provided. It does not, however, mean that the CPU has not executed this instruction, as there is a chance that this instruction was executed speculatively. This is a typical scenario in violations detected by Revizor.

If we look at the instructions prior to the memory access, we can see a `jbe` instruction at line 12, which is a conditional jump - a common source of speculation, namely branch prediction. This type of speculation is not permitted by the target contract (CT-SEQ), so it could cause a violation. From this, we can make a hypothesis that the memory access at line 17 is speculative and is the one causing the second cache access:

```plaintext
 Inputs [1]:
              Hypothesis: This eviction maps to `mov` at line 17
                                                  |
  ^...............................................^...............

 Inputs [11]:
  ^..............^................................................
                 |
           Hypothesis: This eviction maps to `mov` at line 17
```

To check if our hypothesis is correct, let's cross-reference this information with the leaked bytes from the differential input minimizer:

```plaintext
; .. skip zero bytes
0x00002000 .....^..
0x00002040 ........ ........ ........ ........
  > Result: Leaked 1 bytes
  > Addresses: ['0x2028']
```

This summary tells us that `rdi` has a differing value between inputs #1 and #11. At the same time, the first time `rdi` is used in the program is at line 15, where it is moved to `rcx`, and then later used as a part of the address in the memory access at line 17. This would make the speculative memory access at line 17 access different addresses with the two inputs, and would explain the difference between the hardware traces.

At this point, the hypothesis is more-or-less confirmed, and we can declare that the root cause of the leak was the misprediction of the `jbe` branch at line 12, which caused the speculative execution of the memory access at line 17, and which in turn leaked the value of `rdi`.

If we want to further increase our confidence, we can manually inspect the contents of the inputs at the address `0x2028` to see if the values correspond to the cache set ID that we observe in the hardware traces. This can be done by running the `hexdump` command on the input files:

```bash
$ hexdump -C ./inputs/min_input_0001.bin | grep 2020
00002020  00 00 00 00 00 00 00 00  1e 1c 4a 00 1e 1c 4a 00  |..........J...J.|
$ hexdump -C ./inputs/min_input_0011.bin | grep 2020
00002020  00 00 00 00 00 00 00 00  c8 13 58 00 c8 13 58 00  |..........X...X.|
```

The values are `0x4a1c1e004a1c1e` for input #1 and `0x5813c8005813c8` for input #11. These are masked with `0b1111111111000` by `and` at line 16 and become `7192` and `5064` respectively. If we translate these values to cache set IDs (`id = (addr % 0x1000) // 64`), we get `48` and `15`. These values match the cache set IDs that we observed in the hardware traces, which confirms our hypothesis.

If we want even more confidence, we can manually modify the input files (e.g., with the `hexedit` tool) to see if the hardware traces change when we modify the value of `rdi` in the input files.


---

## Modify the Program

In many cases, the minimization process will not provide a clear result as in the example above and you will not be able to make a specific hypothesis about the root cause of the violation. In such cases, you can try to modify the program in various ways to see if the violation still occurs. There are no strict rules on which modifications to make and you will have to rely on your intuition and knowledge of the target microarchitecture, but here are some general guidelines:

1. **Simplify Instructions**: Start by trying to manually replace instructions in `min.asm` with simpler ones. For example, replace complex instructions with memory operands with simple loads or stores.
2. **Increase/Decrease Aliasing**: Try to change the addresses of memory accesses to match (or not match if they already do) the addresses of other instructions. Such aliasing often triggers speculation (e.g., in Speculative Store Bypass or MDS attacks).
3. **Add/Remove Dependent Instructions**: If you have a hypothesis about which instruction triggers speculation, try adding or removing data-dependent instructions before it. This will change the size of the speculative window and might change hardware traces, which will give you more insight into the violation.
4. **Change Memory Permissions**: If the violation is related to memory accesses, try changing the permissions of the memory regions that are accessed by the program. For example, if the memory is read-only, try changing it to read-write. If the violation disappears, it might indicate that the violation is related to the permission checks in the CPU.
5. **Change Instruction Operands**: Try changing operands to add or remove data dependencies between instructions. For example, if you have a sequence of two moves `mov rax, [rax]; mov rbx, [rax]`, try changing the second move to `mov rbx, [rbx]` to see if the violation still occurs if there are no data dependencies between the instructions.

After each modification, run the `reproduce` command to see if the violation still occurs:

```bash
rvzr reproduce -s base.json -c ./violation-<timestamp>/reproduce.yaml \
    -t modified.asm -i ./inputs/min_input*.bin
```


!!! tip "Share Your Findings"
    If you find any other strategies that work well, please consider sharing them by opening a pull request to this documentation. We would love to hear about your experiences and learn from them.


## See Also

- [How to Interpret Violation Results](interpret-results.md) - Understanding and validating violations before root-cause analysis
- [How to Minimize Test Cases](minimize.md) - Complete minimization workflow and pass descriptions
- [Minimization Passes](../ref/minimization-passes.md) - Reference documentation for all minimization passes
- [Configuration Options](../ref/config.md) - Configuration parameters for reproduction and minimization
- [Command-Line Interface](../ref/cli.md) - Complete CLI reference for all execution modes
- [Sandbox Memory Layout](../ref/sandbox.md) - Understanding input file structure and register initialization
- [Trace Analysis and Violation Detection](../topics/trace-analysis.md) - How Revizor detects violations
- [Contracts and Leakage Models](../topics/contracts.md) - Understanding contract semantics


================================================
FILE: docs/howto/use-macros.md
================================================
# How To Use Macros

This document explains the concept of macros in Revizor and describes how to create test cases that use macros.

Note that macros are especially useful in the template-based mode of Revizor, so if you are not familiar, check out the [Template-Based Mode](../howto/use-templates.md) documentation as well.

## What is a macro?

Macros in Revizor are special pseudo-instructions that provide a flexible way to insert complex operations into test cases. They appear as labels of a special format in the assembly code but are dynamically expanded into actual implementations during execution by the model and the executor.

Macros solve two key challenges, especially in the context of multi-domain testing:

* Structuring: Enable insertion of pre-defined instruction sequences (like domain transitions or microarchitectural isolation primitives) within randomized test contexts
* Unification: Allow the same test case template to be instantiated differently across executor and model stages, accommodating differences in ISA support.

## Why use macros?

Macros exist to provide extra flexibility and convenience when creating test cases. There are certain operations that are cumbersome or impractical to express directly in assembly code, and macros serve to abstract away these complexities.


## Macro Definition and Usage

### Assembly Syntax

Macros use standard assembly syntax of a label with the `.macro` prefix:

```assembly
.macro.macro_name.argument1.argument2.argument3.argument4:
```

A macro can take at most four arguments. The arguments are strictly static; Revizor does not support dynamic arguments in macros, such as registers or memory addresses.


### Example Usage

A user can create a test case program where only a subset of instructions is measured by using `measurement_start` and `measurement_end` macros:

```asm
.intel_syntax noprefix
.section .data.main

... ; non-measured code here

.macro.measurement_start:

... ; measured code here

.macro.measurement_end:

... ; non-measured code here

.test_case_exit:
```

Revizor will automatically replace the macros with no-op operations of an ISA-dependent size, and record the location and the arguments of the macros in the test case metadata. When the executor and the model run the test case, they will recognize these macros and execute the corresponding logic. Note that the logic can be configurable, e.g., when the user has set `executor_mode: P+P` (prime+probe), the `measurement_start` macro will correspond to the Prime stage of the measurement, and `measurement_end` will correspond to the Probe stage.

See [Implementation Overview](#implementation-overview) for details on how macros are implemented in the executor and model.

## Implementation Overview

### Internal Representation of Macros

Revizor internally replaces all macros with a no-op placeholder of a fixed size (8 bytes for x86-64, 12 bytes for ARM64). This placeholder is used to maintain the original instruction flow while allowing the executor and model to recognize and handle macros dynamically. The macro location, type, and arguments are stored in the test case metadata, namely in the `SYMBOL TABLE` section of the [RCBF File Format](../ref/binary-formats.md), where `owner` is set to the actor ID of the actor that contains the macro, `offset` is the offset of the macro placeholder in the code section of the actor, `id` is the macro type (defined in [executor_km/include/macro_expansion.h](https://github.com/microsoft/side-channel-fuzzer/blob/main/src/x86/executor/include/macro_loader.h)), and `args` is a compressed representation of the macro arguments.

### Macros in Executor

Each actor's code section contains a dedicated memory region for macros, and the implementation is copied there during test case initialization. The executor copies the implementations of all macros into this section, and it replaces the macro placeholders with direct jumps to the corresponding implementations. The executor also inserts a return jump at the end of each macro implementation to return control flow back to the original instruction sequence.

For example, if we have a simple test case like this:

```asm
.macro.measurement_start:
... ; some code here
.macro.measurement_end:
.test_case_exit:
```

The executor will expand it as follows:

```asm
jump measurement_start_impl
lfence
.l1:
... ; some code here
jump measurement_end_impl
lfence
.l2:
.test_case_exit:

.macro_code_section:
measurement_start_impl:
... ; sequence of instructions that implements the macro
jump .l1  ; jump to the end of the macro section

measurement_end_impl:
... ; sequence of instructions that implements the macro
jump .l2  ; jump to the end of the macro section
```

Note that the executor also inserts LFENCE barriers after each macro jump. This is to ensure that the macro execution does not trigger straight-line speculation, which could interfere with the measurement process.


### Macros in Model

In the model, macros are implemented as dynamic callbacks. The model executes a hook function on every instruction execution, checking if the current instruction matches an entry in the symbol table. If a match is found, the model invokes the corresponding callback function to emulate the macro behavior.


================================================
FILE: docs/howto/use-templates.md
================================================
# How to Use Templates

Template-based mode (`tfuzz`) enables targeted testing of specific CPU scenarios by using predefined assembly templates that get expanded with random instructions. This mode narrows down the fuzzing space to focus on particular interaction patterns while maintaining randomization within those patterns.

## Overview

Template-based mode generates test cases from assembly templates containing macros that get dynamically expanded during generation. Templates define the structure and flow of test cases while allowing specific sections to be populated with random instructions based on configuration.

## Command Line Usage

Template-based mode is invoked using the `rvzr tfuzz` command. The invocation is almost identical to the normal `rvzr fuzz` mode, but it takes an additional `-t` or `--template` parameter to specify the assembly template file.

Invocation example:

```bash
rvzr tfuzz -t template.asm -c config.yaml -s base.json -n 10 -i 100
```

where `template.asm` is the template file.


## Template Structure

Templates are assembly files that combine:

- Regular assembly instructions
- Macros (special pseudo-instructions as described in [Macros](../ref/macros.md))

Example template:

```asm
.intel_syntax noprefix
.section .data.main

.macro.random_instructions.10.0:  ; Replaced with 10 random instructions
div rax, rbx                      ; rax and rbx may be set by random instructions
jmp .test_case_exit               ; Jump to exit point if no exception occurs

.fault_handler:
    .macro.random_instructions.10.1:  ; Generate 10 random instructions executed when a fault occurs

.test_case_exit:
```

Revizor will take this template and replace the `.macro.random_instructions.N` with N random instructions from the instruction pool defined in the configuration file. A new test case will be generated this way in each fuzzing round, allowing for a wide variety of test cases while still adhering to the structure defined in the template. For example, if `-n 10` is specified, the generator will produce 10 test cases based on the template, each with different random instruction sequences.


================================================
FILE: docs/index.md
================================================
---
title: "Revizor"
hide:
  - navigation
  - toc
---

<style>
.md-typeset h1,
.md-content__button {
    display: none;
}

.hero-section {
    text-align: center;
    max-width: 800px;
    margin: 0 auto;
}

.hero-section img {
    max-width: 320px;
    height: auto;
}

.hero-section p {
    margin: 0;
}

.hero-section .tagline {
    color: var(--md-default-fg-color--light);
    font-size: 1.5rem;
    font-weight: 300;
    margin-top: 1.0rem;
    margin-bottom: 5rem;
}

.grid.cards > ul > li {
    text-align: center;
}

.grid.cards > ul > li > p > strong{
    font-size: 1.1rem;
}

.grid.cards > ul > li > p.text {
    text-align: justify;
    margin: 1rem;
}

.grid.cards > ul > li .md-button {
    margin: 0.25rem;
}

h2 {
    text-align: center;
    margin-top: 3rem;
    margin-bottom: 1rem;
}

h2 > strong {
    font-weight: 700;
    font-size: 1.8rem;
}


</style>

<div class="hero-section" markdown>

<img src="./assets/logo.svg#only-light" alt="Revizor Logo" align="center" width="320px" />
<img src="./assets/logo-light.svg#only-dark" alt="Revizor Logo" align="center" width="320px" />

<p class="tagline">Hardware fuzzing for the age of speculation</p>

</div>

<div class="grid cards" markdown>

-   __:fontawesome-solid-arrow-right: Get Started__

    ---

    <p class="text">
    Welcome to the Revizor documentation! Whether you're a new user looking to get started or a developer interested in contributing, you'll find all the information you need here.
    </p>

    [Start Here](intro/start-here.md){ .md-button .md-button--primary }
    [Learn Revizor](intro/01-overview.md){ .md-button }
    [Ask a Question](howto/ask-a-question.md){ .md-button }
    [Cite Revizor](ref/papers.md){ .md-button }


- __:fontawesome-solid-code: Source Code__

    ---

    <p class="text">
    The Revizor project lives on GitHub. Explore the source code, report issues, and contribute to the project.
    </br></br></br>
    </p>


    [GitHub](https://github.com/microsoft/side-channel-fuzzer){ .md-button }
    [Contributing](internals/contributing/overview.md){ .md-button }
    [Bug Reports](https://github.com/microsoft/side-channel-fuzzer/issues){ .md-button }
    [Explore Docs](structure.md){ .md-button }


- __:fontawesome-solid-comments: Join the Community__

    ---

    <p class="text">
    Join the Revizor community to get help, discuss ideas, suggest features, and share your experiences.
    </br></br></br>
    </p>

    [Zulip Community](https://rvzr.zulipchat.com/){ .md-button }
    [GitHub Discussions](https://github.com/microsoft/side-channel-fuzzer/discussions){ .md-button }

</div>

---

## __:fontawesome-solid-bug: Trophies__{ .trophies-header }

#### Transient Scheduler Attack - L1 Cache (TSA-L1)

=== "Description"
    A speculative leak affecting AMD Family 19h processors where false completions in load instructions can leak data from the L1 data cache across security boundaries. The attack exploits the linear address-based microtag system used for L1 cache lookups - when a load finds a matching microtag entry but the L1 doesn't contain valid data, invalid data from the matching microtag entry is used in a false completion. This leak enables information disclosure between kernel/userspace, hypervisor/guest, across different applications or VMs, and from SEV-SNP VMs to the host.
=== "CVE"
    [CVE-2024-36357](https://nvd.nist.gov/vuln/detail/CVE-2024-36357)
=== "Links"
    * More details in: [Enter, Exit, Page Fault, Leak: Testing Isolation Boundaries for Microarchitectural Leaks](https://aka.ms/enter-exit-leak)
    * AMD Security Advisory: [Advisory](https://www.amd.com/en/resources/product-security/bulletin/amd-sb-7029.html)


#### Transient Scheduler Attack - Store Queue (TSA-SQ)

=== "Description"
    A speculative leak affecting AMD Family 19h processors where false completions in Store-To-Load Forwarding operations can leak data from previous store instructions. When a load matches an older store's address but the store data isn't yet available, a false completion occurs using invalid data from a previously executed store that occupied the same store queue entry. This effect enables information leakage from the OS kernel to user applications, hypervisor to guest, and to a lesser extent, between applications.
=== "CVE"
    [CVE-2024-36350](https://cve.mitre.org/cgi-bin/cvename.cgi?name=CVE-2024-36350)
=== "Links"
    * More details in: [Enter, Exit, Page Fault, Leak: Testing Isolation Boundaries for Microarchitectural Leaks](https://aka.ms/enter-exit-leak)
    * AMD Security Advisory: [Advisory](https://www.amd.com/en/resources/product-security/bulletin/amd-sb-7029.html)

#### Control Register Speculation

=== "Description"
    A speculative leak affecting AMD processors where user processes can speculatively infer control register values even when User Mode Instruction Prevention (UMIP) is enabled. This bypasses intended security boundaries by allowing unprivileged code to access system-level configuration information through speculative channels.
=== "CVE"
    [CVE-2024-36348](https://cve.mitre.org/cgi-bin/cvename.cgi?name=CVE-2024-36348)
=== "Links"
    * More details in: [Enter, Exit, Page Fault, Leak: Testing Isolation Boundaries for Microarchitectural Leaks](https://aka.ms/enter-exit-leak)
    * AMD Security Advisory: [Advisory](https://www.amd.com/en/resources/product-security/bulletin/amd-sb-7029.html)

#### TSC_AUX Speculation

=== "Description"
    A speculative leak affecting AMD processors that permits user processes to infer the Time Stamp Counter Auxiliary (TSC_AUX) register value even when direct reads are disabled.
=== "CVE"
    [CVE-2024-36349](https://nvd.nist.gov/vuln/detail/CVE-2024-36349)
=== "Links"
    * More details in: [Enter, Exit, Page Fault, Leak: Testing Isolation Boundaries for Microarchitectural Leaks](https://aka.ms/enter-exit-leak)
    * AMD Security Advisory: [Advisory](https://www.amd.com/en/resources/product-security/bulletin/amd-sb-7029.html)


#### Divider State Sampling (DSS)

=== "Description"
    A speculative leak where division-by-zero operations can transiently return values that depend on previous division operations. The leaked state persists across privilege boundaries. The discovery of the leak triggered a patch to the Linux kernel as well as other operating systems.
=== "CVE"
    [CVE-2023-20588](https://nvd.nist.gov/vuln/detail/CVE-2023-20588)
=== "Links"
    More details in: [Speculation at Fault](https://www.usenix.org/system/files/usenixsecurity23-hofmann.pdf)

#### String Comparison Overrun (SCO)

=== "Description"
    Revizor discovered that string operations on Intel and AMD CPUs (in particular, string comparison and string scan) can speculatively bypass the bounds of their target strings, which permits the attacker to leak data from out-of-bounds memory locations.
=== "Links"
    More details in: [Hide & Seek with Spectres](https://www.microsoft.com/en-us/research/publication/hide-and-seek-with-spectres-efficient-discovery-of-speculative-information-leaks-with-random-testing/)

#### Zero Dividend Injection (ZDI)

=== "Description"
    64-bit division operations on Intel CPUs can speculatively ignore the upper bits of the divisor, thus producing an incorrect computational result. This speculation can potentially impact the security of cryptographic algorithms that use division to implement modulo operations.
=== "Links"
    More details in: [Hide & Seek with Spectres](https://www.microsoft.com/en-us/research/publication/hide-and-seek-with-spectres-efficient-discovery-of-speculative-information-leaks-with-random-testing/)

#### Read-Modify-Write Speculation

=== "Description"
    A new variant of Microarchitectural Data Sampling (MDS) where a store operation to read-only memory triggers speculative behavior. When a read-modify-write instruction (like XADD) attempts to access read-only memory, it speculatively returns stale data from internal CPU buffers, even though the read itself would be permitted.
=== "Links"
    More details in: [Speculation at Fault](https://www.usenix.org/system/files/usenixsecurity23-hofmann.pdf)

#### Non-canonical Store Forwarding

=== "Description"
    A speculative leak where stores to non-canonical addresses can be forwarded to subsequent loads from the canonical versions of those addresses. This means that even though a store operation fails due to an invalid address format, its data can still be transiently accessed by later instructions using a related valid address.
=== "Links"
    More details in: [Speculation at Fault](https://www.usenix.org/system/files/usenixsecurity23-hofmann.pdf)

#### Variable-latency Spectre

=== "Description"
    A variant of Spectre vulnerability where the leakage is caused by the race condition that appears when a speculative memory access is data-dependent on a variable-latency instruction. This race condition can expose the operands of the variable-latency instruction.
=== "Links"
    More details in [the Revizor paper](https://www.microsoft.com/en-us/research/publication/revizor-testing-black-box-cpus-against-speculation-contracts/)

#### Store-based Spectre V1

=== "Description"
    Several defense proposals (e.g., STT, KLEESpectre) assumed that stores do not modify the cache state until they retire. We used Revizor to validate this assumption, and discovered that it is not true on recent Intel CPUs (e.g., CoffeeLake).
=== "Links"
    More details in [the Revizor paper](https://www.microsoft.com/en-us/research/publication/revizor-testing-black-box-cpus-against-speculation-contracts/)

#### Speculative Store with Forwarding

=== "Description"
    Revizor discovered that two consecutive loads from the same address can speculatively return two different values if one of them receives a forwarded value from a store while the other load experiences a speculative store bypass. This combination exposes more information to the attacker compared to the original store bypass.
=== "Links"
    More details in [the appendix to the Revizor paper](https://www.microsoft.com/en-us/research/publication/revizor-testing-black-box-cpus-against-speculation-contracts/)

<!--
### Reproduced Vulnerabilities

- [Spectre V1 (Bounds Check Bypass, BCB)](https://spectreattack.com/)
- [Spectre V4 (Speculative Store Bypass, SSBP)](https://www.intel.com/content/www/us/en/developer/articles/technical/software-security-guidance/advisory-guidance/speculative-store-bypass.html)
- [Meltdown (SMAP variant)](https://meltdownattack.com/)
- [Foreshadow (L1TF)](https://foreshadowattack.eu/)
- [Microarchitectural Data Sampling (MDS)](https://www.intel.com/content/www/us/en/developer/articles/technical/software-security-guidance/advisory-guidance/microarchitectural-data-sampling.html)
- [Load Value Injection (LVI), including LVI-Null](https://www.intel.com/content/www/us/en/developer/articles/technical/software-security-guidance/technical-documentation/load-value-injection.html)
 -->


================================================
FILE: docs/internals/architecture/analysis.md
================================================
|                  |                    |
| ---------------- | ------------------ |
| Module           | `rvzr/analyser.py` |
| Public interface | `Analyser`         |
| Inputs           | `CTrace`, `HTrace` |
| Outputs          | `Violation`        |

The Analyser compares contract traces with hardware traces to detect violations. The core principle: inputs with identical CTraces should produce equivalent HTraces. When they don't, a contract violation has occurred.

```python
For all inputs i, j:
    if CTrace(i) == CTrace(j) and HTrace(i) != HTrace(j):
        → Violation detected
```

Analyser implementations:

Different analysers define "equivalent HTrace" differently:

- `MergedBitmapAnalyser` (default) — Merges samples using bitwise OR, compares bitmaps. For cache-based channels.
- `SetAnalyser` — Compares sets of unique samples.
- `MWUAnalyser` — Uses Mann-Whitney U statistical test. For timing-based channels.
- `ChiSquaredAnalyser` — Uses chi-squared test for distribution differences.


================================================
FILE: docs/internals/architecture/code.md
================================================
# Test Case Code Generation

|                  |                          |
| ---------------- | ------------------------ |
| Module           | `rvzr/code_generator.py` |
| Public interface | `CodeGenerator`          |
| Inputs           | `InstructionSet`         |
| Outputs          | `TestCaseProgram`        |

This module generates random assembly programs for testing. The generator creates programs designed to trigger speculative execution and expose microarchitectural leaks.

### Generation process

1. Create control flow graph — Generate a random Directed Acyclic Graph (DAG) of basic blocks. The DAG structure prevents infinite loops while allowing branches and mispredictions.

2. Add jump instructions — Insert conditional and unconditional jumps at block boundaries to connect the blocks according to the DAG.

3. Fill basic blocks — Populate blocks with random instructions from the tested instruction pool, respecting instruction frequencies and operand constraints.

4. Instrument — (Optionally) Prevent faults by masking memory addresses, avoiding division by zero, and ensuring all accesses stay within the sandbox.

5. Assemble — Convert to binary and extract metadata.

6. Transform into RCBF — Serialize the test case into Revizor's custom binary format ([RCBF](../../ref/binary-formats.md)) for execution.

### Test case representation

```text
TestCaseProgram
  ├─ CodeSection (one per actor)
  │    └─ Function
  │         └─ BasicBlock
  │              └─ InstructionNode
  │                   └─ Instruction
  │                        └─ Operand
  └─ TestCaseBinary
       └─ SymbolTable
```

### Variants

Architecture-specific implementations of the code generator exist for x86 and ARM64, named `X86Generator` and `ARM64Generator` in `rvzr/arch/*/code_generator.py`.


================================================
FILE: docs/internals/architecture/data.md
================================================
# Test Case Data Generation

|                  |                          |
| ---------------- | ------------------------ |
| Module           | `rvzr/data_generator.py` |
| Public interface | `DataGenerator`          |
| Inputs           | `Config`                 |
| Outputs          | `InputData`              |

`DataGenerator` generates input data that is used to initialize registers and memory before executing a test case, on both the model and the target hardware.


## Generation modes

Two input generation modes are supported:

### Standard generation

Interface: `DataGenerator.generate(...)`

This method creates fully random inputs using a PRNG. Can optionally reduce entropy (to increase trace collisions) or inject special values (zeros, boundary values) to trigger edge cases.

### Boosted generation

Interface: `DataGenerator.generate_boosted(...)`

Boosted generation solves the following challenge:
To detect a violation via relational non-interference testing, we always need at least two inputs that produce identical contract traces (see [Trace Analysis](overview.md#6-trace-analysis)). Generating such contract-equivalent inputs through pure randomness is extremely inefficient because the entropy of contract traces is usually very high, and thus most random inputs produce unique traces.

Boosted generation addresses this by leveraging dynamic taint analysis on the model side. It works as follows: Start by producing a set of random inputs using standard generation. Then, we execute the test case with each input in the model and perform backwards taint analysis to identify which input bytes affect the contract trace (tainted) and which don't (untainted). This produces a set of `InputTaint` objects that map input bytes to their taint status. These taint maps are fed back into the `generate_boosted()` method, which creates new inputs such that the tainted bytes remain fixed while the untainted bytes are randomized.

```text
Original InputData → Model → InputTaint → N contract-equivalent inputs
```

Such "boosted" inputs are guaranteed to produce the same contract trace as the original input while still being mostly random.


## Data Representation

Each input is represented as an `InputData` object, which is a numpy structured array containing

- Memory contents
- General-purpose registers
- SIMD registers
- Flags and special registers

for each actor in the test case. This object can be serialized into Revizor's custom binary format ([RDBF](../../ref/binary-formats.md)) for consumption by the model and executor.


================================================
FILE: docs/internals/architecture/exec.md
================================================
# Hardware Tracing

|                  |                                         |
| ---------------- | --------------------------------------- |
| Module           | `rvzr/executor.py`, `rvzr/executor_km/` |
| Public interface | `Executor`                              |
| Inputs           | `TestCaseProgram`, `InputData`          |
| Outputs          | `HTrace`                                |

## Executor

The Executor runs test cases on real hardware and collects hardware traces (HTraces) using side-channel measurements. It uses a two-layer architecture: Python code communicates with a kernel module that performs measurements in kernel space.

```text
Python (executor.py)
  ├─ X86IntelExecutor
  ├─ X86AMDExecutor
  └─ ARM64Executor
       │
       │ /sys/rvzr_executor/ interface
       ▼
Kernel Module (executor_km/)
```

## HTrace representation

The `HTrace` class (`rvzr/traces.py`) represents hardware traces collected during execution. The executor produces one `HTrace` object per program-input pair, meaning that for each `TestCaseProgram` execution with each `InputData` input, one `HTrace` is generated.

Each `HTrace` encapsulates multiple measurement results (samples). This is because the executor typically repeats the execution several times and each execution produces one measurement sample. Such repeated measurements allow us to apply statistical methods when comparing noisy hardware traces (see [Trace Analysis](analysis.md) below).

The structure of an `HTrace` is as follows:

```text
HTrace
  └─ Array[RawHTraceSample]
       ├─ trace       Main measurement (cache bitmap, timestamp, or registers)
       └─ pfc0-pfc4   Performance counter values
```


================================================
FILE: docs/internals/architecture/fuzz.md
================================================
# Orchestration Module

|                  |                                          |
| ---------------- | ---------------------------------------- |
| Module           | `rvzr/fuzzer.py`                         |
| Public interface | `Fuzzer`                                 |
| Inputs           | `Config`, `InstructionSet`, ASM Template |
| Outputs          | Violation artifact, logs                 |

The `Fuzzer` class is the main coordinator. It manages the core components (`CodeGenerator`, `DataGenerator`, `Model`, `Executor`, and `Analyser`) and orchestrates the fuzzing loop.

## Main workflow

```text
Fuzzer.start()
  └─> for each test case:
        ├─> CodeGenerator.create_test_case() → TestCaseProgram
        ├─> DataGenerator.generate() → List[InputData]
        └─> Fuzzer.fuzzing_round(program, inputs)
              ├─> Model.trace_test_case() → List[CTrace]
              ├─> Executor.trace_test_case() → List[HTrace]
              ├─> Analyser.filter_violations() → List[Violation]
              └─> if violation: multi-stage filtering pipeline
```


## Multi-stage filtering

When a potential violation is found, the Fuzzer runs it through several validation stages. Each stage modifies parameters and re-checks the violation to rule out false positives:

1. `fast` — Initial fast detection using minimal speculative nesting on the model side and small sample size on the executor side
2. `nesting` — Re-collect ctraces with the model using full speculative nesting. This rules out false positives caused by incomplete speculation modeling
3. `taint_mistake` — Re-collect ctraces for the boosted inputs to rule out boosting-based generation mistakes
4. `priming` — Perform a so-called "priming test" (swap the order of violating inputs) to rule out false positives caused by inconsistent microarchitectural state across executions
5. `noise` — Increase sample size on the executor side to increase statistical confidence and rule out noise-induced violations
6. `arch_mismatch` — Compare the architectural output (i.e., register/memory states) of the model and executor to rule out violations caused by functional mismatches (i.e., by bugs in the model or executor)

If a violation survives all stages, Revizor saves a reproduction package (called "violation artifact") containing the test case, inputs, configuration, and detailed report.

## Fuzzer variants

The `Fuzzer` class is abstract. There are several variants modifying the baseline logic:

- `X86Fuzzer` / `ARM64Fuzzer` — Architecture-specific implementations
- `ArchitecturalFuzzer` — Validates model correctness (i.e., performs stage 6 `arch_mismatch` for all test cases, even non-violating ones)
- `ArchDiffFuzzer` — Completely discards the model, and instead compares two hardware executions, one with a normal test case and one with a speculation fence added after every instruction. This variant is used to detect speculation-induced architectural bugs, like Zenbleed.


================================================
FILE: docs/internals/architecture/isa.md
================================================
# Instruction Set Specification

|                  |                    |
| ---------------- | ------------------ |
| Module           | `rvzr/isa_spec.py` |
| Public interface | `InstructionSet`   |
| Inputs           | `base.json`        |
| Outputs          | `InstructionSet`   |

This module manages the instruction set available for fuzzing. It loads ISA definitions from a JSON file (`base.json`) and applies user-configured filters to create a pool of allowed instructions.

Each instruction is represented by an `InstructionSpec` containing instruction name and category, operand specifications, and instruction properties.

Processing pipeline:

1. Load ISA specification from JSON
2. Apply filters (allowlist, blocklist, categories, register restrictions)
3. Remove duplicates
4. Categorize instructions by type (control flow, memory access, etc.)


================================================
FILE: docs/internals/architecture/logging.md
================================================
# Logging

|                  |                               |
| ---------------- | ----------------------------- |
| Module           | `rvzr/logs.py`                |
| Public interface | `FuzzLogger`, etc.            |
| Inputs           | N/A                           |
| Outputs          | Log messages (stdout, stderr) |

Revizor uses a centralized logging system with configurable verbosity. The system uses the Borg pattern to share state across modules.

Available logging modes:

- info — General messages and progress
- stat — Statistics
- dbg_* — Debug modes for specific components

Logging components:

- Basic functions: `error()`, `warning()`, `inform()`, `dbg()`
- Module-specific loggers: `FuzzLogger`, `GeneratorLogger`, `ISALogger`, `ExecutorLogger`, `AnalyserLogger`


================================================
FILE: docs/internals/architecture/mini.md
================================================
# Post-violation Analysis

|                  |                                 |
| ---------------- | ------------------------------- |
| Module           | `rvzr/postprocessing/`          |
| Public interface | `Minimizer`                     |
| Inputs           | Violation artifact (.asm, .bin) |
| Outputs          | Minimized test case and inputs  |

After confirming a violation, users can run post-processing to simplify the test case and identify the root cause. The postprocessing module applies minimization passes that reduce complexity while preserving the violation.

Class hierarchy:

```text
Minimizer
  └─ Orchestrates passes, manages files

BaseMinimizationPass
  ├─ Instruction passes (modify code)
  ├─ Data passes (modify inputs)
  └─ Analysis passes (add annotations)
```

Instruction passes (operate on test case code):

- `InstructionRemovalPass` — Remove instructions one at a time to find essential ones
- `NopReplacementPass` — Replace with NOPs (preserves alignment)
- `InstructionSimplificationPass` — Replace complex instructions with simpler ones
- `ConstantSimplificationPass` — Simplify immediate values
- `MaskSimplificationPass` — Simplify bitmasks
- `LabelRemovalPass` — Remove unused labels
- `FenceInsertionPass` — Insert fences to identify speculation boundaries

Data passes (operate on inputs):

- `DifferentialInputMinimizerPass` — Use delta debugging to find minimal byte differences
- `InputSequenceMinimizationPass` — Reduce number of inputs

Analysis passes (add annotations):

- `AddViolationCommentsPass` — Annotate assembly with memory addresses from execution


================================================
FILE: docs/internals/architecture/model.md
================================================
# Contract Tracing

|                  |                                |
| ---------------- | ------------------------------ |
| Module           | `rvzr/model.py`                |
| Public interface | `Model`                        |
| Inputs           | `TestCaseProgram`, `InputData` |
| Outputs          | `CTrace`                       |

## Model

The Model executes test cases according to a leakage contract and produces contract traces (CTraces). These represent the information expected to leak during execution, including speculative execution.

Revizor supports two model backends:

- **Unicorn**: This backend is based on the [Unicorn CPU emulator](https://www.unicorn-engine.org/). It implements the contract by hooking into instruction execution and memory access events. Documentation is provided in [Unicorn Backend](../model-backends/model-unicorn.md).
- **DynamoRIO**: This backend uses [DynamoRIO](https://dynamorio.org/) for dynamic binary instrumentation. It instruments the test case to insert hooks for tracing and speculation simulation. Documentation is provided in [DynamoRIO Backend](../model-backends/model-dr.md).

Both implement the same interface defined by the abstract `Model` class.

## Contract Trace Representation

A `CTrace` is a sequence of typed observations representing leaked information:

```text
CTrace
  └─ List[CTraceEntry]
       ├─ mem    Memory address
       ├─ pc     Program counter
       ├─ val    Data value
       ├─ reg    Register value
       └─ ind    Indirect branch target
```

CTraces use `xxhash` for fast equality checking, enabling efficient grouping into equivalence classes.


================================================
FILE: docs/internals/architecture/overview.md
================================================
# Architecture Overview & Code Structure

This document introduces Revizor's architecture and key components. It is designed to provide an overview of how the codebase is organized and how the main pieces work together.

!!! info "Prerequisites"
    This document assumes familiarity with the concepts of side-channel attacks, speculative execution, and [Speculation Contracts and Model-based Relational Testing (MRT)](../../topics/contracts.md).

## How Revizor Works

Revizor detects CPU security vulnerabilities using Model-based Relational Testing (MRT). The core idea is to compare what a CPU should leak (according to a leakage model) with what it actually leaks during execution.

Basic process:

1. Generate random assembly programs
2. Execute them on both a leakage model and real hardware
3. Compare the observed hardware behavior with the model's predictions
4. If they match, the CPU behaves as expected (discard the test)
5. If they differ, a potential vulnerability has been found

The leakage model acts as a reference model of the expected CPU behavior. If the real CPU leaks more information than the model predicts (i.e., if it diverges from the reference), this indicates a potential security vulnerability. For details on how leakage models work, see [Speculation Contracts](../../topics/contracts.md).

Revizor runs the following loop until it finds a violation or completes the configured number of test cases:

![architecture](../../assets/fuzzing-flow.png)

## 1. Initialization

This step runs once at startup. Revizor reads the fuzzing configuration, which specifies:

- Target CPU architecture
- ISA (instruction set) specification
- Which instructions to test
- Which side channels to monitor
- Other fuzzing parameters

The `cli.py` module handles command-line arguments and creates the main objects: `InstructionSet` (from `isa_spec.py`), `Config` (from `config.py`), and `Fuzzer` (from `fuzzer.py`).

## 2. Code Generation

Each fuzzing round starts by generating a random test program. This is an assembly program with semi-random control flow, built from a pool of allowed instructions.

The code generator can be configured to control the shape of the control flow graph, which instructions to include, and how often each instruction appears. It also (optionally) instruments the program to prevent faults like division by zero.

The `Fuzzer` calls `CodeGenerator.create_test_case()` (in `code_generator.py`), which returns a `TestCaseProgram` object representing the generated assembly program.

## 3. Data Generation

Next, Revizor generates random inputs for the test program. Each input contains initial values for registers and memory. These values are pseudo-random but use fixed seeds for reproducibility.

The `DataGenerator` class (in `data_generator.py`) creates these inputs and returns them as `InputData` objects. See [binary formats](../../ref/binary-formats.md#revizor-data-binary-format-rdbf) for the structure of input data.

## 3.5 Test Case Filtering (Optional)

Some test cases are unlikely to reveal vulnerabilities, so Revizor can filter them out early to save time. This is optional and disabled by default.

Two filters are available:

- Speculation filter: Uses performance counters to check if the test case triggers branch mispredictions. Without mispredictions, the test cannot expose speculative leaks.
- Observation filter: Compares the original test case with a "fenced" version (with serialization instructions added). If both produce identical traces, speculation left no observable effects.

These filters are implemented in architecture-specific fuzzer classes (like `X86Fuzzer` in `rvzr/arch/x86/fuzzer.py`).

## 4. Model Execution

The model executes the test program with each generated input and produces contract traces (CTraces). These traces represent what the model predicts should leak during execution.

The `Model` class (in `model.py`) provides two key methods:

- `load_test_case()`: Loads the program into the model
- `trace_test_case()`: Executes the program with each input and returns CTraces

Revizor supports multiple model backends: [Unicorn](../model-backends/model-unicorn.md) (CPU emulator) and [DynamoRIO](../model-backends/model-dr.md) (dynamic instrumentation). Both implement the same interface.

## 5. Hardware Execution

The executor runs the test program on the target hardware with each input and collects hardware traces (HTraces). A hardware trace is a set of observable microarchitectural effects (like cache state or timing) caused by the test case execution. Traces are typically collected using side-channel techniques (e.g., Prime+Probe, Flush+Reload) or by reading performance counters.

To ensure that the measurements reflect the test case execution (rather than noise), the executor creates a controlled measurement environment by disabling interrupts, flushing caches, and repeating executions multiple times.

The `Executor` class (in `executor.py`) works through a kernel module (`executor_km/`) that performs measurements in kernel space. It provides the same interface as the model: `load_test_case()` and `trace_test_case()`.

## 6. Trace Analysis

The analyzer compares contract traces (what should leak) with hardware traces (what actually leaked) to detect violations. Instead of directly comparing traces, it uses an equivalence class approach.

How it works:

1. Group by contract: Inputs with identical CTraces form a ContractEqClass. According to the model, these inputs should be indistinguishable.
2. Group by hardware: Within each ContractEqClass, inputs with similar HTraces form HardwareEqClasses. These inputs are actually indistinguishable on real hardware.
3. Detect violations: If a ContractEqClass splits into multiple HardwareEqClasses, a violation has occurred. The model says the inputs should look the same, but hardware reveals differences between them.

This approach focuses on information leakage rather than exact trace values, and it essentially implements a non-interference check (see [Theoretical Foundations](../../topics/contracts.md)).

The `Analyser` class (in `analyser.py`) implements this logic in its `filter_violations()` method.

## 7. Post-violation Analysis

When Revizor detects a potential violation, it runs additional tests to filter out false positives. These tests modify execution parameters and verify the violation still occurs. See [post-violation tests](mini.md) for details.

If the violation survives all filters, Revizor reports it to the user and saves reproduction artifacts. The user can then use [minimization tools](../../howto/minimize.md) to simplify the test case and identify the root cause.

The post-violation logic is implemented in `Fuzzer.fuzzing_round()`, and the `FuzzLogger` class handles reporting.


================================================
FILE: docs/internals/code-structure.md
================================================
# Code Structure

The Revizor codebase is organized into the following main directories:

```text
rvzr/                         Main source code directory containing core fuzzing logic
  ├── *.py                    Core modules that implement main fuzzing components
  ├── tc_components/          Test case representation objects (code and data)
  ├── model_unicorn/          Unicorn-based leakage model
  ├── model_dynamorio/        DynamoRIO-based leakage model
  ├── executor_km/            Kernel module that implements the hardware executor
  ├── postprocessing/         Minimization utilities for contract counterexamples
  └── arch/                   Architecture-specific implementations (x86/ and arm64/)
tests/                        Unit and integration tests
docs/                         Documentation files
```

The main entry point is `rvzr/cli.py`, which parses command-line arguments and initializes the `Fuzzer` object.


================================================
FILE: docs/internals/contributing/code-style.md
================================================
# Code Style

Please follow these coding standards when writing code for inclusion in Revizor.

## Python

* Unless otherwise specified, follow PEP 8. But remember that PEP 8 is only a guide, so respect the style of the surrounding code as a primary goal.
* An exception to PEP 8 is our rules on line lengths. Don’t limit lines of code to 79 characters if it means the code looks significantly uglier or is harder to read. We allow up to 100 characters.
* All files should be formatted using the `flake8` auto-formatter. Use all default settings except for the line width (`--max-line-length 100`)
* The Python and C files use 4 spaces for indentation, and YAML uses 2 spaces.
* The project repository includes an .editorconfig file. We recommend using a text editor with EditorConfig support to avoid indentation and whitespace issues.
* Use underscores, not camelCase, for variable, function and method names (i.e. poll.get_unique_voters(), not poll.getUniqueVoters()).
* Use InitialCaps for class names (or for factory functions that return classes).
* In docstrings, follow PEP 257.

## C

* All files should be formatted using `clang-format`. The settings are included in the `.clang-format` files in the directories with C files. Just run the formatter with: `clang-format -i *.c`

## Misc

* Remove import statements that are no longer used when you change code. flake8 will identify these imports for you. If an unused import needs to remain for backwards-compatibility, mark the end of the line with `# NOQA` to silence the flake8 warning.
* Systematically remove all trailing whitespace from your code, as it adds unnecessary bytes, adds visual clutter to patches, and can occasionally cause unnecessary merge conflicts. Some IDEs can be configured to remove it automatically, and most VCS tools can be set to highlight it in diff outputs.


================================================
FILE: docs/internals/contributing/general.md
================================================
# General Development Guidelines

## Testing

To run automated tests you will need to install a few more dependencies:

* [Bash Automated Testing System](https://bats-core.readthedocs.io/en/latest/index.html)
* [mypy](https://mypy.readthedocs.io/en/latest/getting_started.html#installing-and-running-mypy)
* [flake8](https://flake8.pycqa.org/en/latest/index.html)

With the dependencies installed, you can run the tests with:

```bash
./tests/runtests.sh
```

Note that some of the acceptance tests are microarchitecture-dependent.
These tests are labeled "Detection" (e.g., `"Detection [spectre-type] Spectre V1; load variant"`), and they may fail if the CPU under test does not have a given vulnerability.
Generally, if a few of these tests fail, it is not a problem, but if all of them (or a significant portion) fail, it indicates an issue with the fuzzer.

## Submitting Patches

To submit a patch, use the following procedure:

* Fork Revizor on GitHub:

    [https://docs.github.com/en/github/getting-started-with-github/fork-a-repo](https://docs.github.com/en/github/getting-started-with-github/fork-a-repo)

* Create a topic branch:

```bash
git checkout -b my_branch
```

* Make sure all tests pass (see [Testing](#testing))
* Make sure your code follows the guidelines in [Code Style](code-style.md)
* Push to your branch

```bash
git push origin my_branch
```

* Initiate a pull request on GitHub:

    [https://docs.github.com/en/github/collaborating-with-issues-and-pull-requests/creating-a-pull-request](https://docs.github.com/en/github/collaborating-with-issues-and-pull-requests/creating-a-pull-request)

* Wait for the PR to get reviewed and merged


================================================
FILE: docs/internals/contributing/git.md
================================================
# Git Workflow Guidelines

## Git Messages

We practice the following conventions for commit messages:

```
<scope>: [<type>] <subject>
```

Where:

* `<scope>`: The scope of the change.
* `<type>`: The type of the change.
* `<subject>`: A short description of the change.


### Scopes

The following scopes are typical:


| Scope       | Description                                                      |
| ----------- | ---------------------------------------------------------------- |
| `all`       | Changes that affect the entire project (e.g., major refactoring) |
| `root`      | Root directory changes (e.g., readme, git, author list)          |
| `fuzz`      | Changes to the core fuzzer algorithm.                            |
| `cli`       | Changes to the command-line interface.                           |
| `exec`      | Changes to the executor.                                         |
| `model`     | Changes to the model.                                            |
| `analyser`  | Changes to the analyser.                                         |
| `mini`      | Changes to the postprocessor (i.e., minimizer).                  |
| `code_gen`  | Changes to the program generator                                 |
| `data_gen`  | Changes to the input generator                                   |
| `tests`     | Changes to the tests                                             |
| `isa`       | Changes to the ISA loader or to `get_spec` files                 |

If a commit covers several scopes, use the most relevant one.

If a commit targets a specific architecture (e.g., x86), add the architecture to the scope (e.g., `fuzz/x86`).

### Types

Use one of the following types:

| Type     | Description                                                                   |
| -------- | ----------------------------------------------------------------------------- |
| `feat`   | A new feature.                                                                |
| `fix`    | A bug fix.                                                                    |
| `docs`   | Documentation changes.                                                        |
| `chore`  | Changes to the build process or auxiliary tools.                              |
| `ft`     | Fault tolerance changes (e.g., adding error handling or recovery mechanisms). |
| `refact` | Refactoring of the codebase. This includes code style change.                 |
| `perf`   | Performance improvements.                                                     |
| `revert` | Reverts a previous commit.                                                    |

If possible, try to use only these types.
If you need to use a different type, please discuss it with a maintainer.

## Git Branches

We practice the [git workflow](https://git-scm.com/docs/gitworkflows), with a few modifications.

![branching workflow](../../assets/branches.png)

We use the following branches for graduation:

* `main`: The latest release. This branch should always be stable, and it is the last branch to receive changes.
* `main-fixes`: Commits that go in the next maintenance release. This branch is created from the last release branch.
* `dev`: The development branch. This branch is the first to receive changes.

Commits should be merged upwards:

* `dev` -> `pre-release` -> `main`
* In case of hot fixes, `main-fixes` -> `main` AND `main-fixes` -> `pre-release`

For working on unstable code (e.g., progress on features or bug fixes), use either forks or feature branches.
Use forks if you are the only one working on the feature, and use a pull request to merge the changes back into the main repository.
Use a feature branch if multiple people are working on the feature, in which case name the branch `feature-<name>` or `bugfix-<name>`, and make sure to branch from the `dev` branch.

The only exception is the `gh-pages` branch, which is used for the project's website.
This branch is used by automated tools and should never be used for development.


================================================
FILE: docs/internals/contributing/overview.md
================================================
# Guide to Contributing

This document provides an overview of how to contribute to the Revizor project.

## What can I contribute?

Revizor is an open-source project, and we welcome contributions of all kinds. You don't have to be an expert in hardware security or fuzzing to contribute! Even small contributions are valuable.

Here are some ways you can help:

* :fontawesome-solid-bug: Report Issues: The easiest way to contribute is by reporting issues you encounter while using Revizor. Try following the introductory [guides and tutorials](../../intro/start-here.md), and if you find any issues, bugs, or unclear documentation, please report them on our [GitHub Issues page](https://github.com/microsoft/side-channel-fuzzer/issues).
* :fontawesome-solid-pencil: Improve Documentation: You can also contribute by improving the documentation. If you find any gaps, outdated information -- even typos -- feel free to submit a pull request with your improvements.
* :fontawesome-solid-code: Code Contributions: If you're interested in coding, you can contribute new features, fix bugs, or enhance existing functionality. Check out the [issue tracker](https://github.com/microsoft/side-channel-fuzzer/issues) for open issues and feature requests.
* :fontawesome-solid-lightbulb: New Features: Finally, if you have expertise in hardware security, fuzzing, or related areas, consider contributing new features and enhancements to Revizor (see [ideas for contributions](#ideas-for-contributions) if you need inspiration).

## Reporting Bugs and Issues

To report a bug or an issue, please use the [GitHub Issues page](https://github.com/microsoft/side-channel-fuzzer/issues).

If you're reporting a simple bug, it is sufficient to provide a small description of the problem and the environment in which it occurred (Revizor version, target architecture, OS, etc.).

For more complex issues, especially those related to the fuzzing process, also include the configuration file you've used and the command-line arguments.

The recommended report template is as follows:

```
## Description
A clear and concise description of what the bug is.

## To Reproduce
1. Go to '...'
2. Run '...'
3. See error

## Expected behavior
A clear and concise description of what you expected to happen.

**Environment**
- Revizor version:
- Architecture:
- OS:
...

## Additional context
Add any other context about the problem here.

## Attachments
- Configuration file used:
- Command-line arguments:
- Logs or error messages:
```

## Submitting Patches

To submit a patch, be it to the code or to the documentation, use the following procedure:

* [Fork Revizor on GitHub](https://docs.github.com/en/github/getting-started-with-github/fork-a-repo)
* Create a topic branch (`git checkout -b my_branch`)
* Make and commit your changes in the new branch
* Make sure all tests pass (`./tests/runtests.sh <target_ISA>`) and that the code is formatted according to the [Code Style](code-style.md) guidelines.
* Push to your branch (`git push origin my_branch`)
* [Initiate a pull request on GitHub](https://docs.github.com/en/github/collaborating-with-issues-and-pull-requests/creating-a-pull-request)
* Wait for the PR to get reviewed and merged

#### Contributor License Agreement and Code of Conduct

Most contributions require you to agree to a
Contributor License Agreement (CLA) declaring that you have the right to, and actually do, grant us
the rights to use your contribution. For details, visit [https://cla.opensource.microsoft.com](https://cla.opensource.microsoft.com).

When you submit a pull request, a CLA bot will automatically determine whether you need to provide
a CLA and decorate the PR appropriately (e.g., status check, comment). Simply follow the instructions
provided by the bot. You will only need to do this once across all repos using our CLA.

This project has adopted the [Microsoft Open Source Code of Conduct](https://opensource.microsoft.com/codeofconduct/).
For more information see the [Code of Conduct FAQ](https://opensource.microsoft.com/codeofconduct/faq/) or
contact [opencode@microsoft.com](mailto:opencode@microsoft.com) with any additional questions or comments.

## <a name="ideas-for-contributions"></a> Ideas for Contributions

If you're looking for ideas and inspiration on how you can meaningfully extend and improve Revizor, here are some suggestions:

---

#### Add Support for New Instructions

There are quite a few specialized instructions that Revizor does not yet fully support. Implementing support for these instructions can help improve the coverage and effectiveness of the fuzzer. As a bonus, you might discover new types of information leaks in the process.

These include, but are not limited to:

* Floating-point instructions (either x87 or SSE/AVX)
* Segment-based memory accesses or instructions that manipulate segment registers
* Complex control-flow instructions (e.g., `call`, `ret`, indirect jumps)
* MMX instructions

---

#### Make Generators Smarter

Both code and data generators can be improved in various ways to produce more effective test cases. The bar is fairly low here, as current generators are fully random.

Ideas include:

* Bias generators to produce values that are more likely to trigger edge cases (e.g., boundary values, special bit patterns)
* Implement the ability to control the frequency of certain instruction types in generated programs
* Implement mutation-based generation strategies that modify existing test cases to explore new behaviors

If you decide to work on any of these or have your own ideas, please discuss them with us first by reaching out on [GitHub Discussions](https://github.com/microsoft/side-channel-fuzzer/discussions) or opening a draft pull request. This way we can ensure that your efforts align with the project's goals and avoid duplication of work.

---

#### Improve Reporting Tools

The current logging and debugging tools in Revizor are relatively basic. Enhancing these utilities for better readability and usability can significantly aid users in understanding fuzzing results and diagnosing issues.

Ideas include:

* Refactor the logging module to output a live dashboard, similar to what is seen in other fuzzers like AFL or libFuzzer
* Improve the debugging output to improve readability when debugging models

---

#### Implement New Measurement Modes

Revizor currently collects side-channel observations primarily through cache measurements or by recording the execution time of test programs. Implementing additional measurement modes can help uncover new types of leaks and improve the fuzzer's effectiveness.

New measurement modes could include:

* Instruction cache measurements (e.g., using I-cache side channels)
* Contention-based measurements (e.g., measuring resource contention on the memory bus)
* Performance counter-based measurements (i.e., reading directly from CPU performance counters)

Beyond that -- if you're brave enough -- you could attempt implementing concurrent measurement modes, for example, by running each actor in a test case on a different core or SMT thread. This is a complex task that requires significant changes to the executor, and might require new techniques for dealing with non-determinism and imprecise synchronization. But if successful, it could open up new avenues for discovering cross-core or cross-thread leaks. You might even make a paper out of it.

---

#### Implement Coverage-Guided Fuzzing

Another interesting avenue for exploration is implementing proxy-based coverage metrics. Currently, Revizor runs in a fully random mode, without any feedback being collected in the process of fuzzing. Implementing coverage-guided fuzzing techniques could significantly improve the efficiency of the fuzzer.

Ideas include:

* Proxy-based coverage metrics, where an emulator or a simulator is used as a proxy for the CPU coverage. That is, the fuzzer would run test cases on an emulator, collect the software coverage information (which edges of the emulator code were executed), and use that to guide the generation of new test cases.
* Specification-based coverage metrics, where a formal specification of the instructions (e.g., ARM Architecture Specification Language) is used to determine edge cases in the execution of instructions. The fuzzer would then aim to cover all possible behaviors defined in the specification.


================================================
FILE: docs/internals/index.md
================================================
# Developer Documentation

This section provides technical documentation for developers contributing to Revizor.

## Development Guidelines

- [Guide to Contributing](contributing/overview.md): Overview of the contribution process and resources
- [General Guidelines](contributing/general.md): Development environment setup, testing procedures, contribution workflow
- [Code Style](contributing/code-style.md): Formatting conventions for Python and C code, naming conventions
- [Git Workflow](contributing/git.md): Branch management, commit message format, merge procedures

## Architecture and Modules

- [Code Structure](code-structure.md): Organization of the source code directory and key modules
- [Overview](architecture/overview.md): High-level system architecture and component interaction
    - [Orchestration](architecture/fuzz.md): Main fuzzing loop and coordination between components
    - [ISA Specification](architecture/isa.md): Instruction set architecture definitions and JSON-based specification format
    - [Test Case Code Generation](architecture/code.md): Program generation algorithm and relevant classes
    - [Test Case Data Generation](architecture/data.md): Data generation algorithm and relevant classes
    - [Hardware Tracing](architecture/exec.md): Execution of test cases on the target HW and hardware trace collection
    - [Contract Tracing](architecture/model.md): Leakage modeling and contract trace generation (high-level overview; implementation details in backend-specific pages)
    - [Trace Analysis](architecture/analysis.md): Comparison of contract and hardware traces to detect violations
    - [Minimization](architecture/mini.md): Post-detection reduction of test cases to minimal reproducing examples
    - [Logging](architecture/logging.md): Logging infrastructure and debugging facilities

## Contract Modeling Backends

Revizor supports two different backends for contract-based leakage modeling. They are documented in the following pages:

- [Unicorn Backend](model-backends/model-unicorn.md): Backend based on the Unicorn CPU emulator
- [DynamoRIO Backend](model-backends/model-dr.md): Backend based on the DynamoRIO dynamic binary instrumentation engine


================================================
FILE: docs/internals/model-backends/model-dr.md
================================================
# DynamoRIO-based Model Backend

This document describes the DynamoRIO-based model.
Like any other model, this backend is responsible for collecting contract traces for generated test cases.

## Design Overview

This backend is composed of several parts:

* The Python adapter (`rvzr/model_dynamorio/model.py`) is responsible for receiving a test case from Revizor, transforming it into a format that can be executed by the backend, triggering the backend to execute the test case, and returning the collected contract traces to Revizor.
* The Test Case Loader (`rvzr/model_dynamorio/adapter.c`) is a C program that loads a test case program and a batch of inputs into its memory, and executes the test case program with each input in a sequence.
* The DynamoRIO components (`rvzr/model_dynamorio/backend`) are executed together with the test case loader, and they instrument the loader binary to collect contract traces.

These components can be roughly divided into the instrumentation-time components that are responsible for modifying the binary, and execution-time components that implement the model logic (i.e., the contract).

[![DynamoRIO-based Model Backend](../../assets/dr-model.png)](../../assets/dr-model.png)

## Python Adapter

Revizor communicates with the backend through a Python adapter (`rvzr/model_dynamorio/model.py:DynamoRIOModel`).

At the beginning of the fuzzing process, Revizor configures the backend by calling the `configure_clauses` method.
This configuration will be later passed down to the backend when the test case is executed.

During the fuzzing process, Revizor sends test cases to the backend by calling the `load_test_case` method, and then triggers the backend to execute the test case by calling the `trace_test_case` method.
Internally, `trace_test_case` will call the backend to execute the test case and collect the contract traces.
The adapter will then parse the traces and return them back to the caller.

The `trace_test_case` method implements the following algorithm:

- Convert test case program and inputs into RCBF and RDBF files, respectively
- For each input, call the test case loader with the RCBF and RDBF files. Attach the DynamoRIO backend to the call so that the binary instrumentation is performed:
```shell
~/.local/dynamorio/drrun -c ~/.local/dynamorio/libdr_model.so --tracer <observation-clause> -- ~/.local/dynamorio/adapter <rcbf> <rdbf>
```
- Parse contract traces from the backend and convert them into `CTrace` objects
- Return the list of collected `CTrace` objects to the caller (usually, `fuzzer.py`)

## Test Case Loader

Since the test cases produced by Revizor are raw binaries, they cannot be directly executed (e.g., they don't have `libc` linked).
The test case loader (`rvzr/model_dynamorio/adapter.c`) is a simple C program that fixes this issue by providing a wrapper around the test case binary.

The loader implements the following algorithm:

- Receive the test case binary and an input from the Python adapter via CLI arguments
- Load the test case binary and the input into dedicated memory regions
- Print the addresses of the test case and input memory regions (for trace normalization)
- Initialize registers based on the input
- Jump to the test case binary entry point
- Return

## DynamoRIO Tool

The DynamoRIO tool (`rvzr/model_dynamorio/backend`) is responsible for instrumenting the test case loader binary and collecting contract traces.

### Implementation Overview

All instrumentation logic is implemented as a DynamoRIO client. In particular,
`model.cpp` contains the event callbacks that are executed at instrumentation time,
while `dispatcher.cpp` contains the body of the callbacks that are inserted
by the DR client and are executed before every instruction at runtime. Finally, the `Dispatcher` object holds the state that is
shared between instrumentation-time callbacks and execution-time callbacks.

The following figure provides an overview of the implementation.

[![DynamoRIO Instrumentation Overview](../../assets/dr-instrumentation.png)](../../assets/dr-instrumentation.png)

1. `dr_client_main()` is responsible for installing the initial instrumentation callbacks to hook all relevant DR events (`module_load`, `bb_translation`, exceptions and the `exit` event)
2. `dr_client_main()` also sets the name of the function to instrument (passed by `cli.cpp`)
3. on `module_load`, the instrumentation checks for the presence of the target function in the loaded module. If found, the callback adds a `drwrap` callback (`event_instrumentation_start`) which will be executed at the start of the target function
4. once a call to the target function is found, the `event_instrumentation_start` will save the return address in a global object (`instrumented_func`) and call `start()` on the dispatcher
5. from that moment on, every translated basic block is instrumented by our client, in particular:
    - a `dispatch_callback()` is inserted before every instruction
    - at the function exit point (i.e. the previously saved return address) an `exit_callback` is inserted
6. these callbacks are executed at runtime with the following effects:
    - the `dispatch_callback()` implements the observation and execution clauses (see next section)
    - the `exit_callback()` checks the current speculation state before exiting:
        - speculative exits cause a rollback
        - architectural exit causes the instrumentation to stop

Finally, exceptions and the `exit` event are also forwarded to the Dispatcher:

- Speculative **exceptions** will cause a rollback, while architectural ones are forwarded to the target program
- The **exit** event stops instrumentation and flushes all logs (in case the exit callback has not been executed architecturally)

### Instrumentation Components

The instrumentation components modify the binary of the test case loader by adding a call to the function `dispatch_callback` before every instruction in the binary (or more specifically, every instruction in the `test_case_entry` function of the loader).

The tool interacts with DynamoRIO through the `model.cpp` module.
This module registers an event for entering the `test_case_entry`, which triggers the flush of the internal DynamoRIO code fragment cache and the start of instrumentation.
The module also registers an event for every instruction in the `test_case_entry`, and the event in turn calls the `Dispatch::instrument_instruction()`. Finally, exceptions are hooked and passed to the dispatcher through `Dispatch::handle_exception()`, which can decide to either handle the signal (e.g. on speculative paths) or forward it to the test case (e.g. architectural exceptions).

The `Dispatch` class implements the actual instrumentation logic.
When the `instrument_instruction()` method is called, it inserts a clean call to the `dispatch_callback` function before the instruction.
The call receives the PC and opcode of the instruction as arguments.
DynamoRIO also automatically saves the complete register state before the call, thus making it available to `dispatch_callback`.

### Execution-Time Components

The execution-time components are responsible for implementing the contract logic, and are triggered by the `dispatch_callback` function.
At the current state of the backend, the dispatch callback invokes only two classes, Tracer and Speculator, that implement the observation and execution clauses, respectively. Optionally, each component can log additional events, e.g.
speculation rollbacks or the current register state, through a shared `Logger` component.

Subclasses of `TracerABC` record contract-relevant information via `observe_instruction` and `observe_mem_access` methods.
E.g., `TracerCT` implements `CT` observation clause by recording the PC of instructions upon `observe_instruction` and the address of memory accesses upon `observe_mem_access`. Currently, `observe_exception` simply adds a special entry to the trace to indicate that the program ended due to an (architectural) exception.

Subclasses of `SpeculatorABC` implement the contract speculation logic.
E.g., `SpeculatorCond` implements `speculate_instruction`.
When this method is called with a branch instruction, the class takes a checkpoint of the process state, flips the branch condition (i.e., modifies the `FLAGS` register), and continues the execution.
During the simulated speculation, each call to `speculate_instruction` counts the number of executed instructions, and when the number reaches the limit (e.g., 256), the class restores the checkpoint and continues the execution from the original state. (Actually, the algorithm is more complex, but this is the general idea.)

When the instrumentation ends (according to `model.cpp`), the tracer's `tracing_finalized` method is called, during which any remaining traces are flushed into the trace file, together with an "End Of Trace" entry.
The Python adapter will then read the trace file, decode it, and return the corresponding CTrace to Revizor.

### Standalone Usage

The DR tool can be used as a standalone tool to collect the runtime trace of any program, independently from the rest of Revizor's infrastructure.

A typical usage is for example:

```shell
~/.local/dynamorio/drrun -c ~/.local/dynamorio/libdr_model.so --tracer <observation-clause> --speculator <speculation-clause> -- ls /dev/null
```

By default, this will instrument `ls` starting from `__libc_start_main` until the end of the program, run it with `/dev/null` as an argument, and generate a binary file called `rvzr_trace.dat` that contains the collected trace. Other flags can be printed using `~/.local/dynamorio/drrun -c ~/.local/dynamorio/libdr_model.so -h`

The trace file location can be changed by adding `--trace-output <PATH>`. Additionally, the tool can also dump the trace in human-readable format to STDOUT using the `--print-trace` flag.

To decode and analyze the trace file, downstream tools should always use the `TraceDecoder` class provided by `trace_decoder.py`. For internal usage, this module also provides a simple entrypoint for trace printing:

```bash
python3 trace_decoder.py rvzr_trace.dat
```

#### Debugging

Attaching a debugger like GDB to the DR tool might not always be the best debugging option, as the program has three separate states:

1. the state of the program being instrumented (e.g. `ls`)
2. the state of the DR client (`libdr_model.so`) instrumentation
3. the state of DynamoRIO itself (`drrun`)

More information about debugging DR clients can be found [here](https://dynamorio.org/page_debugging.html).

For our instrumentation, other (possibly simpler) options are available:

1. **Inspecting Debug Traces**: the DR tool can optionally log extra information, e.g. the complete state of the register file before each instruction, each value being read and written to memory, and speculation events like checkpoints and rollbacks, in a separate debug trace:
    - This option can be enabled using `--log-level <N>`
    - By default, the tool will dump debug entries to `rzvr_dbg_trace.dat` in binary format; to change the path of the debug trace file use `--debug-output <PATH>`
    - `--print-debug-trace` can be used to pretty-print debug entries to STDOUT during execution
    - `trace_decoder.py` also provides a decoder for debug entries
    - **WARNING:** debug traces can become very big, especially for nested speculation
2. **Running DynamoRIO with logging**: DynamoRIO can also produce logs (see DR documentation):

```
~/.local/dynamorio/drrun -debug -loglevel 3 -c ~/.local/dynamorio/libdr_model.so --tracer <observation-clause> --speculator <speculation-clause> -- ls /dev/null
```


================================================
FILE: docs/internals/model-backends/model-unicorn.md
================================================
# Unicorn Backend

Unicorn backend architecture:

```text
UnicornModel (main orchestrator)
  ├─ UnicornTracer            Records observations (PC, memory addresses, etc.)
  ├─ UnicornSpeculator        Simulates speculative execution
  ├─ UnicornTaintTracker      Tracks data flow for boosted input generation
  ├─ ExtraInterpreter         Handles features Unicorn doesn't support
  └─ InstructionCoverage      Tracks which instructions were tested
```

Key components:

- `UnicornModel`:   Manages the emulator and coordinates components through hooks on instruction and memory events.
- `UnicornTracer`:   Implements the observation clause of the contract. Different tracers record different information (program counters, memory addresses, data values).
- `UnicornSpeculator`:   Implements the speculation clause using checkpoint-rollback mechanisms. When speculation triggers (branch misprediction, CPU exception), it saves state and executes speculatively up to a window limit (default 250 instructions). It rolls back on serializing instructions or window expiration.
- `UnicornTaintTracker`:   Performs dynamic taint analysis to identify which input bytes affect the contract trace. Used for boosted input generation.


================================================
FILE: docs/intro/01-overview.md
================================================
# Revizor at a Glance

## What is Revizor?

Revizor is a security-oriented fuzzer that detects microarchitectural information leaks in CPUs—the vulnerabilities behind attacks like Spectre and Meltdown. It tests processors "blindly," requiring no prior knowledge of specific flaws or hardware internals. Instead, it compares actual CPU behaviour against a [*leakage contract*](../glossary.md#speculation-contract-aka-leakage-contract): a specification defining known sources of information leakage. Any discrepancy reveals a potential vulnerability.

## What Problems Does Revizor Solve?

Modern CPUs achieve their speed through speculative execution, out-of-order processing, complex caching, and other microarchitectural optimizations. These optimizations create side channels—timing variations, cache-state changes, buffer contentions—that can leak sensitive data. Such leaks are notoriously difficult to catch: they cause no crashes, depend on precise timing, and emerge only under specific conditions. Revizor automates the detection of these elusive side-channel leaks.

Specifically, Revizor addresses several key challenges:

* **Automated discovery**: Finding side-channel attacks manually demands deep (often undocumented) microarchitectural knowledge and extensive trial-and-error. Revizor automates this process, systematically exploring the CPU's behaviour by probing the microarchitecture with lots of automatically generated test cases.
* **Variant analysis**: Side-channel vulnerabilities spawn many variants. Revizor can search for new attack vectors that might bypass existing patches.
* **Validation of mitigations**: Vendor patches meant to close side channels have sometimes proven incomplete. Revizor verifies whether fixes actually eliminate the leakage.

## Quick Example: Detecting Spectre V1

To illustrate how Revizor works, consider a simple fuzzing campaign that will lead to a detection of a known vulnerability in most modern CPUs, namely Spectre V1.

!!! info "Prerequisites"
    Before running this example, ensure you have Revizor installed and set up correctly. Follow the [Installation Guide](02-install.md) if you haven't done so already.

We will use a configuration file in `demo/detect-v1.yaml`. This config file tells Revizor to test a small subset of x86-64 ISA (arithmetic instructions + conditional branches) against a contract that states that the CPU should not speculate and should only leak information about loads, stores, and the program counter. As most modern CPUs implement branch prediction, we expect to see a violation of this contract.

Run the fuzzer with the following command:

```bash
$ rvzr fuzz -s base.json -n 1000 -i 100 -c demo/detect-v1.yaml -w ./
```

After a short while, you should see output similar to this:

```
INFO: [prog_gen] Setting program_generator_seed to random value: 562112

INFO: [fuzzer] Starting at 14:00:51
13    ( 2%)| Stats: Cls:100/100,In:200,R:9,SF:5,OF:6,Fst:2...

================================ Violations detected ==========================
Violation Details:

-----------------------------------------------------------------------------------
                             HTrace                              | ID:71  | ID:171|
-----------------------------------------------------------------------------------
^................^..^.....^.....................^.....^......... | 599    | 0     |
^...................^.....^..................................... | 28     | 23    |
^................^..^.....^.......^...^......................... | 0      | 604   |


================================ Statistics ===================================

Test Cases: 14
Inputs per test case: 200.0
Violations: 1
Effectiveness:
  Total Cls: 100.0
  Effective Cls: 100.0
Discarded Test Cases:
  Speculation Filter: 5
  Observation Filter: 6
  Fast Path: 2
  Max Nesting Check: 0
  Tainting Check: 0
  Early Priming Check: 0
  Large Sample Check: 0
  Priming Check: 0

Duration: 52.1
Finished at 14:01:43
```

This message indicates that Revizor found a [violation](../glossary.md#violation) of the specified
contract, and the tool will store the corresponding
[violation artifact](../glossary.md#violation-artifact-aka-contract-counterexample) in
`./violation-<timestamp>/`.

What happened here is that Revizor generated a series of random
[test programs](../glossary.md#test-case-program), executed them on the target CPU and the
reference model that implements the contract, collected the side-channel observations on both sides,
and compared them. In this case, one of the generated test programs produced two different
[hardware traces](../glossary.md#hardware-trace-htrace) for two different inputs while the model
(contract) produced the same trace for both inputs. This discrepancy indicates that the CPU leaked
information through microarchitectural side channels in a way that violates the specified contract.

The corresponding program and the [inputs](../glossary.md#test-case-data-aka-test-case-input) are
stored in the violation artifact (`./violation-<timestamp>/`), and it will contain an assembly file
`program.asm` that surfaced a violation, a sequence of inputs `input_*.bin` to this program, and
some details about the violation in `report.txt`.

If we inspect the assembly code in `program.asm` and do an analysis of the violation, we will most likely find that it is a gadget that implements a typical Spectre V1 pattern: a conditional branch and a speculative memory access that leaks data through the cache. (This is the most likely outcome because the pattern is statistically very common for the given configuration). For example, the program may look like this (simplified for illustration):

```assembly
.section .data.main
...
jnp .bb_0.1  // conditional branch
jmp .exit_0
.bb_0.1:
    ...
    or byte ptr [r14 + rcx], al  // data-dependent memory access
    ...
.exit_0:
.test_case_exit:
```

!!! info "On violation analysis"
    This example was intentionally chosen to have a straightforward output that directly corresponds to a known vulnerability pattern. In practice, analyzing violations can be more complex, especially for novel or less understood leaks. We won't go into the details of the analysis here as it is a relatively complex topic; refer to [this guide](../howto/root-cause-a-violation.md) if you want to dive into the details.

The power of this approach is that Revizor doesn't need to know the specific vulnerability it's looking for. It simply tests whether the CPU matches the expected security specification. When it finds a discrepancy, that's a potential vulnerability worth investigating.

## What's Next?

Now that you understand what Revizor is and what it does, here are your next steps:

* **Dive Deeper into Concepts**: For a more detailed explanation of the information flow analysis used in Revizor, the concepts of leakage contracts, and other related topics, see the [Core Concepts Guide](03-primer.md).
* **Follow a Tutorial**: Our [step-by-step tutorial series](./04-tutorials.md) guides you through detecting your first vulnerability, understanding the results, and designing effective fuzzing campaigns.
* **Explore the Glossary**: Familiarize yourself with key terms and definitions in the [Glossary](../glossary.md) to better understand Revizor's terminology (we have quite a few unique terms!).
* **Get Help**: If you run into issues or have questions, visit our [FAQ](../faq/general.md) for common questions, or [ask a question](../howto/ask-a-question.md) to reach out to the community.


================================================
FILE: docs/intro/02-install.md
================================================
# Installation

**Warning**:
Revizor runs randomly-generated code in kernel space.
This means that a misconfiguration (or a bug) can crash the system and potentially lead to data loss.
Make sure you're not running Revizor on a production machine, and that you have a backup of your data.

### 1. Requirements

**Hardware**: x86-64 or ARM64 CPU. Specifically:

* All Intel and AMD x86-64 CPUs are supported.
* Some ARM CPUs are also supported, namely Microsoft Cobalt and Raspberry Pi. Other ARM CPUs may work, but are not officially supported.

**No virtualization**:
You will need a bare-metal OS installation.
Testing from inside a VM is not supported.

**OS**: The target machine has to be running Linux v4.15 or later.

### 2. Python Package

The preferred installation method is using `pip` within a virtual environment.
The python version must be 3.9 or later.

```bash
sudo apt install python3.9 python3.9-venv
/usr/bin/python3.9 -m pip install virtualenv
/usr/bin/python3.9 -m virtualenv ~/venv-revizor
source ~/venv-revizor/bin/activate
pip install revizor-fuzzer
```

### 3. Executor

In addition to the Python package, you will need to build and install the executor, which is a kernel module.

```bash
# building a kernel module requires kernel headers
sudo apt-get install linux-headers-$(uname -r) linux-headers-generic

# get the source code
git clone https://github.com/microsoft/side-channel-fuzzer.git

# build executor
cd side-channel-fuzzer/rvzr/executor_km
make uninstall  # the command will give an error message, but it's ok!
make clean
make
make install
```

### 4. (Optional) DynamoRIO Backend

If you want to use the DynamoRIO-based model, it has to be installed separately:

```bash
# install dependencies
sudo apt-get install cmake g++ g++-multilib doxygen git zlib1g-dev libunwind-dev libsnappy-dev liblz4-dev

# install DynamoRIO and the model
make -C rvzr/model_dynamorio

# check installation
~/.local/dynamorio/drrun -c ~/.local/dynamorio/libdr_model.so --list-tracers -- ls
# expected output:
#   ct
#   ...
#   /dev/null
```

### 5. Download ISA spec

```bash
rvzr download_spec -a x86-64 --extensions ALL_SUPPORTED --outfile base.json

# Alternatively, use the following command to include system instructions;
# however, mind that testing these instructions may crash the system if misconfigured!
# rvzr download_spec -a x86-64 --extensions ALL_AND_UNSAFE --outfile base.json
```

### 6. Test the Installation

To make sure that the installation was successful, run the following command:

```bash
./tests/quick-test.sh

# The expected output is:
Detection: OK
Filtering: OK
```

If you see any other output, check if the previous steps were executed correctly.
If you still have issues, please [open an issue](https://github.com/microsoft/side-channel-fuzzer/issues).


### 7. (Optional) System Configuration

External processes can interfere with Revizor's measurements.
To minimize this interference, we recommend the following system configuration:

* Disable Hyperthreading (BIOS option);
* Disable Turbo Boost (BIOS option);
* Boot the kernel on a single core (add `maxcpus=1` to [Linux boot parameters](https://wiki.ubuntu.com/Kernel/KernelBootParameters)).

If you skip these steps, Revizor may produce false positives, especially if you use a low value for [`executor_sample_sizes`](../ref/config.md#executor-configuration) for measurements.
However, a large sample size (> 300-400) usually mitigates this issue.


================================================
FILE: docs/intro/03-primer.md
================================================
# Primer: Speculation Contracts and Model-Based Relational Testing

Below is a brief primer on the theoretical foundations of speculation contracts and model-based relational testing—concepts that underlie the Revizor tool. This primer provides a high-level overview of the topic, introducing the concepts of noninterference, speculation contracts, and model compliance.

This document is intended for those new to the topic, particularly people without a background in information-flow analysis. For a more detailed and technical explanation, refer to the [original contracts paper](https://arxiv.org/pdf/2006.03841).

## Information-Flow Properties

We will start with the basics: the concepts of confidentiality and
[noninterference](../glossary.md#noninterference), which are fundamental to understanding how
[speculation contracts](../glossary.md#speculation-contract-aka-leakage-contract) work.

Traditionally, security mechanisms like access control and encryption have focused on protecting
data at rest or in transit. However, these mechanisms do not address the problem of
[**information flow**](../glossary.md#information-flow) within a system.
For example, consider a program that reads a secret input and then writes it to a public output, such as a web server that logs failed login attempts along with the username and masked password entered. Even if the program is secure in the sense that it does not allow unauthorized access to the secret data, it may still leak the secret through its public output, such as logging "User admin failed login with password starting with 'P@ss'" — revealing partial information about the secret password. This is where **information-flow security** comes into play.

Information-flow security is concerned with how data moves through a computation and how it can be observed by an attacker. The goal is to ensure that secret information does not leak to observers who are unauthorized to access it. An **end-to-end confidentiality policy** might be stated as: *“No secret input data can be inferred by an attacker through observations of system output.”* In other words, even if an adversary can see all public outputs of a computation, they should learn nothing about the secret inputs.

**Information-flow properties** generally classify program variables or inputs/outputs into security levels (e.g., `Secret` and `Public`). The key property for confidentiality is that *no information flows from Secret to Public.* But how can information flow? There are two primary routes:

- **Explicit flows:** These occur when confidential data is directly assigned or passed into a public variable or output. For example, in code, writing `public = secret` is an explicit flow from a secret variable to a public variable (an obvious violation of confidentiality). Any mechanism that directly transfers the bits of a secret into a publicly observable sink is an explicit flow. Such flows are usually straightforward to detect.

- **Implicit flows:** These occur indirectly, through the control structure of the program. An implicit flow arises when the *control path* taken by a program (e.g., which branch of an `if` or how many loop iterations) depends on a secret, thereby implicitly leaking information.

=== "Example 1: Implicit Flow"

:   Consider this pseudocode example:

    ```c
    if (Sec == 0) {
        Pub = 0;
    } else {
        Pub = 1;
    }
    ```

    Here `Sec` is a secret input and `Pub` is a public output. There is no direct assignment of `Sec` to `Pub`. However, an observer of `Pub` can deduce information about `Sec`. In fact, this program sets `Pub` to 0 if `Sec` was 0; otherwise, it sets `Pub` to 1—effectively copying the one-bit information “is Sec zero?” into `Pub`. This is an implicit flow of information from `Sec` to `Pub` through the control structure (the `if` condition on `Sec`).


## Noninterference: Definition and Examples

**Noninterference** is a formal property that captures the idea of perfect confidentiality: changes in secret data have *no observable effect* on public outputs. This property can be formalized as: *"a system is noninterferent if variations in Secret inputs cause no differences in Public outputs"*. Equivalently, confidential inputs do not interfere with the publicly visible state of the system.

To make this more concrete, imagine we run a program twice with two different secret inputs but the same public inputs. If **no attacker can distinguish** the two runs by observing anything public, then the program satisfies the noninterference property. The “attacker” here is assumed to have complete access to all public outputs, which are formalized as a function `PublicOut`:

```
output = PublicOut(Sec, Pub)
```

Noninterference essentially demands that for any two secrets `Sec1` and `Sec2` and any public input `Pub`, the program’s behavior from an attacker’s perspective is identical when run on `(Sec1, Pub)` versus `(Sec2, Pub)`:

=== "Definition 1: Noninterference"
:   A program `P` is noninterferent if, for all<br>public inputs `Pub` and all pairs of secret inputs `Sec1`, `Sec2` it holds that <br>`PublicOut(P, Sec1, Pub) = PublicOut(P, Sec2, Pub)`.

Here are some examples to illustrate this principle:

=== "Example 2: Interfering program"

:   Suppose our program simply copies a secret to output:

    ```c
    void copy(int* sec, int* output) {
        *output = *sec;
    }
    ```

:    Running it with two different secrets clearly yields different public outputs (e.g., `output` becomes 5 in one run and 7 in another). An attacker would distinguish these runs, so the program is **not** noninterferent—it blatantly leaks information.

---

=== "Example 3: Noninterfering program"

:   A trivial example of a noninterferent program is one that produces no output dependent on the secret. For instance:

    ```c
    void assign_zero(int* sec, int* output) {
        *output = 0;
    }
    ```

:    This program ignores secret `sec` entirely and always sets the public output `output` to 0. No matter what the secret input is, the public output is constant (0), so an attacker gains no information about `sec`. Indeed, any two runs are indistinguishable (both runs output 0). This satisfies noninterference (albeit by doing nothing useful with the secret).

---

=== "Example 4: Allowed benign dependency"

:   It is possible for a program to use secret data internally yet still be noninterferent as long as the final public outputs don’t reveal those secrets. For instance:

    ```c
    void mask_secret(int* sec, int* output) {
        int temp = *sec;
        temp = temp * 0;   // multiply secret by 0
        *output  = temp;
    }
    ```

:    Here the program *did* read the secret (`sec`) and even manipulated it, but it “washed out” the secret by multiplying by 0. The value assigned to `output` is always 0. From an external view, this is just like the previous example—no dependence of `output` on `sec`. Noninterference is concerned only with *what can be observed by the attacker*, not with whether the program internally used the secret. As long as any use of the secret eventually has no effect on outputs, the policy holds.

:   Naturally, this example is not useful either, as it does nothing with the secret. In practice, however, there are techniques to ensure noninterference while still making use of secret data for useful computations. We won't go into these techniques here as they are beyond the scope of this primer.

---

One important insight is that noninterference is relative to a given specification of what is “observable.” If you consider only the functional outputs as observable, a program might be noninterferent in that model. But if in reality the attacker can observe more (e.g., the execution time of a program), then the program that was secure in theory might be insecure in practice. This leads us to examine how *side channels* break the assumptions of basic noninterference.

## Beyond Direct Outputs: Side Channels

The original works on information-flow properties focused on direct outputs of a program (e.g., writing to a file or a network socket). However, in practice, attackers can extract information from more than just the “official” outputs of a program. For example, the attacker might observe how long a computation takes or measure the power consumption of a device. These additional sources of information are called **side channels**. Side channels are unintended channels through which secret data can be inferred by observing the system’s behavior, even if the direct outputs are secure.

These side channels can reveal information about the secret inputs, and so we must include them in the definition of noninterference. Similarly to how we defined `PublicOut(Sec, Pub)` as the observable output, we can define `Trace` as the observable side-channel information for a given program `P`.

```
trace = Trace(P, Sec, Pub)
```

For example, a trace might be the execution time of the program or its cache access pattern.

Noninterference then requires that the traces of two runs with different secrets - `(Sec1, Pub)` versus `(Sec2, Pub)` - are indistinguishable to an attacker. This is a stronger requirement than just looking at the functional outputs.

=== "Definition 2: Side-Channel Noninterference"
:   Given a side channel that produces a trace `Trace`, a program `P` is noninterferent with respect to this side channel if, for all public inputs&nbsp;`Pub` and all pairs of secret inputs `Sec1`, `Sec2` it holds that <br>`Trace(P, Sec1, Pub) = Trace(P, Sec2, Pub)`.

Here are some examples of side channels and how they can violate noninterference:

=== "Example 5A: Timing side channel"

:   Consider a program that compares a password with a user’s input:

    ```c
    bool check_password(const char *attempt, const char *pswd) {
        for (int i = 0; i < length(pswd); i++) {
            if (attempt[i] != pswd[i]) {
                return false;  // mismatch found, return early
            }
        }
        return true; // all characters matched
    }
    ```

:   If the attacker can measure how long the function takes to reject a guess, they can infer the password one character at a time. This leakage surfaces as a violation of the noninterference property with respect to timing observations.

:   A counterexample to Definition 2 could be as follows: Let's say we use the same input on two different secrets:

:   - `input1={attempt="aaa", pswd="abc"}`
:   - `input2={attempt="aaa", pswd="aab"}`

:   The traces of these inputs will be:

:   - `trace1 = Trace(check_password, input1) = 1`
:   - `trace2 = Trace(check_password, input2) = 2`

:   These inputs constitute a violation of Definition 2, as `trace1 != trace2` even though the two inputs have the same public values.

---

=== "Example 5B: Timing side channel - Password length"

:   Noninterference is able to model different kinds of secret-dependent leaks. Let's take for example a patched version of the previous program:

    ```c
    bool check_password(const char *attempt, const char *pswd) {
        int len = min(length(attempt), length(pswd));
        bool same = true;
        for (int i = 0; i < len; i++) {
            same = same && (attempt[i] == pswd[i]); // all the loop is executed
        }
        return same;
    }
    ```

:   In this version there is no early-exit condition, yet the attacker is still able to infer the _length_ of the password through a side-channel. This is captured by the following counterexample:

:   - `input1={attempt="aaaaaa", pswd="b"}`, `trace1 = 1`
:   - `input2={attempt="aaaaaa", pswd="bbb"}`, `trace2 = 3`

:   Which shows that the program still violates Definition 2.

---

=== "Example 6: Cache side channel"

:   Consider a program that uses a secret value to index into an array, as in the following code:

    ```c
    int multiply(const char *array, int pub, int sec) {
        char x = array[sec];
        return x * pub;
    }
    ```

:   A co-located attacker could observe the cache access pattern of the program by using a Prime+Probe or Flush+Reload attack. Such traces can reveal the addresses accessed by the program and thus leak the secret value. This leakage would violate the noninterference property with respect to cache observations.

:   A violation could be surfaced by two inputs:

:   - `input1={array=0x10000, pub=1, sec=0x40}`
:   - `input2={array=0x10000, pub=1, sec=0x80}`

:   Let's assume that the cache line size is 64 bytes, and the cache is direct-mapped, meaning that the cache line ID is based on the memory access address `addr` as `line_id = (addr % 0x1000) // 0x40`. Since the array access in the first line of `multiply` will access two different addresses for the two inputs, they will also produce two different traces:

:   - `trace1 = Trace(multiply, input1) = ((0x10000 + 0x40) % 0x1000) // 0x40 = 1`
:   - `trace2 = Trace(multiply, input2) = ((0x10000 + 0x80) % 0x1000) // 0x40 = 2`

:   Since we have two inputs that match on the public values (`array` and `pub`) and differ only in the secret value `sec`, yet produce different cache traces, this constitutes a violation of Definition 2.

## Challenges of Side-Channel Noninterference

Despite its completeness, the above formalization of side-channel noninterference is too simplistic to faithfully capture the side effects of program execution on modern, highly optimized hardware, especially CPUs. There are two key challenges:

- *Challenge 1 - Noisy and Non-Deterministic Traces*: The traces observed by the attacker over a side channel are typically noisy, non-deterministic, and depend on the microarchitectural state of the CPU. For example, cache access patterns can be influenced by other programs running on the machine, the operating system and its interrupts, and can depend on microarchitectural buffers like store buffers or branch history tables. This means that the `Trace` function is not a simple deterministic function of the program inputs, but a complex function of many factors, some of which affect the result concurrently and in a non-deterministic fashion.

- *Challenge 2 - Unknown Side Channels*: Modern CPUs have a plethora of side channels, including cache timing, branch prediction, and many others. To ensure complete confidentiality, we need to check that the program does not leak information over *any* of them. This is a challenging task, as we do not know the full set of possible side channels when it comes to commercial hardware with proprietary microarchitectures. For example, a CPU might have an obscure microarchitectural optimization that vastly expands possibilities for information leaks, as was the case with Spectre and Meltdown vulnerabilities. Not including this optimization will undermine the noninterference analysis. Therefore, to test for noninterference comprehensively, we need a way to discover and reason about all possible side channels that could leak information.

The next two sections discuss how speculation contracts address these challenges.

## Speculation Contracts: Dealing with the Complexity of Modern Hardware

As a solution to the first challenge, Guarnieri et al. (2021) introduced the concept of **speculation contracts**. A speculation contract is a simplified and deterministic model of the hardware, designed to capture the information that a given program *could* leak over side channels when executed with the given inputs. The key term here is "could"—the contract is not meant to exactly predict the side-channel traces, but instead, it errs on the side of caution, overestimating the possible leaks to achieve deterministic and noise-free traces.

A speculation contract works by defining two key aspects for every instruction in the CPU's ISA:

1. [**Observation Clause**](../glossary.md#observation-clause): For each instruction that may have
an observable side effect, the contract declares an observation clause. It describes the data
exposed by the instruction.

2. [**Execution Clause**](../glossary.md#execution-clause): For each instruction whose semantics
may be affected by hardware optimizations (e.g., speculative execution), the contract declares an
execution clause. It describes the effect of such optimizations, but without specifying the exact
mechanism of the optimization.

At a high level, a contract implements a function `ContractTrace` that maps a program `P` and its
inputs `Sec, Pub` to a [contract trace](../glossary.md#contract-trace-ctrace) `ctrace`. It is
essentially a conservative approximation of the `Trace` function.

```
ctrace = ContractTrace(P, Sec, Pub)
```

The contract trace is a sequence of all data that is exposed when a program is executed according
to a contract. It captures the side-channel observations that *could be visible* if the CPU
followed the speculation contract's rules for a given program execution.

Accordingly, the noninterference property is redefined in terms of the contract trace:

=== "Definition 3: Contract Noninterference"

:   Given a contract that produces a contract trace&nbsp;`ContractTrace`, a program `P` is noninterferent with respect to this contract if,<br>for all public inputs&nbsp;`Pub` and all secret inputs `Sec1`, `Sec2`, it holds that <br>`ContractTrace(P, Sec1, Pub) = ContractTrace(P, Sec2, Pub)`.

The following examples illustrate how a contract can be used to model side-channel leaks on a CPU.

=== "Example 7: Memory Observation Contract, MEM-SEQ"

:   Let's imagine a CPU with a shared data cache and no other optimizations (i.e., no speculation). A co-located attacker can recover the addresses of loads/stores by observing which of the cache sets changed their state via a cache timing side-channel attack (e.g., Prime+Probe). We can encode these expectations in an observation clause for loads and stores by specifying that they expose their address. Since the CPU does not speculate, the execution clause for all instructions is empty. We call this contract MEM-SEQ (memory leakage with sequential execution), and it can be summarized as a table:

    |       | Observation Clause | Execution Clause |
    | ----- | ------------------ | ---------------- |
    | Load  | Expose Address     | -                |
    | Store | Expose Address     | -                |
    | Other | -                  | -                |

:   Note that MEM-SEQ intentionally overestimates the leaks by assuming that the attacker observes complete addresses of loads/stores (in contrast to a subset of bits that are actually leaked in practice) and that *all* loads/stores are observable (in reality, they might be masked by noise or other factors). This overestimation is intentional to ensure that the contract is conservative and captures all possible corner cases.

:   Let's now consider how we can produce a contract trace using MEM-SEQ. We will use a slightly modified version of the `multiply` function from Example 6:

    ```c
    int multiply(const char *array, int pub, int sec) {
        char x = array[sec];   // MEM-SEQ exposes: &array[sec]
        char y = array[pub];   // MEM-SEQ exposes: &array[pub]
        return x * y;
    }
    ```

:   The inputs are:

:   - `input1 = {array=0x10000, pub=1, sec=2}`
:   - `input2 = {array=0x10000, pub=1, sec=3}`

:   The model collects a trace by executing the program line-by-line according to the rules in the table above (in practice, this is usually done using a modified CPU emulator). The first line has a load from memory, so the model records the address `&array[sec]` as exposed. The second line has another load, so the model records the address `&array[pub]` as exposed. The contract traces for this program would be:

:   - `ctrace1 = ContractTrace(multiply, input1) = [0x10002, 0x10001]`
:   - `ctrace2 = ContractTrace(multiply, input2) = [0x10003, 0x10001]`

:   Finally, this model can be used to check for noninterference by comparing contract traces according to Definition 3. In this case, we have two inputs with matching public values and different secrets, and they produced different contract traces, `ctrace1 != ctrace2`. This constitutes a violation and means that the `multiply` function is not noninterferent with respect to MEM-SEQ.

---

=== "Example 8: Branch Prediction Contract, MEM-COND"

:   Now let's consider a more complex scenario, with a CPU that implements branch prediction—a common form of speculative execution. In this case, the CPU may incorrectly predict branch targets and execute instructions that are not part of the correct control flow. We can model this behavior in a contract by introducing an execution clause for conditional jumps that specifies the mispredicted target. To make the example useful, we will assume that the CPU also has a data cache, so the observation clause for loads and stores remains the same as in MEM-SEQ. We call this contract MEM-COND (memory leakage with conditional branch misprediction).

    |            | Observation Clause | Execution Clause  |
    |------------|--------------------|-------------------|
    | Load       | Expose Address     | -                 |
    | Store      | Expose Address     | -                 |
    | Cond. Jump | -                  | Mispredict Target |
    | Other      | -                  | -                 |

:   As a target program we will use the following function:

    ```c
    int conditional_multiply(char *array, int pub, int sec) {
        int z = array[pub];   // MEM-COND exposes: &array[pub]
        if (z < 10) {         // MEM-COND mispredicts (assume z = 10)
            z *= array[sec];  // MEM-COND exposes: &array[sec]
        }
        return z;
    }
    ```

:   and a pair of inputs with the same public value but different secrets:

:   - `input1 = {array=0x10000, pub=1, sec=2}`
:   - `input2 = {array=0x10000, pub=1, sec=3}`

:   The first line of `conditional_multiply` has a load, so it exposes its address, `&array[pub]`. For the sake of this example, let's assume this load returns `10`, so the next branch is not supposed to be taken. However, according to MEM-COND, branches take the wrong target, so the model executes the third line anyway. This line is a load, so it exposes the address `&array[sec]`. After this, the program terminates, and the resulting traces are:

:   - `ctrace1 = ContractTrace(conditional_multiply, input1) = [0x10001, 0x10002]`
:   - `ctrace2 = ContractTrace(conditional_multiply, input2) = [0x10001, 0x10003]`

:   Again, the traces are different, so the program violates noninterference with respect to MEM-COND.
:   Notably, however, these two inputs would *not* violate noninterference with respect to MEM-SEQ, as the branch at line 2 would not be mispredicted, and the traces would be identical:

:    `ctrace_mem_seq1 = ctrace_mem_seq2 = [0x10001]`

## Building and Testing Speculation Contracts

Speculation contracts are typically built by hand, with the initial versions based on public knowledge of the CPU's microarchitecture and its side-channel vulnerabilities. However, in the case of commercial CPUs, the exact details of the microarchitecture are often proprietary and not publicly disclosed. In these cases, the contract could—and often will—be incomplete. This is where the testing of speculation contracts becomes crucial: the initial "draft" of a contract is tested against the real hardware to ensure that it captures all side-channel leaks that the CPU exhibits. If the contract misses something, it is refined based on the results of the testing, and the process is repeated until the contract is deemed safe to use.

But how do we test a speculation contract? A naive approach might be to directly compare the traces produced by the model with the traces collected from the real CPU for the same program and inputs. However, this approach is generally not feasible because the contract traces intentionally overestimate the hardware traces, so mismatches are expected. Moreover, the model might expose information differently than the real hardware (e.g., the model might expose load/store addresses, while the hardware exposes cache set indexes), meaning direct comparison is often impossible.

Instead, a more precise approach is to compare *the information contained in the traces*. The idea is to check that the information exposed by the model is a strict superset of the information exposed by the real hardware. This is done by verifying that all inputs producing identical contract traces for a given program also produce identical hardware traces. If this property holds for all possible programs and inputs (ignore the complexity question for now), then any program that is noninterferent with respect to the speculation contract is guaranteed to be noninterferent with respect to the real hardware. At this point, the model is safe to use as a proxy for real hardware when analyzing side-channel leaks.

To formalize this idea, let's introduce a new function `HardwareTrace` to denote the
[hardware trace](../glossary.md#hardware-trace-htrace) collected from the real hardware, and it
will take an extra argument `Ctx` to capture the fact that real-world hardware traces depend on
the microarchitectural state (e.g., on the state of branch predictors or caches).

=== "Definition 4: [Contract Compliance](../glossary.md#contract-compliance)"

:   A CPU complies with a speculation contract if, for all programs `P`, all input pairs
`(Sec1, Pub), (Sec2, Pub)`, and all initial microarchitectural states&nbsp;`Ctx`, if
`ContractTrace(P, Sec1, Pub) = ContractTrace(P, Sec2, Pub)`, then
`HardwareTrace(P, Sec1, Pub, Ctx) = HardwareTrace(P, Sec2, Pub, Ctx)`.


and conversely

=== "Definition 5: [Contract Violation](../glossary.md#violation)"

:   A CPU violates a speculation contract if there exists a program&nbsp;`P`, a microarchitectural
state&nbsp;`Ctx`, and two inputs `(Sec1, Pub), (Sec2, Pub)` such that
`ContractTrace(P, Sec1, Pub) = ContractTrace(P, Sec2, Pub)` and <br>
`HardwareTrace(P, Sec1, Pub, Ctx) != HardwareTrace(P, Sec2, Pub, Ctx)`.

We call the tuple `(P, Ctx, Sec1, Sec2)` a
[**contract counterexample**](../glossary.md#violation-artifact-aka-contract-counterexample). The
counterexample demonstrates that an adversary can learn more information from hardware traces than
what the contract specifies. A counterexample indicates a potential microarchitectural leakage
that was not accounted for by the contract. The goal of Revizor is to find such counterexamples.

## [Model-Based Relational Testing](../glossary.md#model-based-relational-testing-mrt) and Revizor

Revizor applies the principles above, and provides a framework for building executable speculation
contracts together with a mechanism to test real hardware (currently only CPUs) against these
contracts by searching for contract counterexamples, as in Definition 5. However, there are
certain issues that appear when the theory from the previous section is applied in practice, which
we had to address in Revizor.

The first issue is the search space: testing all possible programs and inputs is literally
impossible. We mitigate this issue by relying on a sampling-based approach, similar to fuzzing,
where we approximate the complete search space via random sampling. Specifically, Revizor generates
small (50-100 instructions long) programs, creates random inputs for them, collects both the
contract and hardware traces for these inputs, and checks whether any of the traces constitute a
contract counterexample. This process is called
[*Model-based Relational Testing*](../glossary.md#model-based-relational-testing-mrt), and it is
detailed further in the [Architecture Overview](../internals/architecture/overview.md).

This approach works well in practice because any given hardware optimization can typically be triggered by many different programs, and we need to find only one instance to detect a violation. Evidence of this is the [list of trophies](https://microsoft.github.io/side-channel-fuzzer/) that Revizor has already amassed.

The second issue we encountered is nondeterminism. As mentioned earlier, hardware traces can be non-deterministic due to various factors like interrupts or other programs running on the machine. To handle this, we use statistical methods: Revizor collects hardware traces for each program-input pair multiple times and then compares their distributions. If the distributions of the traces are statistically similar, Revizor considers the traces to be equivalent. This approach helps us account for noise in the hardware traces while still making reliable decisions about contract compliance.

For more details, see [Architecture Overview](../internals/architecture/overview.md).

## Conclusion

In this primer, we have introduced the concepts of noninterference, side channels, and speculation contracts, which all underlie the design of Revizor:

- The hardware fuzzer in Revizor uses speculation contracts and the concepts of noninterference (1) to detect unexpected side channels and dangerous microarchitectural optimizations in commercial CPUs, and (2) to aid in building sound leakage models for those CPUs.
- The software fuzzer in Revizor (*NOTE: currently under construction*) uses the leakage models produced by the hardware fuzzer, and applies the principles of noninterference testing to detect side-channel vulnerabilities in real-world software.

With these two components, we aim to provide a comprehensive tool for discovering and mitigating side-channel vulnerabilities in software, one that can handle even the most obscure and complex microarchitectural optimizations in modern hardware.

---

## Sources and Further Reading

- A. Sabelfeld and A. C. Myers. *Language-Based Information-Flow Security*. IEEE Journal on Selected Areas in Communications, 21(1), 2003. (Survey of information-flow security, implicit/explicit flows, covert channels, etc.)
- J. A. Goguen and J. Meseguer. *Security Policies and Security Models*. IEEE Symposium on Security and Privacy, 1982. (Origin of noninterference as a security policy formalism.)
- J. B. Almeida et al. *Verifying Constant-Time Implementations*. USENIX Security Symposium, 2016. (Constant-time programming principles and the ct-verif tool for automated verification.)
- M. Guarnieri, B. Köpf, J. Reineke, P. Vila. *Hardware-Software Contracts for Secure Speculation*. IEEE Symposium on Security and Privacy, 2021. (Original paper on speculation contracts.)
- O. Oleksenko, C. Fetzer, B. Köpf, M. Silberstein. *Revizor: Testing Black-box CPUs against Speculation Contracts*. ACM International Conference on Architectural Support for Programming Languages and Operating Systems (ASPLOS), 2022. (Paper describing Model-based Relational Testing and Revizor.)


================================================
FILE: docs/intro/04-tutorials.md
================================================
# Starting with Tutorials

Let's learn by example.

This is a starting point for a tutorial series that will teach you how to use Revizor for testing CPUs, from the most basic cases, to detection of Spectre and Meltdown, to building custom campaigns for detecting new vulnerabilities, and up to building custom extensions for Revizor for the most advanced cases.

!!! note "Prerequisites"
    Before proceeding with this tutorial, ensure that you have completed the installation steps outlined in the [Installation Guide](02-install.md).

!!! question "Need Help?"
    - **Questions about the tutorial?** Check the [FAQ](../faq/general.md) or open a [GitHub discussion](https://github.com/microsoft/side-channel-fuzzer/discussions)
    - **Found a bug?** Report it in [GitHub issues](https://github.com/microsoft/side-channel-fuzzer/issues)

### Let's get started!

Ready to dive in?

* [Tutorial 1](./tutorials/01-first-fuzz.md) - run your first fuzzing campaign with Revizor
* [Tutorial 2](./tutorials/02-first-vuln.md) - find your first microarchitectural vulnerability with Revizor
* [Tutorial 3](./tutorials/03-faults.md) - learn how to test faults and exceptions with Revizor
* [Tutorial 4](./tutorials/04-isolation.md) - explore how to test domain isolation boundaries
* [Tutorial 5](./tutorials/05-extending.md) - extend Revizor with custom features


================================================
FILE: docs/intro/start-here.md
================================================
# Getting started

New to Revizor? Or to side-channel testing in general? You came to the right
place: read this material to quickly get up and running.

## Introductory Materials

* [Revizor at a Glance](01-overview.md): Understand what Revizor is, what problems it solves, and see a quick example of violation detection.
* [Installation Guide](02-install.md): Get Revizor installed on your system and verify your setup.
* [Core Concepts](03-primer.md): Learn about contracts, traces, speculation, and other fundamental concepts needed to use Revizor effectively.
* [Tutorial Series](04-tutorials.md): Follow a series of hands-on tutorials that walk you through running your first tests, detecting violations, and ramp up all the way to root-cause analysis and design of custom campaigns.
* [Glossary](../glossary.md): A quick reference for key terms used throughout the documentation.

## Research

Interested in the academic research behind Revizor? Check out the papers listed in the [Research Papers](../ref/papers.md) section.

## Need Help?

[Ask a Question](../howto/ask-a-question.md) about Revizor if you need assistance or have any questions.


================================================
FILE: docs/intro/tutorials/01-first-fuzz.md
================================================
# Tutorial 1: Your First Fuzz

This is the first part of the tutorial on the basic usage of Revizor.

### Overview

In this first tutorial, we'll start with a baseline experiment to verify your Revizor installation and familiarize yourself with the basic workflow. This tutorial walks you through a simple fuzzing campaign that should find no violations.

The goal of this first campaign is verification, not vulnerability detection. We'll deliberately choose an instruction set that should not trigger speculation on Intel or AMD CPUs—specifically, simple arithmetic operations without any branches or memory speculation sources. Since there are no conditional branches to mispredict and no page faults to speculate around, we expect the CPU to execute sequentially without any speculative side effects.

This baseline is useful for two reasons. First, it confirms your installation is working correctly. If the fuzzer crashes or behaves unexpectedly, you'll know there's a setup issue rather than discovering problems later during more complex campaigns. Second, it establishes what "no violations" looks like, so you can recognize the difference when you do find a vulnerability in the next tutorial.

### Create your first configuration file

Revizor's behavior is controlled by a YAML configuration file that specifies which instructions to test and what contract to check against. Create a file named `config.yaml` with the following content:

```yaml
# tested instructions
instruction_categories:
  - BASE-BINARY

# prevent branch generation
max_bb_per_function: 1
min_bb_per_function: 1

# contract
contract_observation_clause: loads+stores+pc
contract_execution_clause:
  - no_speculation
```

Let's understand each section. The `instruction_categories` field tells Revizor which instructions to include in generated test cases. We're using `BASE-BINARY`, which includes only arithmetic and logical operations like `add`, `sub`, `and`, `xor`, and `mov`. These operations are data-processing instructions that don't involve control flow or special memory access patterns.

The `max_bb_per_function` and `min_bb_per_function` settings, both set to 1, ensure that Revizor generates programs with exactly one basic block—meaning no branches at all. This simplifies our test cases to pure arithmetic sequences, eliminating any possibility of branch misprediction.

The contract configuration section is set to use the simplest contract, CT-SEQ. This contract assumes nothing about the target CPU except the presence of CPU caches, making it a zero-knowledge baseline for detecting unknown vulnerabilities. With CT-SEQ, Revizor reports any information leaks beyond the most trivial non-speculative cache accesses.

For a complete reference of all configuration options, see the [Configuration Reference](../../ref/config.md).


### Run the Campaign

Let's run the fuzzer with your baseline configuration:

```bash
rvzr fuzz -s base.json -c config.yaml -n 100 -i 50 -w .
```

This command tells Revizor to execute 100 test cases (`-n 100`) with 50 inputs per test case (`-i 50`), using the ISA specification from `base.json` and your configuration file. The `-w .` flag specifies the working directory for saving any violations.

You'll see output similar to this:

```
INFO: [fuzzer] Starting at 14:32:18
100   (100%)| Stats: Cls:50/50,In:100,R:5,SF:0,OF:0,Fst:0,CN:0,CT:0,P1:0,CS:0,P2:0,V:0
================================ No Violations detected ===========================
```

The campaign should complete in under a minute with no violations detected. This is exactly what we expect—our simple arithmetic instructions don't trigger speculation, so the hardware behaves according to the strict sequential contract.

### Interpret the statistics

Let's examine the statistics line to understand what Revizor is reporting:

```
100   (100%)| Stats: Cls:50/50,In:100,R:5,SF:0,OF:0,Fst:0,CN:0,CT:0,P1:0,CS:0,P2:0,V:0
```

#### `100 (100%)`

This part shows we completed all 100 test cases. This number was continuously updated while the fuzzer was running.

#### `Cls:50/50`

These numbers indicate the number of [equivalence classes](../../glossary.md#contract-equivalence-class) formed by the inputs. The first number is the effective classes (> 1 input per class) and the second is the total number of classes.

If you don't understand what all of this means, that's ok. The only important factors are:

- if both numbers are equal (or at least close), and they are also equal to the number of inputs that you've set via `-i` command-line argument: everything is going well.
- if the numbers are different, it means either a misconfiguration or an issue with the input generator. Ensure that `input_per_class` config option is `> 1`.
- if the numbers are equal, but they are both considerably lower than the number of inputs set via `-i`: You're using an overly simple fuzzing configuration, and you're unlikely to find anything with it.

None of the issues above should happen if you're using the config file from this tutorial. If they do, double-check your installation.

#### `R:5`

This is an indirect indicator of the level of noise on the system. More concretely, it is the average sample size used by the executor. It is an adaptive number, which increases when the tool starts to encounter false positives caused by noise.

This number should be relatively small. If you see that it's going above 10-20 range, it is likely because something is polluting the measurements. Consider applying the suggestions [here](../02-install.md#7-optional-system-configuration).

#### `SF:0,OF:0,Fst:0,CN:0,CT:0,P1:0,CS:0,P2:0`

These numbers are the statistics on the effectiveness of various optimizations used by Revizor, such as speculation and observation filtering.

You can ignore these numbers for now, as they are useful only when you're trying to optimize performance of the fuzzer. If you're still curious, though, see the [Fuzzing Statistics Reference](../../ref/runtime-statistic.md).

### Understand what this means

The successful completion of this baseline campaign tells you several things. Your Revizor installation is working correctly—the fuzzer can generate test cases, execute them on your hardware, collect traces, and analyze the results. Your system is stable enough for fuzzing—there's no excessive noise preventing measurement. The kernel module loaded correctly and can execute test programs in the sandbox environment.

!!! success "Setup Verified"
    If you've successfully completed this baseline campaign with no violations, your Revizor installation is ready for real vulnerability detection. You can now proceed to Tutorial 2 with confidence.

!!! warning "Troubleshooting Common Issues"
    If the fuzzer crashes or produces errors, check these common problems:

    **Module not loaded**: Ensure the kernel module is loaded with `lsmod | grep rvzr_executor`. If not, run `cd rvzr/executor_km && make && sudo make install`.

    **Permission denied**: Revizor needs root privileges to access performance counters. Check that your user account on the system has `sudo` privileges.

    **ISA specification missing**: If you see "base.json not found", run `rvzr download_spec` first to download the instruction set specification.

### What's Next?

You've finished the first tutorial. Congrats!

If you're ready to go further and start detecting violations, proceed to [Tutorial 2](./02-first-vuln.md).


================================================
FILE: docs/intro/tutorials/02-first-vuln.md
================================================
# Tutorial 2: Detecting Your First Vulnerability

This tutorial is the first step into actual vulnerability detection. You'll learn how to set up a fuzzing campaign that tests conditional branches. And, most likely, it will end with a detection of Spectre V1.

### Testing Workflow

Before we begin with actual testing, let's take a step back and consider what a typical testing workflow looks like.

The process of using Revizor normally consists of the following steps:

1. **Design the campaign** by selecting which instructions to test and choosing an appropriate contract that defines what behavior we consider a violation.
2. **Create a configuration file** that captures these decisions.
3. **Run the fuzzer** to generate and execute random test cases.
4. **Validate the violation** to ensure it's genuine and not a false positive.
5. **Minimize the test case** to remove unnecessary complexity, making it easier to understand.
6. **Analyze the minimized program** to identify the root cause of the vulnerability.

In the following, we will go step-by-step through this workflow.

### Plan the campaign

Let's imagine we have a new CPU and want to determine if conditional branches produce any information leakage on it. These instructions are infamous for causing Spectre V1; therefore, it is always useful to start with them when testing a new CPU.

The first step is planning our fuzzing campaign strategically.

For effective testing, we'll focus on a minimal instruction subset rather than the entire ISA. Spectre V1 requires only two capabilities: conditional branches (to trigger misprediction) and memory accesses (to leak information through side channels). By limiting our instruction set to just arithmetic operations and conditional branches, we accomplish two goals. First, the fuzzer will find violations faster because there are fewer instruction combinations to explore. Second, when we do find a violation, it will be much easier to analyze because the test case will be simpler.

!!! warning
    Note that this focused approach is *not* representative of a real fuzzing campaign. This tutorial is intentionally simplified to help with understanding. In a real campaign, you'll need to find a balance between having a broad scope (increases chances of finding unknown vulnerabilities) and having focus on specific CPU features (simplifies root-cause analysis). For more guidance on campaign design, see [How to Design a Fuzzing Campaign](../../howto/design-campaign.md).

We'll pair this minimal instruction set with the strictest possible contract—one that forbids any speculation whatsoever. This means Revizor will flag any speculative behavior as a violation. While this contract is more restrictive than what modern CPUs actually guarantee, it's perfect for our purposes. Since we're only testing conditional branches and simple arithmetic, any speculation we detect will almost certainly be Spectre V1.

With this campaign plan, we are trying to answer a specific question: "Does this CPU leak information through conditional branches?"

### Create the configuration file

Now that we've planned our campaign, let's translate it into a configuration file. Create a YAML file with the following content:

```yaml
# tested instructions
instruction_categories:
  - BASE-BINARY
  - BASE-COND_BR

# contract
contract_observation_clause: loads+stores+pc
contract_execution_clause:
  - no_speculation

# enable perf. optimizations
enable_speculation_filter: true
enable_observation_filter: true
enable_fast_path_model: true
```

The `instruction_categories` section implements our decision to use a minimal instruction set. We're including `BASE-BINARY` for arithmetic operations like addition and comparison, and `BASE-COND_BR` for conditional branches like `jz` and `jne`. These two categories give the fuzzer everything it needs to express Spectre V1 patterns.

The contract configuration consists of two clauses. The `contract_observation_clause` tells Revizor what microarchitectural side effects to track. We're using `loads+stores+pc`, which observes memory access addresses and the program counter—exactly what an attacker would monitor through cache timing attacks. The `contract_execution_clause` defines what execution behavior is allowed. By setting it to `no_speculation`, we're telling Revizor that any speculative execution is a violation.

The performance optimization flags at the bottom significantly speed up fuzzing without affecting correctness. The `enable_speculation_filter` skips test cases that don't trigger speculation at all. The `enable_observation_filter` skips test cases that leave no observable traces. The `enable_fast_path_model` allows Revizor to reuse contract traces across similar inputs, reducing the model execution overhead.

For a complete reference of all configuration options, see the [Configuration Reference](../../ref/config.md).

### Run the fuzzer

Now we're ready to start fuzzing. Run Revizor with the following command:

```
./revizor.py fuzz -s base.json -c config.yaml -n 1000 -i 10 -w .
```

This command tells Revizor to run 1000 test cases (`-n 1000`), with 10 inputs per test case (`-i 10`), using the ISA specification from `base.json` (`-s`) and our configuration file (`-c`). The `-w .` flag tells Revizor to save any violations it finds to the current directory.

As the fuzzer runs, you'll see a continuously updating progress line:

```
50    ( 5%)| Stats: Cls:10/10,In:20,R:7,SF:38,OF:6,Fst:6,CN:0,CT:0,P1:0,CS:0,P2:0,V:0
```

### View the detected violation

After a minute or so, you should see a violation.
It will be reported in a format similar to this:

```
================================ Violations detected ==========================
Violation Details:

-----------------------------------------------------------------------------------
                             HTrace                              | ID:4   | ID:14 |
-----------------------------------------------------------------------------------
^......^...^........^.................^...........^............. | 626    | 0     |
^......^...^........^........................................... | 1      | 18    |
^^.....^...^........^....^...................................... | 0      | 609   |

```

Excellent! We've successfully detected a contract violation. Let's understand what this violation report is telling us.


The report shows us the violation details in a table format. The header row displays the input IDs that triggered the violation—in this case, inputs 4 and 14:

`| ID:4   | ID:14 |`

These are two inputs from our test case that the contract predicted would behave identically, but the hardware traces show they behaved differently.

The three rows below show the different hardware traces that were observed:

```
^......^...^........^.................^...........^.............
^......^...^........^...........................................
^^.....^...^........^....^......................................
```

Each row represents a distinct cache access pattern, visualized as a bitmap where `^` marks an accessed cache line and `.` marks an untouched cache line. We're using Prime+Probe cache side channel measurements (default), so each position in the bitmap corresponds to one of the 64 cache sets in the L1D cache. (A cache set is a group of cache lines that compete for the same position in the cache—when the CPU accesses memory at a particular address, the data goes into a specific cache set determined by the address bits.)

For example, the first trace reads like this:

```
Cache Set 0 accessed
|          Cache Set 11 accessed
|          |                          Cache set 38 accessed
|          |                          |
^......^...^........^.................^...........^.............
       |            |                             |
       |            |                             Cache Set 50 accessed
       |            Cache Set 20 accessed
       Cache Set 7 accessed
```

Finally, the numbers in the columns tell us how often each trace appeared for each input:

```
... | 626    | 0     |
... | 1      | 18    |
... | 0      | 609   |
```

Looking at the first hardware trace we see it appeared 626 times for input 4 but never for input 14. The third trace shows the opposite pattern—0 times for input 4 but 609 times for input 14. This clear separation in the distributions confirms this is a genuine violation, not random noise.

What we're seeing is a data-dependent cache access pattern. The test case accessed different cache lines depending on the input data, creating an observable side channel. We don't know yet what caused this channel, but we can already tell that it's likely to be caused by speculation; non-speculative cache accesses are permitted by our reference contract, so they wouldn't be reported as violations.

For more details on interpreting violation reports, see [How to Interpret Violation Results](../../howto/interpret-results.md).

### Violation Artifact

The artifact for this violation is stored in a directory named `violation-<timestamp>`:

```bash
$ ls -l violation-251203-103338
input_0000.bin  input_0004.bin  input_0008.bin  input_0012.bin  input_0016.bin  minimize.yaml    reproduce.yaml
input_0001.bin  input_0005.bin  input_0009.bin  input_0013.bin  input_0017.bin  org-config.yaml
input_0002.bin  input_0006.bin  input_0010.bin  input_0014.bin  input_0018.bin  program.asm
input_0003.bin  input_0007.bin  input_0011.bin  input_0015.bin  input_0019.bin  report.txt
```

The `program.asm` file holds the test case program that triggered the violation. The `input_*.bin` files contain the input sequence that exposed the leak. The `report.txt` file provides additional details including hardware and contract traces. The configuration files include `org-config.yaml` (the original configuration), `reproduce.yaml` (for reproducing the violation), and `minimize.yaml` (for test case minimization).

### Validate the violation

Let's verify this violation is genuine and reproducible. First, we'll move the violation artifacts to a simpler path:

```bash
mv violation-251203-103338 ./violation
```

Now we'll reproduce the violation using the saved artifacts:

```bash
./revizor.py reproduce -s base.json -c ./violation/reproduce.yaml -t ./violation/program.asm -i ./violation/input*.bin
```

If the violation is genuine, we should see Revizor report it again:

```
================================ Violations detected ==========================
Violation Details:

-----------------------------------------------------------------------------------
                             HTrace                              | ID:4   | ID:14 |
-----------------------------------------------------------------------------------
^......^...^........^.................^...........^............. | 626    | 0     |
^......^...^........^........................................... | 1      | 20    |
^^.....^...^........^....^...................................... | 0      | 607   |
```

Perfect! The hardware traces are roughly the same as before, confirming this is a stable, reproducible violation.

!!! tip "Dealing with False Positives"
    In most cases, violations are genuine. However, if you're on a high-noise system, you might occasionally see non-reproducible violations. If this happens, adjust the noise tolerance by increasing `analyser_stat_threshold` or `executor_sample_sizes` in your configuration file (see the [Configuration Reference](../../ref/config.md) for details), then rerun the fuzzer. Also, consider trying to mitigate the noise, for example by disabling hyperthreading or by turning prefetchers off.


### Minimize the test case

Now that we've confirmed the violation is real, let's simplify it for easier analysis. The minimizer will systematically remove unnecessary instructions while keeping the violation reproducible.

Use the following command. We won't go into its details now as they are irrelevant to this tutorial. If you're curious, check our [How to Minimize](../../howto/minimize.md) guide.

```bash
./revizor.py minimize -s base.json \
    -c ./violation/minimize.yaml -t ./violation/program.asm \
    -o ./violation/min.asm -i 10 --num-attempts 3 \
    --enable-instruction-pass 1 \
    --enable-simplification-pass 1 \
    --enable-nop-pass 1 \
    --enable-constant-pass 1 \
    --enable-mask-pass 1 \
    --enable-label-pass 1
```

We'll see the minimization progress as it works through multiple passes:

```
[PASS 1] Reproducing the violation
  > Violation reproduced. Proceeding with minimization
  > Violating input IDs: [4, 14]
[INFO] Minimization attempt 1/3
[PASS 2] Instruction Removal Pass

........---...--
[PASS 3] Instruction Simplification Pass

--..-
[PASS 4] NOP Replacement Pass

(and so on...)
```

This process typically takes 5-10 minutes. Each `.` indicates a failed removal attempt (the violation disappeared), while each `-` shows a successful simplification (the violation persisted with fewer instructions). After it finishes, we'll find the minimized program in `./violation/min.asm`.

``` asm
.intel_syntax noprefix
.section .data.main
.function_0:
.macro.measurement_start: nop qword ptr [rax + 0xff]
add al, -118 # instrumentation
and rdi, 0b1111111111100 # instrumentation
adc al, byte ptr [r14 + rdi]
mov rax, -1332388169
imul eax, eax, -75
and rcx, 0b1111111111000 # instrumentation
add dword ptr [r14 + rcx], eax
and rax, 0b1111111111000 # instrumentation
imul qword ptr [r14 + rax]
and rcx, 0b1111111000000 # instrumentation
lock inc qword ptr [r14 + rcx]
and rdi, 0b1111111111000 # instrumentation
add byte ptr [r14 + rdi], al
sub dl, al
jp .bb_0.1
jmp .exit_0
.bb_0.1:
and rbx, 0b1111111111000 # instrumentation
cmp dword ptr [r14 + rbx], eax
and rdi, 0b1111111111000 # instrumentation
cmp qword ptr [r14 + rdi], rbx
and rbx, 0b1111111000000 # instrumentation
lock sub word ptr [r14 + rbx], dx
and rbx, 0b1111111111000 # instrumentation
dec word ptr [r14 + rbx]
and rsi, 0b1111111111000 # instrumentation
neg qword ptr [r14 + rsi]
and rbx, 0b1111111111000 # instrumentation
adc ax, word ptr [r14 + rbx]
.exit_0:
.macro.measurement_end: nop qword ptr [rax + 0xff]
.section .data.main
.test_case_exit:nop
```

Let's verify the minimized program still triggers the violation:

``` bash
$ ./revizor.py reproduce -s base.json -c ./violation/reproduce.yaml -t ./violation/min.asm -i ./violation/input*.bin

INFO: [prog_gen] Setting program_generator_seed to random value: 112509

INFO: [fuzzer] Starting at 11:04:52
> Entering slow path...> Priming  1             > Increasing sample size... to 50> Increasing sample size... to 100> Increasing sample size... to 500> Priming  1

================================ Violations detected ==========================
Violation Details:

-----------------------------------------------------------------------------------
                             HTrace                              | ID:5   | ID:15 |
-----------------------------------------------------------------------------------
^^................^..^.......................................... | 404    | 15    |
^^.........^....^.^..^.......................................... | 223    | 0     |
^^................^..^.......^....................^............. | 0      | 612   |
```

Excellent! The violation still reproduces with the minimized program. We've successfully reduced the test case while preserving the vulnerability.

The program is still fairly complex, though. Let's run input minimization to identify exactly which values are being leaked.

### Analyze the leak through input minimization

```bash
$ ./revizor.py minimize -s base.json -c ./violation/minimize.yaml -t ./violation/min.asm -o ./violation/min.asm -i 25  --input-outdir ./violation/min-inputs \
    --enable-input-diff-pass 1 \
    --enable-input-seq-pass 1 \
    --enable-instruction-pass false
```

Among other information, the minimizer prints the leaked values:

```
  > Minimizing the difference between inputs 2 and 3

Address    +0x0     +0x40    +0x80    +0xc0    +0x100   +0x140   +0x180   +0x1c0
0x00000000 ........ ....=... ........ ........ ........ ........ ........ ........
0x00000200 ........ ........ ........ ........ ........ ........ ........ ........
0x00000400 ........ ........ ........ ........ ........ ........ ........ ........
0x00000600 ........ ........ ........ ........ ........ ........ ........ ........
0x00000800 ........ ........ ........ ........ ........ ........ ........ ........
0x00000a00 ........ ........ ........ ........ ........ ........ ........ ........
0x00000c00 ........ ........ ........ ........ ........ ........ ........ ........
0x00000e00 ........ ........ ........ ........ ........ ........ ........ ........
0x00001000 ........ ........ ........ ........ ........ ........ ........ ........
0x00001200 ........ ........ ........ ........ ........ ........ ........ ........
0x00001400 ........ ........ ........ ........ ........ ........ ........ ........
0x00001600 ........ ........ ........ ........ ........ ........ ........ ........
0x00001800 ........ ........ ........ ........ ........ ........ ........ ........
0x00001a00 ........ ........ ........ ........ ........ ........ ........ ........
0x00001c00 ........ ........ ........ ........ ........ ........ ........ ........
0x00001e00 ........ ........ ........ ........ ........ ........ ........ ........
0x00002000 ....^...
0x00002040 ........ ........ ........ ........
  > Result: Leaked 1 bytes
  > Addresses: ['0x2020']
```

There are two bits of information that we learn from here:

- Most of the input has been successfully zeroed-out (`.`). This means it is likely irrelevant to the leak.
- The only non-zero byte is at address `0x2020` (marked with `^`). This is likely the leaked byte.

To understand how this address maps to the test case, we need to look at the layout of the input: [here](../../ref/artifact-file-formats.md). We can see that the leak is within the GPR region of actor 0 (the only actor in this test case). Specifically, 0x2020 - 0x2000 = 0x20, is the offset used to initialize RSI (GPRs are ordered as: `rax`, `rbx`, `rcx`, `rdx`, `rsi`, `rdi`, `flags`, `rsp`).

Now we just need to find how the test case uses RSI (possibly speculatively), and we will have a good idea of the root-cause of the leak.

Let's inspect the minimized program in `./violation/min.asm`:

``` asm linenums="1"
.intel_syntax noprefix
.section .data.main
.function_0:
.macro.measurement_start: nop qword ptr [rax + 0xff]
add al, -118
and rdi, 0b1111111111100
adc al, byte ptr [r14 + rdi]
# mem access: [5] 0x1578 cl 21:56 | [15] 0x1578 cl 21:56
mov rax, -1332388169
imul eax, eax, -75
and rcx, 0b1111111111000
add dword ptr [r14 + rcx], eax
# mem access: [5] 0x2498-0x2498 cl 18:24 | [15] 0x2498-0x2498 cl 18:24
and rax, 0b1111111111000
imul qword ptr [r14 + rax]
# mem access: [5] 0x1060 cl 1:32 | [15] 0x1060 cl 1:32
and rcx, 0b1111111000000
lock inc qword ptr [r14 + rcx]
# mem access: [5] 0x2480-0x2480 cl 18:0 | [15] 0x2480-0x2480 cl 18:0
and rdi, 0b1111111111000
add byte ptr [r14 + rdi], al
# mem access: [5] 0x1578-0x1578 cl 21:56 | [15] 0x1578-0x1578 cl 21:56
sub dl, al
jp .bb_0.1
jmp .exit_0
.bb_0.1:
and rbx, 0b1111111111000
cmp dword ptr [r14 + rbx], eax
and rdi, 0b1111111111000
cmp qword ptr [r14 + rdi], rbx
and rbx, 0b1111111000000
lock sub word ptr [r14 + rbx], dx
and rbx, 0b1111111111000
dec word ptr [r14 + rbx]
and rsi, 0b1111111111000
neg qword ptr [r14 + rsi] # <<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<< HERE: RSI is used here
and rbx, 0b1111111111000
adc ax, word ptr [r14 + rbx]
.exit_0:
.macro.measurement_end: nop qword ptr [rax + 0xff]
.section .data.main
.test_case_exit:nop
```

We can see that RSI is used in the instruction at line 36:

``` asm
neg qword ptr [r14 + rsi]
```

That already gives most of the information we need. We can see a clear Spectre V1 pattern here:

1. There is a conditional branch at line 24 (`jp .bb_0.1`)
2. And a load of a previously-unused value on a mispredicted path (line 36)

To verify that, let's inspect the actual value of RSI in the violating inputs (inputs 2 and 3 according to the minimizer output above). We can use `hexdump` for that:

``` bash
$ hexdump -C ./violation/min-inputs/min_input_0002.bin | grep 2020
00002020  93 22 00 00 93 22 00 00  00 00 00 00 00 00 00 00  |."..."..........|
$ hexdump -C ./violation/min-inputs/min_input_0003.bin | grep 2020
00002020  40 00 00 00 40 00 00 00  00 00 00 00 00 00 00 00  |@...@...........|
```

So the values of RSI were:

- Input 2: `rsi=0x0000229300002293`
- Input 3: `rsi=0x0000004000000040`

These values were masked by the instruction at line 35:

``` asm
and rsi, 0b1111111111000 # instrumentation
```

Which means that the values of RSI used in memory accesses at line 36 were:

- Input 2: `0x0000229300002293 & 0b1111111111000 = 0x290`
- Input 3: `0x0000004000000040 & 0b1111111111000 = 0x040`

All memory accesses within the test case are relative to `r14`, which is page-aligned and points to the base of the sandbox memory.

Therefore, we can calculate the ID of the cache lines accessed by the instruction at line 36 as follows:

- Input 2: cache line ID = `0x290 // 0x40 = 0xa = 10`
- Input 3: cache line ID = `0x040 // 0x40 = 0x1 = 1`

So, if our hypothesis is correct, we should see that in the hardware trace of the violation, cache lines 10 and 1 were accessed when executing inputs 2 and 3, respectively. Let's verify it by running rvzr in the reproduce mode:

```
$ ./revizor.py reproduce -s base.json -c ./violation/reproduce.yaml -t ./violation/min.asm -i ./violation/min-inputs/min_input_*.bin

-----------------------------------------------------------------------------------
                             HTrace                              | ID:2   | ID:3  |
-----------------------------------------------------------------------------------
^^........^..................................................... | 626    | 0     |
^^.............................................................. | 1      | 627   |

```

The first hardware trace (dominant for input 2) is:

```
^^........^.....................................................
||        |
||        Cache set 10 accessed
|Cache set 1
Cache set 0 accessed
```

The second hardware trace (dominant for input 3) is:

```
^^..............................................................
||
| Cache set 1 accessed
Cache set 0 accessed
```

Indeed, we see that our hypothesis is correct! The instruction at line 36 accessed different cache lines depending on the value of RSI, and this access happened speculatively, after the conditional branch at line 24 was mispredicted.

This tells us that the root-cause of the leak was misprediction of a conditional branch that led to a speculative leak of a value (RSI) through a data access.

### Summary

Congratulations! We've successfully detected and analyzed a Spectre V1 vulnerability from start to finish.

!!! success "What We've Learned"
    In this section, we've walked through the complete workflow for detecting speculative execution vulnerabilities:

    - **Strategic planning**: Choosing a minimal instruction set and appropriate contract focused our search
    - **Violation detection**: Revizor found the vulnerability automatically in under two minutes
    - **Validation**: Reproduction confirmed the violation was genuine and stable
    - **Minimization**: We reduced a complex test case to its essential components
    - **Root-cause analysis**: By examining register values and cache access patterns, we identified the exact mechanism of the leak

    This same workflow applies to discovering and analyzing any speculative execution vulnerability.

### What's Next?

Proceed to [Tutorial 3](./03-faults.md) to see how the same principles can be applied to detect more complex vulnerabilities based on CPU exceptions and faults.


================================================
FILE: docs/intro/tutorials/03-faults.md
================================================
# Tutorial 3: Testing faults with Revizor

Having detected Spectre V1, let's now apply the same methodology to find a different vulnerability class. Meltdown-style vulnerabilities exploit speculative execution around exception handling rather than branch misprediction.

!!! important
    This tutorial relies on knowledge of sandboxed execution and the memory layout of the sandbox. If you haven't read about it yet, please refer to the [Sandbox Reference](../../ref/sandbox.md) and the [Actors and Isolation Topic Guide](../../topics/actors.md) before proceeding.

### Plan the campaign

The key difference in this campaign is the speculation source. Instead of conditional branches, we'll test page faults. Meltdown and related vulnerabilities occur when a CPU speculatively executes instructions that follow a faulting memory access, potentially leaking data from inaccessible memory regions.

From the practical standpoint, the key difference is that we will need to configure the [sandbox](../../ref/sandbox.md) to make it possible for the test case to trigger page faults. Namely, we will make one of the pages accessible by the test cases non-readable.

### Create the configuration file

Our configuration for this campaign makes three important changes from the Spectre V1 setup. First, we remove `BASE-COND_BR` from the instruction categories since we already know conditional branches cause Spectre V1 violations. This focuses our testing on other speculation sources.

Second, we add an `actors` section with `data_properties` to configure the sandbox memory layout. Revizor's sandbox allocates each actor two 4KB memory regions: a main area with normal read-write permissions and a faulty area where we can configure special permissions. By setting `present: false` in the data properties, we mark the faulty area as non-present in the page tables. When the test case attempts to access this region, the CPU will raise a page fault, giving us the exception-based speculation source we want to test.

Third, we change the contract execution clause to `delayed-exception-handling`. Modern CPUs implement out-of-order execution, so data-independent instructions after a fault may execute before the exception is recognized. This is expected behavior and would cause trivial violations under the strict `no_speculation` contract. The `delayed-exception-handling` clause accommodates this expected speculation, allowing Revizor to focus on more interesting leaks. For more details on contract selection, see [How to Choose a Contract](../../howto/choose-contract.md).

```yaml
# contract
contract_observation_clause: loads+stores+pc
contract_execution_clause:
  - delayed-exception-handling

# tested instructions
instruction_categories:
  - BASE-BINARY
  # - BASE-COND_BR

actors:
  - main:
    - data_properties:
      - present: false

enable_speculation_filter: true
enable_observation_filter: true
enable_fast_path_model: true
```


### Run the fuzzer

With the configuration ready, let's run the fuzzer.

```
$ ./revizor.py fuzz -s base.json -c dbg/tut/2.yaml -n 1000 -i 20 -w .

INFO: [fuzzer] Starting at 12:05:26
66    ( 7%)| Stats: Cls:19/19,In:40,R:19,SF:0,OF:0,Fst:6,CN:60,CT:0,P1:0,CS:0,P2:0,V:0
```

Notice in the statistics that `SF:0,OF:0`—unlike the Spectre V1 campaign, none of our test cases are filtered by the speculation or observation filters since every test case with a page fault exhibits speculation.

Eventually (after a few minutes), Revizor detects a violation:

```
================================ Violations detected ==========================
Violation Details:

-----------------------------------------------------------------------------------
                             HTrace                              | ID:3   | ID:23 |
-----------------------------------------------------------------------------------
^^.^.......^.........^..^.........................^............^ | 627    | 0     |
^^.^...^...^............^.........................^............^ | 0      | 627   |

```

The output is similar to what we saw in the Spectre V1 campaign, so we won't go into the details of reading the violation report again. The key takeaway is that we've successfully detected a contract violation, and the hardware traces show different cache access patterns for the two inputs.

### Validate the violation

As before, we validate the violation by reproducing it:

```
$ ./revizor.py reproduce -s base.json -c ./violation/reproduce.yaml -t ./violation/program.asm -i ./violation/input*.bin
```

The output should be similar to the original:

```
================================ Violations detected ==========================
Violation Details:

-----------------------------------------------------------------------------------
                             HTrace                              | ID:3   | ID:23 |
-----------------------------------------------------------------------------------
^^.^.......^.........^..^.........................^............^ | 627    | 0     |
^^.^...^...^............^.........................^............^ | 0      | 627   |
```

Great! The violation reproduces successfully, confirming it's genuine.


### Minimize the test case

Now we minimize the test case to make it easier to analyze:

```
./revizor.py minimize -s base.json -c ./violation/minimize.yaml -t ./violation/program.asm  -o ./violation/min.asm -i 10 --num-attempts 3 \
    --enable-instruction-pass 1 \
    --enable-simplification-pass 1 \
    --enable-nop-pass 1 \
    --enable-constant-pass 1 \
    --enable-mask-pass 1 \
    --enable-label-pass 1
```

After the minimization completes, verify that the minimized program still reproduces the violation:

```
./revizor.py reproduce -s base.json -c ./violation/reproduce.yaml -t ./violation/min.asm -i ./violation/input*.bin

INFO: [prog_gen] Setting program_generator_seed to random value: 578824

INFO: [fuzzer] Starting at 12:14:08
> Entering slow path...> Priming  6             > Increasing sample size... to 50> Increasing sample size... to 100> Increasing sample size... to 500> Priming  6

================================ Violations detected ==========================
Violation Details:

-----------------------------------------------------------------------------------
                             HTrace                              | ID:11  | ID:31 |
-----------------------------------------------------------------------------------
^^.^.......^...^........^.........................^...^........^ | 627    | 0     |
^^.^.......^...^........^.........................^............^ | 0      | 627   |
```

### Identify the leaked value

Next, we minimize the inputs to identify which specific values are being leaked:

```
./revizor.py minimize -s base.json -c ./violation/minimize.yaml -t ./violation/min.asm -o ./violation/min.asm -i 10 --input-outdir ./violation/min-inputs \
    --enable-input-diff-pass 1 \
    --enable-input-seq-pass 1 \
    --enable-comment-pass 1 \
    --enable-instruction-pass false

(skipping output for brevity)
  > Minimizing the difference between inputs 0 and 1

Address    +0x0     +0x40    +0x80    +0xc0    +0x100   +0x140   +0x180   +0x1c0
0x00000000 ........ ........ ........ ........ ........ ........ ........ ........
0x00000200 ........ ........ ........ ........ ........ ........ ........ ........
0x00000400 ........ ........ ........ ........ ........ ........ ........ ........
0x00000600 ........ ........ ........ ........ ........ ........ ........ ........
0x00000800 ........ ........ ........ ........ ........ ........ ........ ........
0x00000a00 ........ ........ ........ ........ ........ ........ ........ ........
0x00000c00 ........ ........ ........ ........ ........ ........ ........ ........
0x00000e00 ........ ........ ........ ........ ........ ........ ........ ........
0x00001000 ........ ........ ........ ........ ........ ........ ........ ........
0x00001200 ........ ........ ........ ........ ........ ........ ........ ........
0x00001400 ........ ........ ........ ........ ........ ........ ........ ........
0x00001600 ........ ........ ........ ........ ........ ........ ........ ........
0x00001800 ........ ........ ........ ........ ........ ........ ........ ........
0x00001a00 ........ ........ ........ ........ ........ ........ ........ ........
0x00001c00 ........ ........ ........ ........ ........ ........ ........ ........
0x00001e00 ........ ........ ........ ........ ........ ........ ........ ........
0x00002000 ..=.=^..
0x00002040 ........ ........ ........ ........
  > Result: Leaked 1 bytes
  > Addresses: ['0x2028']
  > Saving new inputs in '/home/t-oleksenkoo/revizor/violation/min-inputs'
  > Violating input IDs: [5, 15]
```

Key takeaways:

- The leaked value originates from address `0x2028` in the input, which corresponds to offset `0x28` in the GPR initialization region of the sandbox memory, used to initialize the `RDI` register.
- Two other values in the input were not zeroed out, which indicates they are somehow relevant to triggering the violation. Namely, those are offsets `0x10` and `0x20`, which correspond to `RCX` and `RSI`.

### Perform root-cause analysis

With the minimized program and inputs, we can now investigate the root cause. The minimized program is as follows:

``` asm linenums="1"
.intel_syntax noprefix
.section .data.main
.function_0:
.macro.measurement_start: nop qword ptr [rax + 0xff]
and rsi, 0b1111111111000 # instrumentation
add rdi, qword ptr [r14 + rsi]
add cl, dl
and rcx, 0b1111111111000 # instrumentation
add qword ptr [r14 + rcx], rbx
and rbx, 0b1111111111000 # instrumentation
add dword ptr [r14 + rbx], ecx
and rax, 0b1111111111000 # instrumentation
cmp dword ptr [r14 + rax], ecx
and rdi, 0b1111111111000 # instrumentation
or byte ptr [r14 + rdi], 1 # instrumentation  # <<<<<<<<<<<<<<< HERE: RDI is used here
mov ax, 1 # instrumentation
div byte ptr [r14 + rdi]                      # <<<<<<<<<<<<<<< HERE: RDI is used here
and rsi, 0b1111111111000 # instrumentation
sub byte ptr [r14 + rsi], bl
and rcx, 0b1111111111000 # instrumentation
sub al, byte ptr [r14 + rcx]
and rcx, 0b1111111111000 # instrumentation
mul qword ptr [r14 + rcx]
and rax, 0b1111111000000 # instrumentation
lock sub word ptr [r14 + rax], -128
.macro.measurement_end: nop qword ptr [rax + 0xff]
.section .data.main
.test_case_exit:nop
```

RDI is used in two places:

1. Line 15: `or byte ptr [r14 + rdi], 1` (a write)
2. Line 17: `div byte ptr [r14 + rdi]` (a read)

This is a clear data-dependent pattern, which explains why RDI is being leaked. But normally, these patterns should not be reported as violations of CT-DEH (our selected contract), since the contract permits cache-based leakage. So if the violation was reported, it means these instructions were not executed in the model. Let's investigate why.

We will inspect how the model executes this program. To this end, we will add a debug flag to the config file:

```yaml
logging_modes:
    - dbg_model
```

Then, we will reproduce the violation again, now with a verbose log of test case execution on the model:

```
./revizor.py reproduce -s base.json -c ./violation/reproduce.yaml -t ./violation/min.asm -i ./violation/min-inputs/min_input_0000.bin

                     ##### Input 0 #####
0x0 : macro .measurement_start, .noarg
  rax=0x0000000000000000 rbx=0x0000000000000000 rcx=0x0000d04a0000d04a rdx=0x0000000000000000
  rsi=0x0000d0510000d051 rdi=0x000056b8000056b8 flags=0b000000000010
  xmm0=0x00000000000000000000000000000000 xmm1=0x00000000000000000000000000000000
  xmm2=0x00000000000000000000000000000000 xmm3=0x00000000000000000000000000000000
  xmm4=0x00000000000000000000000000000000 xmm5=0x00000000000000000000000000000000
  xmm6=0x00000000000000000000000000000000 xmm7=0x00000000000000000000000000000000

0x8 : and rsi, 0b1111111111000
  rax=0x0000000000000000 rbx=0x0000000000000000 rcx=0x0000d04a0000d04a rdx=0x0000000000000000
  rsi=0x0000d0510000d051 rdi=0x000056b8000056b8 flags=0b000000000010
  xmm0=0x00000000000000000000000000000000 xmm1=0x00000000000000000000000000000000
  xmm2=0x00000000000000000000000000000000 xmm3=0x00000000000000000000000000000000
  xmm4=0x00000000000000000000000000000000 xmm5=0x00000000000000000000000000000000
  xmm6=0x00000000000000000000000000000000 xmm7=0x00000000000000000000000000000000

0xf : add rdi, [r14 +rsi]
  rax=0x0000000000000000 rbx=0x0000000000000000 rcx=0x0000d04a0000d04a rdx=0x0000000000000000
  rsi=0x0000000000001050 rdi=0x000056b8000056b8 flags=0b000000000110
  xmm0=0x00000000000000000000000000000000 xmm1=0x00000000000000000000000000000000
  xmm2=0x00000000000000000000000000000000 xmm3=0x00000000000000000000000000000000
  xmm4=0x00000000000000000000000000000000 xmm5=0x00000000000000000000000000000000
  xmm6=0x00000000000000000000000000000000 xmm7=0x00000000000000000000000000000000

    > load from +0x2050 value 0x0
EXCEPTION #13: Read from non-readable memory (UC_ERR_READ_PROT)
0x13: [transient, nesting = 1] add cl, dl
  rax=0x0000000000000000 rbx=0x0000000000000000 rcx=0x0000d04a0000d04a rdx=0x0000000000000000
  rsi=0x0000000000001050 rdi=0x000056b8000056b8 flags=0b000000000110
  xmm0=0x00000000000000000000000000000000 xmm1=0x00000000000000000000000000000000
  xmm2=0x00000000000000000000000000000000 xmm3=0x00000000000000000000000000000000
  xmm4=0x00000000000000000000000000000000 xmm5=0x00000000000000000000000000000000
  xmm6=0x00000000000000000000000000000000 xmm7=0x00000000000000000000000000000000

0x15: [transient, nesting = 1] and rcx, 0b1111111111000
  rax=0x0000000000000000 rbx=0x0000000000000000 rcx=0x0000d04a0000d04a rdx=0x0000000000000000
  rsi=0x0000000000001050 rdi=0x000056b8000056b8 flags=0b000000000010
  xmm0=0x00000000000000000000000000000000 xmm1=0x00000000000000000000000000000000
  xmm2=0x00000000000000000000000000000000 xmm3=0x00000000000000000000000000000000
  xmm4=0x00000000000000000000000000000000 xmm5=0x00000000000000000000000000000000
  xmm6=0x00000000000000000000000000000000 xmm7=0x00000000000000000000000000000000

0x1c: [transient, nesting = 1] add [r14 +rcx], rbx
  rax=0x0000000000000000 rbx=0x0000000000000000 rcx=0x0000000000001048 rdx=0x0000000000000000
  rsi=0x0000000000001050 rdi=0x000056b8000056b8 flags=0b000000000110
  xmm0=0x00000000000000000000000000000000 xmm1=0x00000000000000000000000000000000
  xmm2=0x00000000000000000000000000000000 xmm3=0x00000000000000000000000000000000
  xmm4=0x00000000000000000000000000000000 xmm5=0x00000000000000000000000000000000
  xmm6=0x00000000000000000000000000000000 xmm7=0x00000000000000000000000000000000

    > load from +0x2048 value 0x0
EXCEPTION #13: Read from non-readable memory (UC_ERR_READ_PROT)
ROLLBACK to 0x7f
```

This log shows in detail which instructions from the test case were executed by the model, whether they were transient or non-transient, and the register/memory state before each instruction.

We can see that, early in the execution of the test case, a page fault occurs when trying to read from memory at address `0x2050`. This is because of the configuration we're using, where the second page of the sandbox memory (the faulty page) is set as non-readable.

Accordingly, since we're using the `delayed-exception-handling` execution clause, the model will not execute any instructions that are data-dependent on this faulting load. This includes the two instructions that use RDI (lines 15 and 17), since RDI was computed based on the value loaded from address `0x2050`.

From this, we can conclude that the CPU implements some sort of speculation on page faults: The RDI-dependent instructions were not supposed to be executed, but we see leakage of RDI in cache traces nonetheless.

To understand what specific value is returned speculatively, we can manually modify the test case, and replace the instructions after the faulting load with a gadget that will specifically leak RDI:

``` asm linenums="1"
.intel_syntax noprefix
.section .data.main

.macro.measurement_start: nop qword ptr [rax + 0xff]
and rsi, 0b1111111111000 # instrumentation
mov rdi, qword ptr [r14 + rsi]

and rdi, 0b111111111111  # mask the value of RDI
mov rdi, qword ptr [r14 + rdi]
.macro.measurement_end: nop qword ptr [rax + 0xff]

.test_case_exit:
```

We will also enable another debug mode to see the hardware traces even when no violation is detected:

```yaml
logging_modes:
    # - dbg_model
    - dbg_dump_htraces
```

Then, we can run the modified test case:

```
$ ./revizor.py reproduce -s base.json -c ./violation/reproduce.yaml \
    -t ./violation/min.asm -i ./violation/min-inputs/min_input_0000.bin

================================ Collected Traces =============================
- Input 0:
  HTr:
    ^^.^.......^............^.........................^............^ [10]

  Feedback: (816, 685, 64, 0, 0)
```

We see that multiple cache lines were accessed, so it is hard to pinpoint the exact one that belongs to the speculative leak. (We likely have all these evictions due to the page walk triggered by the page fault.)

We can identify the specific cache line by further modifying the test case to add a hard-coded offset to the speculative memory access, e.g., changing the last load to:

``` asm
mov rdi, qword ptr [r14 + rdi + 0x100]
```

Then, we can run it again and see how the hardware trace changes:

```
./revizor.py reproduce -s base.json -c ./violation/reproduce.yaml -t ./violation/min.asm -i ./violation/min-inputs/min_input_0000.bin

================================ Collected Traces =============================
- Input 0:
  HTr:
    ^^.^^......^............^.........................^............^ [10]

  Feedback: (816, 685, 71, 0, 0)
```

Let's compare it side-by-side with the previous trace:

```
Before: ^^.^.......^............^.........................^............^
After:  ^^.^^......^............^.........................^............^
            |
            + Added cache set access due to +0x100 offset
              (cache set ID 4)
```

This shows that the speculative access used cache set ID 4. From this, we can do a simple calculation to deduce the value of RDI that was used for the memory access:

```
Cache ID = 4
Cache Line Size = 0x40
Hardcoded Offset = 0x100
Speculative Address = (Cache ID * Cache Line Size) = rdi + Hardcoded Offset // ignore r14
=>
rdi_masked = (Cache ID * Cache Line Size) - Hardcoded Offset = (4 * 0x40) - 0x100 = 0x0
```

Now we know that the masked value of RDI used in the speculative access was `0x0`. The remaining part is to figure out what was the original value of RDI before masking. For that, we can shift the pre-mask value of RDI by 12 bits (since the mask is `0b111111111111` = 0xfff = 12 bits) and repeat the procedure. We'll do this 6 times to reveal the whole value.

The resulting traces are as follows:

```
no shift: ^^.^.......^............^.........................^............^
12 bits:  ^^.^.......^............^.........................^............^
24 bits:  ^^.^.......^............^.........................^............^
36 bits:  ^^.^.......^............^.........................^............^
48 bits:  ^^.^.......^............^.........................^............^
60 bits:  ^^.^.......^............^.........................^............^
```

We can see that in all cases, the cache set accessed is 0, which means that the masked value of RDI was always 0, regardless of how much we shifted it.

This tells us that the faulting load returned 0 speculatively, which reveals to us the root cause of the violation. This is an instance of a previously-discovered vulnerability called LVI-Null, which we have successfully and independently rediscovered using Revizor!

!!! success "What We've Learned"
    In this section, we applied the same systematic workflow to a different vulnerability class:

    - **Flexible configuration**: By changing just a few configuration options (removing branches, adding page faults, adjusting the contract), we refocused our search entirely
    - **Contract selection matters**: The `delayed-exception-handling` contract helped filter out trivial violations while exposing genuine leaks
    - **Deep analysis techniques**: We manually modified test cases and used offset manipulation to precisely identify what value the CPU returned speculatively

    The same workflow—plan, configure, fuzz, validate, minimize, analyze—works across all speculative execution vulnerability classes.

### What's Next?

Proceed to [Tutorial 4](./04-isolation.md) to see how we can go even further and start testing high-level isolation properties.


================================================
FILE: docs/intro/tutorials/04-isolation.md
================================================
# Tutorial 4: Testing Security Domain Isolation with Revizor

In the previous tutorials, we used random test generation to find Spectre V1 and LVI-Null by testing against contracts. While contract violations are interesting, the most critical security issues often arise from failures in isolation between different security domains—such as user vs kernel mode, or different virtual machines.

In this tutorial, we'll explore how to use Revizor's template-based fuzzing and multi-actor testing features to evaluate isolation guarantees. Specifically, we'll test whether privileged kernel code can leak information to unprivileged user code through speculative execution.

### Preliminaries

Through this tutorial, you should become familiar with three concepts: actors, templates, and actor non-interference. These concepts are covered in detail in the [Topic Guide: Actors](../../topics/actors.md) and [Howto: Use Templates](../../howto/use-templates.md), but we'll provide a brief overview here.

**Actors** are an abstraction that separates a test case into multiple components, each with its own code, execution context, privilege level, and memory space. This allows us to model scenarios where different parts of the test case run under different security domains. For example, we can define a `kernel` actor that runs in kernel mode and a `user` actor that runs in user mode. While they will have separate memory spaces and are isolated through privilege separation by the CPU, information could still leak from the kernel actor to the user actor through side channels; Revizor helps us detect such leaks.

**Templates** are assembly files that define the high-level structure of test cases. They allow us to specify hard-coded parts of the test case and its actors, while still leaving room for random instruction generation.

Templates are essential for testing isolation because they define how different actors interact. For example, a template can specify that the user actor calls into the kernel actor, which processes secret data, and then returns control to the user actor for observation. This structure is unlikely to be generated through pure randomness, so templates enable targeted testing of specific attack patterns.

**Actor Non-Interference Contract** is a specialized contract that checks whether one actor's execution can influence another actor's observations. In our case, we want to ensure that the kernel actor's processing of secret data does not affect what the user actor can observe through side channels. If the user actor's hardware trace differs based on the kernel actor's secret data, that's a non-interference violation, indicating a potential isolation failure.

### Plan the campaign

Let's imagine we want to test whether a CPU properly enforces isolation between kernel and user mode. Specifically, we want to check if privileged kernel code can leak information to unprivileged user code through speculative execution side channels—attacks like Meltdown exploit exactly this type of isolation failure.

For this campaign, we'll use a two-actor setup: a kernel actor (the victim) that processes secret data, and a user actor (the attacker) that attempts to observe those secrets through side channels. Rather than relying on pure random generation, we'll use a template that explicitly encodes the interaction pattern: the kernel processes data, then transfers control to user mode, where observation code runs. This template-based approach ensures we're testing the specific isolation boundary we care about.

We'll pair this multi-actor test structure with the Actor Non-Interference contract. This contract checks whether the user actor's hardware traces (cache state, timing, etc.) differ based on the kernel actor's input data. If they do, it means information crossed the privilege boundary—a clear isolation failure. Unlike model-based contracts that compare hardware against an idealized model, non-interference testing directly verifies that one actor cannot observe another actor's secrets, which is precisely the security property we want to enforce.

With this campaign plan, we are trying to answer a specific question: "Can unprivileged code observe secrets from privileged code through speculative side channels?"


### Create the configuration file

```yaml
# contract for isolation testing
contract_observation_clause: ct-ni

# instruction categories
instruction_categories:
  - BASE-BINARY

# actor configuration
actors:
  - main:
      - privilege_level: "kernel"
      - observer: false
  - user:
      - privilege_level: "user"
      - observer: true

# filters
enable_speculation_filter: true
enable_observation_filter: true
enable_fast_path_model: true
```

This configuration introduces several important concepts. The `contract_observation_clause` is set to `ct-ni`, which tells Revizor to use the Actor Non-Interference check instead of the standard model-based testing.

The `actors` section defines two execution contexts. The `main` actor runs in kernel mode (`privilege_level: "kernel"`) and has `observer: false`, meaning it's the victim whose secrets might leak. The `user` actor runs in user mode (`privilege_level: "user"`) and has `observer: true`, meaning it's the attacker trying to observe kernel secrets through side channels.

For more details on actor configuration, see [Topic Guide: Actors](../../topics/actors.md).

### Create the template

Now we need a template that exercises the kernel-user boundary. Create `template.asm`:

``` asm
.intel_syntax noprefix

# ----------------------------- Kernel-mode Actor (Victim) -------------------
.section .data.main
.function_main_1:
    # random code of the victim
    .macro.random_instructions.16.8.main_1:

    # switch to user actor to observe
    .macro.set_k2u_target.user.function_user_1:
    .macro.set_u2k_target.main.function_main_2:
    .macro.switch_k2u.user.1:

.macro.fault_handler:
    # one more call to the user to complete the measurement in case of a fault
    .macro.set_k2u_target.user.function_user_2:
    .macro.set_u2k_target.main.function_main_3:
    .macro.switch_k2u.user.2:

# return point for the user actor
.function_main_2:
    .macro.landing_u2k.main_2:

# exit
.function_main_3:
    .macro.landing_u2k.main_3:
    nop

# ----------------------------- User-mode Actor ------------------------------
.section .data.user
.function_user_1:
    # reset registers to ensure we're not observing leftover state
    .macro.landing_k2u.user_1:
    xor rax, rax  # noremove
    mov rax, qword ptr [r14 + 0x2000] # noremove
    mov rbx, qword ptr [r14 + 0x2008] # noremove
    mov rcx, qword ptr [r14 + 0x2010] # noremove
    mov rdx, qword ptr [r14 + 0x2018] # noremove
    mov rsi, qword ptr [r14 + 0x2020] # noremove
    mov rdi, qword ptr [r14 + 0x2028] # noremove
    lfence

    # attacker code to observe side effects
    .macro.measurement_start:
    .macro.random_instructions.16.8.user_1:
    .macro.measurement_end.1:

    # switch back to kernel actor
    .macro.switch_u2k.main.1:

# second measurement call; for the cases when the first one was bypassed by a fault
.function_user_2:
    .macro.landing_k2u.user_2:
    .macro.measurement_end.2:
    .macro.switch_u2k.main.2:
    lfence

# ----------------------------- Exit -----------------------------------------
.section .data.main
.test_case_exit:
```

Let's break down this template block by block to understand how it orchestrates the kernel-user isolation test:

**Kernel Actor - Initial Execution (`function_main_1`)**

```asm
.section .data.main
.function_main_1:
    .macro.random_instructions.16.8.main_1:
```

The template begins in the kernel actor's code space (`.section .data.main`). The `.macro.random_instructions.16.8.main_1` macro generates 16 random instructions with an average of 8 memory accesses. This randomized kernel code represents the victim's execution.

**Transition Setup - Kernel to User**

```asm
    .macro.set_k2u_target.user.function_user_1:
    .macro.set_u2k_target.main.function_main_2:
    .macro.switch_k2u.user.1:
```

These macros configure and execute a privilege level transition. The `set_k2u_target` macro specifies that when dropping to user mode, execution should begin at `function_user_1` in the `user` actor. The `set_u2k_target` macro specifies that when returning to kernel mode, execution should resume at `function_main_2` in the `main` actor. Finally, `switch_k2u` performs the actual privilege drop, transferring control to user mode. The `.1` suffix is a unique label for this transition.

**Kernel Actor - Return Point (`function_main_2`)**

```asm
.function_main_2:
    .macro.landing_u2k.main_2:
    .macro.fault_handler:
```

This is where the kernel resumes after the user actor returns control. The `landing_u2k` macro handles the privilege escalation transition, restoring the kernel execution context. The `fault_handler` macro designates this location as the exception handler—if any faults occur during execution (in either actor), control transfers here.

**Second Transition - Kernel to User Again**

```asm
    .macro.set_k2u_target.user.function_user_2:
    .macro.set_u2k_target.main.function_main_3:
    .macro.switch_k2u.user.2:
```

The kernel performs another transition to user mode, this time to `function_user_2`. This is necessary because, if the random code in the user actor triggers a fault, the `measurement_end` may never be reached, and the hardware trace would be corrupted. By splitting the measurement into two parts, we ensure that even if a fault occurs during the first measurement, we can still capture whatever trace was collected up to that point.

**Kernel Actor - Exit (`function_main_3`)**

```asm
.function_main_3:
    .macro.landing_u2k.main_3:
    nop
```

The final kernel return point. After the second user-mode measurement completes, execution returns here and falls through to the test case exit.

**User Actor - First Observation (`function_user_1`)**

```asm
.section .data.user
.function_user_1:
    .macro.landing_k2u.user_1:
    xor rax, rax  # noremove
    mov rax, qword ptr [r14 + 0x2000] # noremove
    mov rbx, qword ptr [r14 + 0x2008] # noremove
    ...
    lfence
```

This is where the attacker code executes. The `landing_k2u` macro handles the privilege drop transition, setting up the user execution context. The explicit register initialization loads fresh values from memory (via `r14`, which points to the sandbox memory). The `# noremove` comments prevent Revizor's minimization passes from removing these instructions—they're essential for resetting architectural state. The `lfence` ensures these loads complete before observation begins, preventing them from affecting the measurement.

**User Actor - Measurement**

```asm
    .macro.measurement_start:
    .macro.random_instructions.16.8.user_1:
    .macro.measurement_end.1:
```

The `measurement_start` macro marks where hardware trace collection begins. Only code between `measurement_start` and `measurement_end` contributes to the observed side-channel trace. The random instructions here represent attacker code that might be sensitive to cache state, timing variations, or other microarchitectural side effects left by the kernel's execution. The `.1` suffix distinguishes this measurement from the second one.

**User Actor - Return to Kernel**

```asm
    .macro.switch_u2k.main.1:
```

The `switch_u2k` macro performs a privilege escalation, returning control to the kernel actor. This transition was pre-configured earlier by the `set_u2k_target` macro.

**User Actor - Second Observation (`function_user_2`)**

```asm
.function_user_2:
    .macro.landing_k2u.user_2:
    .macro.measurement_end.2:
    .macro.switch_u2k.main.2:
    lfence
```

The second user-mode entry point completes the measurement that was started in `function_user_1`.

### Run the isolation test

Execute the multi-actor fuzzing campaign:

```bash
./revizor.py tfuzz -s base.json -c config.yaml -t template.asm -n 1000 -i 10 -w .
```

We're running 1000 test cases with 10 inputs each. Multi-actor testing often requires more iterations to find violations because we're looking for interactions between actors, which adds complexity.

The fuzzer will run and search for isolation violations. On most systems, you will not find a violation; isolation mechanisms are generally robust. We will need to try harder to find issues.

```
Duration: 60.5
Finished at 08:44:40
```

### Adding Faults

Now let's add a little more complexity to the experiment. We will make the attacker "active" by allowing the user actor to try and access the memory of the kernel actor. This simulates an attacker that attempts to read privileged memory, which should be blocked by the CPU's privilege separation.

To do this, we will use a generator pass that is specifically designed for this purpose. The `user-to-kernel-access` pass randomly selects a memory access from the user actor's code and modifies it to access the kernel actor's memory space. This creates a faulting access that the CPU should prevent.

Update the configuration file to include this generator pass:

```yaml
faults_allowlist:
  - user-to-kernel-access

# actor configuration
actors:
  - main:
      - privilege_level: "kernel"
      - observer: false
      - fault_blocklist:
        - user-to-kernel-access
  - user:
      - privilege_level: "user"
      - observer: true
```

Note that we also added a `fault_blocklist` to the kernel actor. This is done to prevent redundant work on the generator side; there is no point in making the kernel actor access its own memory.

### Run the fuzzer with faults enabled

Run the fuzzer again with the updated configuration:

```bash
./revizor.py tfuzz -s base.json -c config.yaml -t template.asm -n 5000 -i 10 -w .
```

This time, with the user actor actively trying to access kernel memory, we have a higher chance of provoking isolation violations.

If you're testing a system vulnerable to Meltdown, you should see a violation reported:

```
================================ Violations detected ==========================
Violation Details:

-----------------------------------------------------------------------------------
                             HTrace                              | ID:3   | ID:13 |
-----------------------------------------------------------------------------------
^^.^.......^.........^..^.........................^............^ | 627    | 0     |
^^.^...^...^............^.........................^............^ | 0      | 627   |
```

Validate and minimize the violation, as we've done in the previous tutorials.

As a result, you should obtain a minimized test case that contains a typical Meltdown pattern: the user actor attempts to read kernel memory, which causes a fault, but speculative execution allows some of the kernel data to leak through side channels, and thus impact the user's hardware traces.

!!! success "What We've Learned"
    In this tutorial, we've progressed from random fuzzing to structured testing:

    - **Templates provide structure**: When testing specific attack scenarios, templates let us encode the essential pattern while still benefiting from randomization
    - **Macros control generation**: The macro system gives fine-grained control over what code gets generated and where
    - **Multi-actor testing**: Revizor can test isolation between different privilege levels or security domains using the actor system
    - **Noninterference contract**: This specialized contract detects when one actor's data influences another actor's observations

### What's Next?

This concludes our tutorials on using Revizor for security testing. Note that all examples in the tutorials were simplified for clarity. If you wish to explore more realistic scenarios, refer to our guide on [Design a Campaign](../../howto/design-campaign.md) or check an advanced tutorial on [Detecting TSA-SQ](./tsa-sq.md).

Proceed to [Tutorial 5](./05-extending.md) to learn how you can extend various components of Revizor to fit your research needs.


================================================
FILE: docs/intro/tutorials/05-extending.md
================================================
# Tutorial 5: Extending Revizor

In this tutorial, we will switch gears: instead of using Revizor's existing components, we will extend Revizor by adding custom functionality to some of its core modules.

## Workflow

The general workflow for extending any part of Revizor is as follows:

- Subclass the existing module or interface you want to extend. For a list of all interfaces, refer to the [Architecture Overview](../../internals/architecture/overview.md) document.
- Implement your custom logic by overriding the necessary methods.
- Register your new class in the factory so that Revizor can access the new implementation. It will also enable the user to select the new implementation via a config file.
- Add new configuration options if your extension requires additional parameters.

## Changing Data Generation Algorithm

As our first example, we will modify the data (input) generation algorithm used by Revizor. By default, Revizor generates random input data for each test case. However, in some scenarios, it may be beneficial to generate inputs that contain extreme values (e.g., minimum or maximum integers) to test edge cases in the microarchitecture. We will implement this feature.

The data generation logic is defined by the `DataGenerator` interface, with its default implementation located in `rvzr/data_generator.py`. We will create a new subclass of `DataGenerator` that generates minimum or maximum integer values with a configurable probability.

Implement the new generation algorithm by overriding the generation logic in the default `DataGenerator` class.

``` python
# rvzr/data_generator.py
class MinMaxIntGenerator(DataGenerator):
    """
    A variant of DataGenerator that generates minimum or maximum integer
    values with a configurable probability.
    """
    int_sizes: Final[List[int]] = [8, 16, 32, 64]

    def __init__(self, seed: int):
        super().__init__(seed)
        self._probability_of_max = CONF.input_gen_probability_of_minmax

    def _generate_one(self, state: int, n_actors: int) -> Tuple[InputData, int]:
        input_ = InputData(n_actors)
        input_.seed = state

        per_actor_data_size = input_.itemsize // 8

        rng = np.random.default_rng(seed=state)
        for i in range(n_actors):
            # generate random data
            data = rng.integers(
                self.max_input_value, size=per_actor_data_size, dtype=np.uint64)  # type: ignore

            # if the probability of max is 0, we're done
            if self._probability_of_max == 0:
                input_.set_actor_data(i, data)
                continue

            # otherwise, with a given probability, set some values to min or max int
            for val_id in range(per_actor_data_size):
                roll = rng.random()
                if roll > self._probability_of_max:
                    continue
                int_size = random.choice(self.int_sizes)
                int_sign = random.choice([True, False])
                value = (2 ** (int_size - 1))
                if not int_sign:
                    value = -value
                data[val_id] = np.uint64(value & 0xFFFFFFFFFFFFFFFF)

            input_.set_actor_data(i, data)

        return input_, state + 1
```

We now need to let Revizor know about the existence of this new class. This is achieved via the factory module `rvzr/factory.py`:

``` python
# rvzr/factory.py
_DATA_GENERATORS: Dict[str, Type[data_generator.DataGenerator]] = {
    'random': data_generator.DataGenerator,
    'minmax': data_generator.MinMaxIntGenerator,  # <<<<<<<<<<<<<<<< ADDED LINE
}
```

Finally, our implementation used a new config option (`input_gen_probability_of_minmax`) to control the probability of generating extreme values. We need to register this new option in the configuration module `rvzr/config.py`:

``` python
# rvzr/config.py
class Config:
    ...
    input_gen_probability_of_minmax: float = 0.5  # <<<<<<<<<<<<<<<< ADDED LINE
```

That's it. That's all it takes to change the data generation algorithm in Revizor.

Now, let's test the implementation:

``` yaml
# config.yaml
data_generator: minmax
input_gen_probability_of_minmax: 0.7
```

Run Revizor with the new configuration:

``` shell
./revizor.py generate -s base.json -c config.yaml -w ./ -n 1 -i 1
```

See that the new generator was applied:

```
$ hexdump -C ./tc0/input0.bin| head -10
00000000  80 ff ff ff ff ff ff ff  00 00 00 00 00 00 00 80  |................|
00000010  00 80 ff ff ff ff ff ff  2a 35 00 00 00 00 00 00  |........*5......|
00000020  80 00 00 00 00 00 00 00  00 80 00 00 00 00 00 00  |................|
00000030  c4 83 00 00 00 00 00 00  37 26 00 00 00 00 00 00  |........7&......|
00000040  36 d5 00 00 00 00 00 00  00 80 ff ff ff ff ff ff  |6...............|
00000050  41 27 00 00 00 00 00 00  00 80 00 00 00 00 00 00  |A'..............|
00000060  32 69 00 00 00 00 00 00  64 b0 00 00 00 00 00 00  |2i......d.......|
00000070  00 80 ff ff ff ff ff ff  7c d7 00 00 00 00 00 00  |........|.......|
00000080  00 00 00 00 00 00 00 80  00 80 00 00 00 00 00 00  |................|
00000090  31 86 00 00 00 00 00 00  f9 f4 00 00 00 00 00 00  |1...............|
```

Success! We can see large and small integer values in the generated input data (`ff ff ff ...`),
meaning that our new data generator is working as expected.

## Adding a Code Generation Pass

We will now explore the other part of the test case generation pipeline - generation of test case programs (code). In this example, we will add a new code generation pass that replaces all registers in the test case with a fixed register (`RAX`).

!!! note
    Frankly, it is not a very useful generation pass, but it serves the purpose of demonstration. The same principles apply to more complex generation passes.

We will follow the same steps as before. The code pass interface is located in `rvzr/code_generator.py` as the `Pass` class. We will create a new subclass of it, and, since we are creating an ISA-specific pass, we will place it into `rvzr/arch/x86/generator.py`.

``` python
# rvzr/arch/x86/generator.py
class _X86RaxPass(Pass):
    """
    Toy pass for the tutorial: rewrites every register operand in the test case to RAX.
    """

    def run_on_test_case(self, test_case: TestCaseProgram) -> None:
        """
        Walk over all instructions of the test case and overwrite their register operands.

        :param test_case: the test case program to be modified in place
        """
        for block in test_case.iter_basic_blocks():
            for node in block.iter_nodes():
                # select only the register operands; other operand kinds stay untouched
                register_operands = (
                    operand for operand in node.instruction.operands
                    if isinstance(operand, RegisterOp)
                )
                for reg_operand in register_operands:
                    reg_operand.value = "rax"

Register the new class with the generator:

``` python
# rvzr/arch/x86/generator.py
class X86Generator(CodeGenerator):
    ...
        self._passes = [
            _X86PatchUndefinedFlagsPass(self._instruction_set, self),
            _X86SandboxPass(self._target_desc, self._faults),
            _X86PatchUndefinedResultPass(),
            _X86RaxPass(),  # <<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<< ADDED LINE
        ]
```

That's it. Now, let's test our new code generation pass by running Revizor again:

```
./revizor.py generate -w . -n 1 -i 1 -s base.json
```

Check the generated program:

```
$ cat tc0/program.asm | head -10

.intel_syntax noprefix
.section .data.main
.function_0:
.bb_0.0:
.macro.measurement_start: nop qword ptr [rax + 0xff]
and rax, 0b1111111111000 # instrumentation
lock add byte ptr [r14 + rdi], rax
cmp rax, 106
or rax, 0b1000000000000000000000000000000 # instrumentation
bsr rax, rax
```

As we can see, all register operands have been replaced with `RAX`, confirming that our new code generation pass is functioning correctly.


================================================
FILE: docs/intro/tutorials/tsa-sq.md
================================================
# Tutorial: Detecting TSA-SQ with Revizor

This tutorial demonstrates how we used Revizor to detect TSA-SQ (Transient Scheduler Attack - Store Queue), a microarchitectural vulnerability discovered in AMD Zen4 processors. We'll walk through the design rationale behind the fuzzing campaign configuration and template, explaining how each component contributes to successful vulnerability detection.

You can reproduce this campaign using the provided configuration and template files, which are available in the Revizor repository under `demo/tsa-sq/`.

!!! info "Prerequisites"
    To follow this tutorial, you should have:

    - Non-virtualized access to an AMD Zen4 processor for testing
    - A working installation of Revizor. See [installation guide](../02-install.md) for setup instructions.
    - Basic understanding of Revizor's fuzzing framework, in particular the concepts of [model-based relational testing](../03-primer.md), [actors](../../topics/actors.md), [templates](../../howto/use-templates.md), [macros](../../ref/macros.md).
    - Familiarity with microarchitectural vulnerabilities and side-channel attacks


## Background: Understanding TSA-SQ

Before diving into the Revizor configuration, let's briefly understand what TSA-SQ is. According to the [AMD security bulletin](https://www.amd.com/content/dam/amd/en/documents/resources/bulletin/technical-guidance-for-mitigating-transient-scheduler-attacks.pdf), TSA-SQ exploits timing variations in the CPU's store queue during "false completion" events. When a load instruction matches the address of an older store whose data isn't yet available, it may complete falsely using stale data from a previous store that occupied the same store queue entry. This creates timing differences that an attacker can observe to infer information about previous stores, even from different privilege levels.

The key insight is that an unprivileged user process can potentially observe timing variations that depend on data from kernel stores, creating a kernel-to-user information leak channel.

## Design Rationale

When this campaign was designed, we were not yet aware of the TSA-SQ vulnerability (in fact, the vulnerability was discovered as a *result* of this campaign). Therefore, the campaign design is not specifically tailored to detect TSA-SQ, but rather to stress-test the general isolation between kernel and user modes in a way that could reveal microarchitectural vulnerabilities.

## Threat Model and Actor Configuration

Our fuzzing campaign targets a common and high-impact threat model: a malicious user process attempting to extract sensitive data from the kernel. This scenario is particularly relevant for privilege escalation attacks where an attacker seeks to leak kernel secrets.

The actor section of `config.yaml` reflects this threat model:

```yaml
actors:
  - main:
    - mode: "host"
    - privilege_level: "kernel"
    ...
  - user:
    - observer: true
    - mode: "host"
    - privilege_level: "user"
```

The `main` actor represents the victim kernel, while the `user` actor represents the attacker. The `observer: true` flag designates the user actor as the attacker attempting to extract information. This configuration, in combination with the noninterference contract, tells Revizor that any information leakage from `main` to `user` should be flagged as a violation.

## Template Design: Simulating Attack Patterns

The template structure follows the typical flow of a microarchitectural side-channel attack, specifically implementing a Flush+Reload pattern across privilege transitions.

![tsa-sq-template.png](../../assets/tsa-sq-template.png)

You can find the complete template in [`template.asm`](https://github.com/microsoft/side-channel-fuzzer/blob/main/demo/tsa-sq/template.asm).

Let's examine each phase:

**Phase 1: Setup and Flush (function_main_0 and function_user_0)**

The first stage represents the attacker preparing the microarchitectural state for measurements. The first action in the template is in `function_user_0`, where the `user` actor initializes the microarchitectural state by flushing the cache lines that will be used for measurements. This is done using the `measurement_start` macro, which is translated into the Flush stage of a Flush+Reload attack. Revizor does this translation automatically based on the `executor_mode: F+R` setting in the configuration file.

Note that the template does not actually start from the `function_user_0` actor function. Instead, it starts with the `function_main_0`, which is a function belonging to the `main` actor. This is because Revizor requires that the entry point to the test case must be within the `main` actor's code.

**Phase 2: Secret Injection (function_main_1)**

After the initial setup, the attacker transitions to the victim and lets it do some computations on the victim's secret data. The victim actor executes a sequence of random instructions in the `function_main_1` function, which simulates the kernel performing operations on sensitive data. Here, "random instructions" means a sequence of instructions that is randomly generated in each fuzzing round (i.e., each generated test case will have a different sequence of instructions in `function_main_1`).

This randomness is crucial because it allows us to test a wide range of ways in which secret data can impact microarchitectural state, without knowing a priori what specific instruction sequences might trigger a leak. This was one of the key factors that allowed us to discover TSA vulnerabilities without knowing about them beforehand.

**Phase 3: Secret Extraction (function_user_1)**

Back in user mode, we first clear the architectural state to eliminate any architectural information flow between the actors. Such flows could otherwise lead to false positives in the analysis because Revizor is unable to distinguish between architectural and microarchitectural information flows (to be precise, Revizor would be able to distinguish them with a more subtle contract, but re-initializing the registers is a simpler solution).

```assembly
xor rax, rax  # noremove
mov rax, qword ptr [r14 + 0x2000] # noremove
mov rbx, qword ptr [r14 + 0x2008] # noremove
# ... more register initialization
```

After that, the attacker executes another sequence of random instructions, which simulates the user process attempting to access the sensitive data that was just processed by the kernel. Note that this sequence may include an attempt to access kernel memory from the user mode (see the `user-to-kernel-access` fault allowlist in the configuration). As we found out post-factum, this is not strictly necessary for TSA-SQ, but it helps to create complex microarchitectural conditions that can trigger the leak.

Depending on whether the random instruction sequence triggers a fault, the user actor will either switch to kernel mode explicitly (using the `switch_u2k.main.user_1` macro) or the CPU will transfer control to the fault handler (the `fault_handler` macro in `function_main_2`). In this experiment, we were not particularly interested in fault handling, so both paths lead to the same point in the template.

**Phase 4: State Measurement (function_user_2)**

Finally, the "Reload" stage in `function_user_2` measures which cache lines were accessed by the random code in the previous stage. If the accessed cache lines were somehow influenced by the kernel's secret data, this will lead to a discrepancy in the "Reload" measurements, leading to diverging hardware traces for different inputs, and ultimately to Revizor detecting a violation.

## Configuration Overview

Beyond the actor configuration, `config.yaml` contains several other important settings that guide the fuzzing campaign, as described next:

* **Contract**: The contract configuration specifies what information leakage we consider acceptable

```yaml
contract_observation_clause: ct
contract_execution_clause:
  - noninterference
```

The `noninterference` execution clause implements the security property that observer actors cannot learn information about non-observer actors through microarchitectural channels. Combined with the `ct` (constant-time) observation clause, this allows the observer to see memory access patterns and control flow but prohibits leakage of raw data values.

* **Exceptions**: The configuration includes `user-to-kernel-access` in the fault allowlist, which enables testing for Meltdown-type vulnerabilities. This was part of our original experimental design when we didn't yet know about TSA's existence. Revizor's program generator will randomly select memory accesses in the user actor and modify them to target kernel memory, triggering page faults.

Interestingly, this exception-based approach helped discover TSA-SQ because the false completion events in the store queue can lead to timing differences in subsequent instructions, and the faults provide a constant-time reference point for the timing differences to get transformed into persistent cache state. Namely, when a variable-latency instruction is executed concurrently with a faulting instruction, it creates a race condition, where the cache impact of the variable-latency instruction can be influenced by whether the faulting instruction completes before or after it.

Note the fault configuration quirk: we enable `user-to-kernel-access` globally but block it specifically for the main actor using `fault_blocklist`. This is the only way to enable a fault for a specific actor, because Revizor does not allow faults to be allow-listed for a specific actor.

* **Statistical Analysis**: The statistical analysis parameters balance sensitivity with noise tolerance:

```yaml
analyser_stat_threshold: 0.05
executor_sample_sizes: [15, 40, 160, 320]
```

The low threshold of 0.05 makes the analysis sensitive to subtle timing differences, while the adaptive sample sizes allow Revizor to start with quick tests and increase precision when potential violations are detected.

* **Instruction Set**: The instruction set is defined as `x86-64` because we are targeting AMD CPUs, and the instruction categories include all base instructions, which allows for a wide range of microarchitectural interactions in the randomly generated code. Ideally, we would include even more categories, such as SIMD extensions and other advanced instructions, but Revizor does not yet support them (coming up soon, though!).

## Running the Campaign

With the configuration and template in place, we can run the detection campaign using Revizor's `tfuzz` command. This command generates test cases based on the provided template and configuration, executes them, and analyzes the results for violations.

```shell
./revizor.py tfuzz -s base.json --save-violations t -w ./results/ \
    -c config.yaml -t template.asm -n 100000 -i 25
```

This runs 100,000 test cases with 25 inputs each. The `--save-violations` flag preserves any detected violations for later analysis. When TSA-SQ is present, you'll eventually see output similar to:

```
================================ Violations detected ==========================
Contract trace:
 14140085380608124960 (hash)
Hardware traces:
  Input group 1: [11]
  Input group 2: [36]
  ^^^.........^.................................^^................ [287    | 36    ]
  ^^^.........^.................................^................. [31     | 284   ]
```

The different hardware trace patterns for inputs 11 and 36, despite having the same contract trace hash, indicate that the CPU is leaking information not predicted by the noninterference contract.

On our machine, the campaign typically takes about 5 hours to detect a leak, but your mileage may vary depending on the CPU model and due to the inherent randomness of the process.

## Verifying Genuine Violations

To confirm that a detected violation is genuine, reproduce it using:

```bash
./revizor.py reproduce -s base.json -c ./results/violation-*/reproduce.yaml \
    -t ./results/violation-*/program.asm -i ./results/violation-*/input_*.bin
```

A genuine violation will reproduce consistently across multiple runs with the same statistical pattern, confirming that the timing differences represent a real microarchitectural information leak.

The next step is to do root-cause analysis of the violation, which is beyond the scope of this tutorial. See [Root-Causing a Violation Detected by Revizor](../../howto/root-cause-a-violation.md) for details on this process.


================================================
FILE: docs/ref/artifact-file-formats.md
================================================
# Artifact File Formats

This document describes the structure of the violation artifact files stored by Revizor when it detects a contract violation.

## Program Artifact Format

The program artifact is stored as an assembly file named `program.asm` in the violation directory (e.g., `violation-<timestamp>/program.asm`).

The file uses Intel syntax and is structured around actors, with each actor's code placed in a separate section.

The program artifact is structured as follows:

```asm
.intel_syntax noprefix         # Required: Use Intel syntax
.test_case_enter:              # Required: marks the beginning of the test case

.section .data.main            # Start of "main" actor section
...                            # Instructions for main actor,
                               # including possible control transfers to other actors

.test_case_exit:               # Required: marks the end of the test case;
                               # Must be within the "main" actor section

.section .data.actor2          # Start of "actor2" actor section
...                            # Instructions for actor2
```


## Input Data Artifact Format

The inputs to the program are stored as binary files in the violation directory, named according to their order in the input sequence (e.g., `violation-<timestamp>/input_004.bin`).

The format mimics the layout of the [sandbox memory](sandbox.md), with the only exception that some of the sections are removed as they are irrelevant for input data (e.g., the MACRO STACK and the padding areas).

The layout of the input data files is as follows:

| Offset | Actor ID | Section Name | Size, B |
| ------ | -------- | ------------ | ------- |
| 0x0    | ACTOR 0  | MAIN AREA    | 0x1000  |
| 0x1000 |          | FAULTY AREA  | 0x1000  |
| 0x2000 |          | GPR AREA     | 0x40    |
| 0x2040 |          | SIMD AREA    | 0x100   |
| 0x2140 |          | (unused)     | 0xec0   |
| 0x0    | ACTOR 1  | MAIN AREA    | 0x1000  |
| 0x1000 |          | FAULTY AREA  | 0x1000  |
| 0x2000 |          | GPR AREA     | 0x40    |
| 0x2040 |          | SIMD AREA    | 0x100   |
| 0x2140 |          | (unused)     | 0xec0   |
| ...    | ...      | ...          | ...     |


================================================
FILE: docs/ref/binary-formats.md
================================================
# Binary Formats in Revizor

!!! info "Advanced Topic"
    This is an advanced topic describing internal implementation details of Revizor. You are unlikely to need this information unless you are extending or modifying Revizor's core components.

This document describes the structure of the custom binary formats used by Revizor to transfer test cases and their data between different components, specifically for transferring generated test cases and their inputs to the executor kernel module and to the DynamoRIO-based model backend.

Such custom formats are necessary because the components are implemented in different programming languages and different technologies, so passing objects directly is not possible. Using one of the standard formats (e.g., ELF) is also not an option because test cases in Revizor have special structure (e.g., multiple actors in different execution modes, some instructions are macros, etc.) and this structure is not supported by the standard formats.

The formats are designed to be as simple as possible to minimize the overhead of serialization and deserialization.

## Revizor Code Binary Format (RCBF)

RCBF is a structured representation of the complete test case binary, together with its metadata.
The structure is as follows:

``` yaml title="RCBF Structure" linenums="1"
HEADER (16 bytes total)
  n_actors:                8 bytes  # Number of Actors in the test case (also equals the number of code sections)
  n_symbols:               8 bytes  # Number of symbols in the test case

ACTOR TABLE (48 x n_actors bytes)
  actor_entry:             # (repeated n_actors times)
    id:                    8 bytes  # Unique identifier for the actor
    mode:                  8 bytes  # Execution mode of the actor
    pl:                    8 bytes  # Protection level
    data_permissions:      8 bytes  # Data access permissions
    data_ept_permissions:  8 bytes  # EPT (Extended Page Table) data permissions
    code_permissions:      8 bytes  # Code execution permissions

SYMBOL TABLE (32 x n_symbols bytes)
  symbol_entry:            # (repeated n_symbols times)
    owner:                 8 bytes  # ID of the actor that owns this symbol
    offset:                8 bytes  # Offset of the symbol within its section
    id:                    8 bytes  # Symbol's unique identifier
    args:                  8 bytes  # Number of arguments the symbol takes (relevant for macros)

METADATA (24 x n_actors bytes)
  metadata_entry:
    owner:                 8 bytes  # ID of the actor that owns this section
    size:                  8 bytes  # Size of the code section in bytes
    reserved:              8 bytes  # Reserved for future use

DATA (8 kB x n_actors bytes)
  code_section:            # (repeated n_actors times)
    code:                  8 kB     # Actual assembled binary code for the section
```

The file begins with a header containing the number of actors (it is also the number of sections) and the number of symbols in the test case.
The term "symbol" in this context refers to any location in the test case that can be referenced.
Two common types of symbols are functions (specifically, function entry points) and macros.

Next, the file contains the actor table, which is an array of actor metadata entries, one for each actor in the test case.
The actor metadata entry contains the actor's ID, execution mode, protection level, data permissions, EPT data permissions, and code permissions.

After the actor table, the file contains the symbol table, which is an array of symbol entries, one for each symbol in the test case.
The symbol entry contains the ID of the section to which the symbol belongs, the offset of the symbol within the section, the symbol's ID, and the number of arguments the symbol takes (if it is a macro).

The file continues with the table of metadata for each section in the test case.
Each metadata entry contains the ID of the actor that owns the section and the size of the section.

Finally, the file contains a sequence of code sections, one for each actor in the test case.
These sections contain the actual assembled binary for each of the sections in the test case.

## Revizor Data Binary Format (RDBF)

RDBF is a structured representation of the data used to initialize sandbox memory and registers before executing the test case.

Note that this format combines multiple inputs into a single file. This is done because typically, a single test case program is executed multiple times with different inputs, and so it is more efficient to send a batch of inputs at once.


``` yaml title="RDBF Structure" linenums="1"
HEADER (16 bytes)
  n_actors:               8 bytes  # Number of Actors in the test case (also equals the number of data sections)
  n_inputs:               8 bytes  # Number of inputs in the batch

METADATA (16 x n_actors bytes)
  metadata_entry:         # (repeated n_actors x n_inputs times)
    section_size:         8 bytes  # Size of the data section
    reserved:             8 bytes  # Reserved for future use

DATA (12 x n_actors x n_inputs KB)
  input:                  # (repeated n_inputs times)
    data_section:         # (repeated n_actors times)
      main_area:          4 KB  # Main data area
      faulty_area:        4 KB  # Faulty page area
      reg_init_region:    4 KB  # Register initialization area
```

The file begins with a section containing the number of actors (equal to the number of sections) and the number of inputs in the batch.

Next, the file contains the table of metadata for each data section, which only contains the size of the section.

Finally, the file contains a sequence of data sections, one for each actor in the test case and each input in the batch. The data sections are arranged to mirror the data layout in the sandbox memory (see the [sandbox memory layout](sandbox.md) document for more information).


================================================
FILE: docs/ref/cli.md
================================================
# Command-Line Interface

This document provides a complete reference for all command-line options accepted by the `rvzr` command (or `./revizor.py` if running directly from the source tree).

!!! note "CLI vs Configuration Files"
    Revizor is controlled via two interfaces: command line arguments and a configuration file.
    Command line arguments specify the mode of operation and set high-level parameters (e.g., file paths, number of fuzzing rounds), while the configuration file specifies details of the fuzzing campaign (e.g., the target contract, generation parameters, etc). This document focuses on the former; for information on configuration files, see the [configuration documentation](config.md).


## General Syntax

The general syntax of the command line is:

```
rvzr MODE [OPTIONS]

# Where MODE can be:
#   fuzz            fuzzing mode
#   tfuzz           template fuzzing mode
#   reproduce       reproduce mode
#   minimize        test case minimization mode
#   analyse         stand-alone trace analysis mode
#   generate        stand-alone generation mode
#   download_spec   call the script that downloads the instruction set specification
```

The available options depend on the selected mode. See [Execution Modes](modes.md) for descriptions of each mode's purpose and behavior.

For example, a typical way to run Revizor is in fuzzing mode with a command like this:

```bash
rvzr fuzz -s base.json -n 100 -i 10  -c config.yaml -w ./violations
```

This command will run the fuzzer for 100 iterations (i.e., 100 test cases), with 10 inputs per test case.
The fuzzer will use the ISA spec stored in the `base.json` file, and will read the configuration from `config.yaml`. If the fuzzer finds a violation, it will be stored in the `./violations` directory.


## Fuzzing Mode

Command-line arguments supported in `fuzz` mode:

```
  -h, --help            show this help message and exit
  -c CONFIG, --config CONFIG
                        Path to the configuration file (YAML) that will be used during fuzzing.
  -I INCLUDE_DIR, --include-dir INCLUDE_DIR
                        Path to the directory containing configuration files that included by the main configuration file (received via --config).
  -s INSTRUCTION_SET, --instruction-set INSTRUCTION_SET
                        Path to the instruction set specification (JSON) file.
  -n NUM_TEST_CASES, --num-test-cases NUM_TEST_CASES
                        Number of test cases.
  -i NUM_INPUTS, --num-inputs NUM_INPUTS
                        Number of inputs per test case.
  -w WORKING_DIRECTORY, --working-directory WORKING_DIRECTORY
  -t TESTCASE, --testcase TESTCASE
                        Use an existing test case [DEPRECATED - see reproduce]
  --timeout TIMEOUT     Run fuzzing with a time limit [seconds]. No timeout when set to zero.
  --nonstop             Don't stop after detecting an unexpected result
  --save-violations SAVE_VIOLATIONS
                        If set, store all detected violations in working directory.
```

## Template Fuzzing Mode

Command-line arguments supported in `tfuzz` mode:

```
  -h, --help            show this help message and exit
  -c CONFIG, --config CONFIG
                        Path to the configuration file (YAML) that will be used during fuzzing.
  -I INCLUDE_DIR, --include-dir INCLUDE_DIR
                        Path to the directory containing configuration files that included by the main configuration file (received
                        via --config).
  -s INSTRUCTION_SET, --instruction-set INSTRUCTION_SET
                        Path to the instruction set specification (JSON) file.
  -n NUM_TEST_CASES, --num-test-cases NUM_TEST_CASES
                        Number of test cases.
  -i NUM_INPUTS, --num-inputs NUM_INPUTS
                        Number of inputs per test case.
  -w WORKING_DIRECTORY, --working-directory WORKING_DIRECTORY
  -t TEMPLATE, --template TEMPLATE
                        The template to use for generating test cases
  --timeout TIMEOUT     Run fuzzing with a time limit [seconds]. No timeout when set to zero.
  --nonstop             Don't stop after detecting an unexpected result
  --save-violations SAVE_VIOLATIONS
                        If set, store all detected violations in working directory.
```

## Reproduce Mode

Command-line arguments supported in `reproduce` mode:

```
  -h, --help            show this help message and exit
  -c CONFIG, --config CONFIG
                        Path to the configuration file (YAML) that will be used during fuzzing.
  -I INCLUDE_DIR, --include-dir INCLUDE_DIR
                        Path to the directory containing configuration files that included by the main configuration file (received
                        via --config).
  -s INSTRUCTION_SET, --instruction-set INSTRUCTION_SET
                        Path to the instruction set specification (JSON) file.
  -t TESTCASE, --testcase TESTCASE
                        Path to the test case
  -i [INPUTS ...], --inputs [INPUTS ...]
                        Path to the directory with inputs
  -n NUM_INPUTS, --num-inputs NUM_INPUTS
                        Number of inputs per test case. [IGNORED if --input-dir is set]
```

## Minimize Mode

Command-line arguments supported in `minimize` mode:

```
  -h, --help            show this help message and exit
  -c CONFIG, --config CONFIG
                        Path to the configuration file (YAML) that will be used during fuzzing.
  -I INCLUDE_DIR, --include-dir INCLUDE_DIR
                        Path to the directory containing configuration files that included by the main configuration file (received
                        via --config).
  -s INSTRUCTION_SET, --instruction-set INSTRUCTION_SET
                        Path to the instruction set specification (JSON) file.
  --testcase TESTCASE, -t TESTCASE
                        Path to the test case program that needs to be minimized.
  -i NUM_INPUTS, --num-inputs NUM_INPUTS
                        Number of inputs to the program that will be used during minimization.
  --testcase-outfile TESTCASE_OUTFILE, -o TESTCASE_OUTFILE
                        Output path for the minimized test case program.
  --input-outdir INPUT_OUTDIR
                        Output directory for storing minimized inputs.
  --num-attempts NUM_ATTEMPTS
                        Number of attempts to minimize the test case.
  --enable-<pass>       Enable a specific pass during minimization.
```

See also the [minimization documentation](minimization-passes.md) for a list of available minimization passes.

## Stand-alone Trace Analysis

Command-line arguments supported in `analyse` mode:

```
  -h, --help            show this help message and exit
  -c CONFIG, --config CONFIG
                        Path to the configuration file (YAML) that will be used during fuzzing.
  -I INCLUDE_DIR, --include-dir INCLUDE_DIR
                        Path to the directory containing configuration files that included by the main configuration file (received
                        via --config).
  -s INSTRUCTION_SET, --instruction-set INSTRUCTION_SET
                        Path to the instruction set specification (JSON) file.
  --ctraces CTRACES
  --htraces HTRACES
```

## Stand-alone Generation

Command-line arguments supported in `generate` mode:

```
  -h, --help            show this help message and exit
  -c CONFIG, --config CONFIG
                        Path to the configuration file (YAML) that will be used during fuzzing.
  -I INCLUDE_DIR, --include-dir INCLUDE_DIR
                        Path to the directory containing configuration files that included by the main configuration file (received
                        via --config).
  -s INSTRUCTION_SET, --instruction-set INSTRUCTION_SET
                        Path to the instruction set specification (JSON) file.
  -r SEED, --seed SEED  Add seed to generate test case.
  -n NUM_TEST_CASES, --num-test-cases NUM_TEST_CASES
                        Number of test cases.
  -i NUM_INPUTS, --num-inputs NUM_INPUTS
                        Number of inputs per test case.
  -w WORKING_DIRECTORY, --working-directory WORKING_DIRECTORY
  --permit-overwrite    Permit overwriting existing files.
```

## Download Instruction Set Specification

The following command-line arguments are supported in `download_spec` mode:

```
  -h, --help            show this help message and exit
  -a ARCHITECTURE, --architecture ARCHITECTURE   The ISA to download the specification for (e.g., x86-64)
  --outfile OUTFILE, -o OUTFILE   The destination file to save the downloaded specification.
  --extensions [EXTENSIONS ...]   List of ISA extensions to include in the specification (e.g., SSE, VTX)
```


================================================
FILE: docs/ref/config.md
================================================
# Configuration Options

Below is a list of the available configuration options for Revizor, which are passed down to Revizor via a config file.

For an example of how to write the config file, see [demo/big-fuzz.yaml](https://github.com/microsoft/side-channel-fuzzer/tree/main/demo/big-fuzz.yaml).


## <a name="fuzzer"></a> Fuzzing Configuration

#### `fuzzer`

:   <span class="inline-box" title="Default Value">:material-water: `basic`</span> Select the variant of a fuzzer to be used.

    === "Syntax"
        ```yaml
        fuzzer: <mode>
        ```
    === "Available Options"
        `basic` | `architectural` | `archdiff`
    === "Options Explained"
        * `basic` - normal model-based fuzzing. A violation in this mode indicates that the CPU
        exposes more information than predicted by the contract. This option should be used in most
        testing campaigns.
        * `architectural` - self-fuzzing for architectural mismatches between the model and the executor.
        This option should be used for testing the fuzzer itself, i.e., a violation in this
        mode indicates a bug in the fuzzer rather than a bug in the CPU. This is useful when running
        the fuzzer with a previously-untested instruction set, or when a new contract is implemented.
        * `archdiff` - fuzzing for architectural invariants. This is a special mode targeted
        for semi-microarchitectural violations, similar to ZenBleed. This mode is experimental and
        should be used with caution.

#### `enable_priming`

:   <span class="inline-box" title="Default Value">:material-water: `True`</span> This option enables or disables priming. It should be set to True in most cases, as priming is crucial for eliminating false positives.

:    **What is priming?**: Priming solves the following problem: Revizor collects hardware traces for inputs in a sequence,
    and the microarchitectural state is not reset between the inputs. This means that the microarchitectural
    state for the input at, for example, position 100 is different from the state for the input at position 200.
    Accordingly, the hardware traces for these inputs may differ because the measurements are taken in different
    microarchitectural contexts.

:    To address this issue, we use priming, which swaps the inputs in the sequence and re-runs the tests.
    For example, if the original sequence is `(i1 . . . i99,i100,i101 . . . i199,i200)`, the priming
    sequence will be `(i1 . . . i99,i200,i101 . . . i199,i100)`. If the violation persists in this
    sequence, it is a true positive. If the violation disappears, it is a false positive, and it
    will be discarded.

    === "Syntax"
        ```yaml
        enable_priming: <True|False>
        ```

#### `enable_speculation_filter`

:   <span class="inline-box" title="Default Value">:material-water: `False`</span> If enabled, Revizor will not consider test cases that do not trigger speculation.

:    This option is useful for improving the throughput of the fuzzer, but it can discard potential violations if the leakage is not caused by speculation.

    === "Syntax"
        ```yaml
        enable_speculation_filter: <True|False>
        ```

#### `enable_observation_filter`

:   <span class="inline-box" title="Default Value">:material-water: `False`</span> If enabled, Revizor will not consider test cases that do not leave speculative traces.
    This is achieved by pre-filtering: For each test case, Revizor adds an `LFENCE` after each instruction in the test case, and compares the resulting hardware traces with the original. If the traces are identical, the test case is discarded without further processing.

:   This option is useful for improving the throughput of the fuzzer, but it can discard potential violations if the leakage is not caused by speculation.

    === "Syntax"
        ```yaml
        enable_observation_filter: <True|False>
        ```

#### `enable_fast_path_model`

:   <span class="inline-box" title="Default Value">:material-water: `True`</span> If enabled, the fuzzer will assume that all boosted inputs produce the same contract trace, and thus it will re-use the contract trace of the original input for all its boosted variants. This is normally a valid assumption to make if the taint tracker in the model does not contain bugs.

:   This option is a pure performance optimization. It only impacts the speed of fuzzing, and not its correctness.

    === "Syntax"
        ```yaml
        enable_fast_path_model: <True|False>
        ```

#### `color`

:   <span class="inline-box" title="Default Value">:material-water: `False`</span> If enabled, the output will be colored.
    This option helps a lot with readability, but may produce corrupted output when redirected to a file.

    === "Syntax"
        ```yaml
        color: <True|False>
        ```

#### `logging_modes`

:   <span class="inline-box" title="Default Value">:material-water: `['info', 'stat']`</span> Control the information logged by Revizor.

    === "Syntax"
        ```yaml
        logging_modes:
          - <mode1>
          - <mode2>
          ...
        ```
    === "Available Options"
        `info` | `stat` | `dbg_timestamp` | `dbg_violation` | `dbg_dump_htraces` | `dbg_dump_ctraces` | `dbg_dump_traces_unlimited` | `dbg_executor_raw` | `dbg_model` | `dbg_coverage` | `dbg_generator` | `dbg_priming` | `dbg_isa_filter`
    === "Options Explained"
        * `info` - general information about the progress of fuzzing;
        * `stat` - statistics at the end of the fuzzing campaign;
        * `dbg_timestamp` - every 1000 test cases print the timestamp during the fuzzing process;
        * `dbg_violation` - upon detecting a violation, print detailed information about it;
        * `dbg_dump_htraces` - print the first 100 hardware traces for every test case;
        * `dbg_dump_ctraces` - print the first 100 contract traces for every test case;
        * `dbg_dump_traces_unlimited` - print ALL traces (use carefully, produces LOTS of text);
        * `dbg_executor_raw` - prints hardware traces for every stage of the fuzzing process;
        this differs from `dbg_dump_htraces` in that it prints the traces collected by
        speculation/observation filters as well as at every iteration of multi-sample collection;
        * `dbg_model` - print detailed info about EVERY instruction executed on the model (use carefully, produces LOTS of text);
        * `dbg_coverage` - stores instruction coverage information;
        * `dbg_generator` - prints a list of instructions used to generate test cases;
        * `dbg_priming` - prints information about the priming process; only useful for debugging the priming mechanism itself.
        * `dbg_isa_filter` - when rvzr loads information about the instruction set (normally, from `base.json`), it filters out some of the instructions, either because of the config options provided by the user, or because some instructions are known to cause issues in the model or executor. This debug option prints the list of instructions that were filtered out, along with the reason for filtering them out.

#### `multiline_output`

:   <span class="inline-box" title="Default Value">:material-water: `False`</span> If enabled, each output message will be printed on a separate line. Otherwise, the fuzzing progress will be continuously overwriting the same line (works only in the terminal).

    === "Syntax"
        ```yaml
        multiline_output: <True|False>
        ```

## <a name="code-generator"></a> Program Generator Configuration

#### `generator`

:   <span class="inline-box" title="Default Value">:material-water: `random`</span> Select the type of program generator to be used.

    === "Syntax"
        ```yaml
        generator: <type>
        ```
    === "Available Options"
        `random`
    === "Options Explained"
        * `random` - generate random assembly programs. This is the only supported option at the moment.

#### `instruction_set`

:   <span class="inline-box" title="Default Value is Chosen Automatically Based on the Target CPU">:octicons-cpu-24:</span> The instruction set under test.

    === "Syntax"
        ```yaml
        instruction_set: <isa>
        ```
    === "Available Options"
        `x86-64` | `arm64`

#### `instruction_categories`

:   <span class="inline-box" title="Default Value is Chosen Automatically Based on the Target CPU">:octicons-cpu-24:</span> Select a list of instruction categories to be used when generating programs. This list effectively filters out instructions from the ISA descriptor file (e.g., `base.json`) passed via the command line (`-s`).

    !!! info "Priority"
        This list has lower priority than both `instruction_blocklist` and `instruction_allowlist`.

        The resulting instruction pool is:
        `all from(instruction_categories) - instruction_blocklist + instruction_allowlist`

    === "Syntax"
        ```yaml
        instruction_categories:
          - <category1>
          - <category2>
          ...
        ```
    === "Available Options"
        Any category in the ISA descriptor file (`base.json`).

#### `instruction_blocklist`

:   <span class="inline-box" title="Default Value is Chosen Automatically Based on the Target CPU">:octicons-cpu-24:</span> A list of instructions that will **not** be used for generating programs. This list filters out instructions from `instruction_categories`, but not from `instruction_allowlist`.

    !!! info "Priority"
        This list has lower priority than `instruction_allowlist`.

        The resulting instruction pool is:
        `all from(instruction_categories) - instruction_blocklist + instruction_allowlist`

    !!! warning "Danger Zone"
        This option has a somewhat sensible default value for each supported architecture, selected to avoid known-bad instructions. Thus, setting this option explicitly is unadvisable. Prefer using `instruction_blocklist_append` to add more instructions to the default blocklist.

    === "Syntax"
        ```yaml
        instruction_blocklist:
          - <instruction1>
          - <instruction2>
          ...
        ```
    === "Available Options"
        Any instruction in the ISA descriptor file (`base.json`).

#### `instruction_blocklist_append`

:   <span class="inline-box" title="Default Value">:material-water: `[]`</span> A list of instructions that will be appended to the default blocklist for the target ISA. This option is identical to `instruction_blocklist`, but the list is added to the default instead of replacing it.

    !!! info "Priority"
        This list has lower priority than `instruction_allowlist`.

        The resulting instruction pool is:
        `all from(instruction_categories) - instruction_blocklist + instruction_allowlist`

    === "Syntax"
        ```yaml
        instruction_blocklist_append:
          - <instruction1>
          - <instruction2>
          ...
        ```
    === "Available Options"
        Any instruction in the ISA descriptor file (`base.json`).

#### `instruction_allowlist`

:   <span class="inline-box" title="Default Value">:material-water: `[]`</span> A list of instructions to use for generating programs.

    !!! info "Priority"
        This list has priority over `instruction_categories` and over `instruction_blocklist`, thus adding instructions on top of the categories.

        The resulting instruction pool is:
        `all from(instruction_categories) - instruction_blocklist + instruction_allowlist`

    === "Syntax"
        ```yaml
        instruction_allowlist:
          - <instruction1>
          - <instruction2>
          ...
        ```
    === "Available Options"
        Any instruction in the ISA descriptor file (`base.json`).

#### `program_generator_seed`

:   <span class="inline-box" title="Default Value">:material-water: `0`</span> Seed of the program generator (aka code generator). If set to zero, a random seed will be used for each run.

    === "Syntax"
        ```yaml
        program_generator_seed: <seed>
        ```

#### `program_size`

:   <span class="inline-box" title="Default Value">:material-water: `24`</span> Number of instructions in the test case programs to be produced by the code generator. Note that the actual size might be larger because of the instrumentation.

    === "Syntax"
        ```yaml
        program_size: <size>
        ```

#### `avg_mem_accesses`

:   <span class="inline-box" title="Default Value">:material-water: `12`</span> Average number of memory accesses in the test case programs to be produced by the code generator. The actual number will be random, but the average over all programs will be close to this value.

    === "Syntax"
        ```yaml
        avg_mem_accesses: <count>
        ```

#### `min_bb_per_function`

:   <span class="inline-box" title="Default Value">:material-water: `1`</span> Minimal number of basic blocks per function in generated programs.

    === "Syntax"
        ```yaml
        min_bb_per_function: <count>
        ```

#### `max_bb_per_function`

:   <span class="inline-box" title="Default Value">:material-water: `2`</span> Maximal number of basic blocks per function in generated programs.

    === "Syntax"
        ```yaml
        max_bb_per_function: <count>
        ```

#### `min_successors_per_bb`

:   <span class="inline-box" title="Default Value">:material-water: `2`</span> Minimal number of successors for each basic block in generated programs.

    !!! note "Hint, not a rule"
        This option is a *hint*; it could be overwritten

        * if the instruction set does not have the necessary instructions to satisfy it
        * if a certain number of successors is required for correctness.
        * if min_successors_per_bb > max_successors_per_bb, the value is overwritten with max_successors_per_bb

    === "Syntax"
        ```yaml
        min_successors_per_bb: <count>
        ```

#### `max_successors_per_bb`

:   <span class="inline-box" title="Default Value">:material-water: `2`</span> Maximal number of successors for each basic block in generated programs.

    !!! note "Hint, not a rule"
        This option is a *hint*; it could be overwritten

        *  if the instruction set does not have the necessary instructions to satisfy it
        *  if a certain number of successors is required for correctness

    === "Syntax"
        ```yaml
        max_successors_per_bb: <count>
        ```

#### `register_allowlist`

:   <span class="inline-box" title="Default Value">:material-water: `[]`</span> A list of registers that **can** be used for generating programs.

    !!! info "Priority"
        This list has higher priority than `register_blocklist`. The resulting list is: `(all registers - register_blocklist) + register_allowlist`.

    === "Syntax"
        ```yaml
        register_allowlist:
          - <register1>
          - <register2>
          ...
        ```
    === "Available Options"
        Any register supported by the target CPU.

#### `register_blocklist`

:   <span class="inline-box" title="Default Value is Chosen Automatically Based on the Target CPU">:octicons-cpu-24:</span> A list of registers that will **not** be used for generating programs.

    !!! info "Priority"
        This list has lower priority than `register_allowlist`. The resulting list is: `(all registers - register_blocklist) + register_allowlist`.

    !!! warning "Danger Zone"
        The default value of this option includes registers that are reserved for internal use by the executor, and thus should be avoided. Modifying this option may lead to a full system crash.

    === "Syntax"
        ```yaml
        register_blocklist:
          - <register1>
          - <register2>
          ...
        ```
    === "Available Options"
        Any register supported by the target CPU.

#### `faults_allowlist`

:   <span class="inline-box" title="Default Value">:material-water: `[]`</span> By default, the generator will produce programs that never trigger exceptions. This option modifies this behavior by permitting the generator to produce 'unsafe' instruction sequences that could potentially trigger an exception. The model and executor will also be configured to handle these exceptions gracefully.

    === "Syntax"
        ```yaml
        faults_allowlist:
          - <fault1>
          - <fault2>
          ...
        ```
    === "Available Options"
        `div-by-zero` | `div-overflow` | `opcode-undefined` | `breakpoint` | `debug-register` | `non-canonical-access` | `user-to-kernel-access`
    === "Options Explained"
        * `div-by-zero` - generate divisions with unmasked divisor, which can cause a division by zero exception.
        * `div-overflow` - generate divisions with unmasked dividend, which can cause an overflow exception.
        * `opcode-undefined` - generate undefined opcodes, which can cause an undefined opcode exception.
        * `breakpoint` - generate breakpoints, which can cause INT3 exceptions.
        * `debug-register` - generate instructions that cause INT1 exceptions.
        * `non-canonical-access` - randomly select a memory access in a generated program and instrument it to access a non-canonical address.
        * `user-to-kernel-access` - randomly select memory access instructions in user-privilege actors and instrument them to access the kernel actor's (actor 0) memory. This creates cross-privilege-level memory access patterns useful for detecting CPU vulnerabilities like Meltdown. Requires at least one actor with `privilege_level: user`. The instrumentation modifies both the memory operands and the sandboxing masks to ensure accesses target the kernel's FAULTY data area.


## <a name="actor"></a> Actor Configuration

All actors are defined in the `actors` list, with the following syntax:

```yaml
actors:
  - <actor1_name>:
      <actor_option>: <value>
      <actor_option>:
        <sub_option1>: <value1>
        <sub_option2>: <value2>
      ...
  - <actor2_name>:
      ...
  ...
```

The following options are available for each actor:

#### `mode`

:   <span class="inline-box" title="Default Value">:material-water: `host`</span> The execution mode of the actor.

    === "Syntax"
        ```yaml
        actors:
          - <actor_name>:
              mode: <mode>
        ```
    === "Available Options"
        `host` | `guest`
    === "Options Explained"
        * `host` - the actor runs in the normal, non-virtualized mode.
        * `guest` - the actor runs in a VM (one VM per actor).

#### `privilege_level`

:   <span class="inline-box" title="Default Value">:material-water: `kernel`</span> The privilege level of the actor.

    === "Syntax"
        ```yaml
        actors:
          - <actor_name>:
              privilege_level: <level>
        ```
    === "Available Options"
        `user` | `kernel`
    === "Options Explained"
        * `user` - the actor runs in user mode (CPL=3).
        * `kernel` - the actor runs in kernel mode (CPL=0).

#### `data_properties`

:   <span class="inline-box" title="Default Value">:material-water: (see below)</span> The properties of the data memory used by the actor. These properties are applied only to the faulty page of the actor's data region (see [sandbox](../ref/sandbox.md) for details).

:   Note that the above properties are set in the host page tables for actors with `mode: host`, and in the guest page tables for actors with `mode: guest`.

    === "Syntax"
        ```yaml
        actors:
          - <actor_name>:
              data_properties:
                present: <True|False>
                writable: <True|False>
                user: <True|False>
                accessed: <True|False>
                dirty: <True|False>
                executable: <True|False>
                reserved_bit: <True|False>
                randomized: <True|False>
        ```
    === "Available Options"
        `present` | `writable` | `user` | `accessed` | `dirty` | `executable` | `reserved_bit` | `randomized`
    === "Options Explained"
        * `present` [default: True] - the value of the Present bit in the page table entry.
        * `writable` [default: True] - the value of the Writable bit in the page table entry.
        * `user` [default: False] - the value of the User/Supervisor bit in the page table entry.
        * `accessed` [default: True] - the value of the Accessed bit in the page table entry.
        * `dirty` [default: True] - the value of the Dirty bit in the page table entry.
        * `executable` [default: False] - the value of the Executable bit in the page table entry.
        * `reserved_bit` [default: False] - the value of the Reserved bit in the page table entry.
        * `randomized` [default: False] - if true, the values of the above properties will be randomized for each test case.

#### `data_ept_properties`

:   <span class="inline-box" title="Default Value">:material-water: `(see below)`</span> The properties of the EPT entry used by the actor (on Intel) or the NPT entry (on AMD). These properties are applied only to the faulty page of the actor's data region (see [sandbox](../ref/sandbox.md) for details).

:   This property has no effect on actors with `mode: host`.

    === "Syntax"
        ```yaml
        actors:
          - <actor_name>:
              data_ept_properties:
                present: <True|False>
                writable: <True|False>
                executable: <True|False>
                accessed: <True|False>
                dirty: <True|False>
                user: <True|False>
                reserved_bit: <True|False>
                randomized: <True|False>
        ```
    === "Available Options"
        `present` | `writable` | `executable` | `accessed` | `dirty` | `user` | `reserved_bit` | `randomized`
    === "Options Explained"
        * `present` [default: True] - the value of the Present bit in the EPT/NPT entry.
        * `writable` [default: True] - the value of the Writable bit in the EPT/NPT entry.
        * `executable` [default: False] - the value of the Executable bit in the EPT/NPT entry.
        * `accessed` [default: True] - the value of the Accessed bit in the EPT/NPT entry.
        * `dirty` [default: True] - the value of the Dirty bit in the EPT/NPT entry.
        * `user` [default: False] - the value of the User/Supervisor bit in the EPT/NPT entry.
        * `reserved_bit` [default: False] - the value of the Reserved bit in the EPT/NPT entry.
        * `randomized` [default: False] - if true, the values of the above properties will be randomized for each test case.

#### `observer`

:   <span class="inline-box" title="Default Value">:material-water: `False`</span> If enabled, the actor will be an observer actor, hence modelling an attacker. This option is only used if the contract is `noninterference`, and it is ignored otherwise.

    === "Syntax"
        ```yaml
        actors:
          - <actor_name>:
              observer: <True|False>
        ```

#### `instruction_blocklist`

:   <span class="inline-box" title="Default Value">:material-water: `[]`</span> Actor-specific instruction blocklist.

:   This option is useful when writing a test case template that uses multiple actors, and some actors should use a different set of instructions than the others. For example, if privileged instructions should be blocked for low-privilege actors.

    !!! info "Priority"
        This list has priority over the global `instruction_blocklist` and modifies the instruction pool for the specific actor.

    === "Syntax"
        ```yaml
        actors:
          - <actor_name>:
              instruction_blocklist:
                - <instruction1>
                - <instruction2>
                ...
        ```

#### `fault_blocklist`

:   <span class="inline-box" title="Default Value">:material-water: `[]`</span> Actor-specific fault blocklist.

:   For example, when using `user-to-kernel-access`, you typically want to add it to the kernel actor's `fault_blocklist` to prevent the kernel from accessing its own memory (which would not be a cross-privilege access).

    !!! info "Priority"
        This list has priority over the global `faults_allowlist` and modifies the fault-inducing instrumentation for the specific actor.

    === "Syntax"
        ```yaml
        actors:
          - <actor_name>:
              fault_blocklist:
                - <fault1>
                - <fault2>
                ...
        ```
    === "Available Options"
        See [`faults_allowlist`](#faults_allowlist) for the list of available faults.


## <a name="data-generator"></a> Data Generator Configuration

#### `data_generator`

:   <span class="inline-box" title="Default Value">:material-water: `random`</span> Select the method of test case data generation.

    === "Syntax"
        ```yaml
        data_generator: <type>
        ```
    === "Available Options"
        `random`
    === "Options Explained"
        * `random` - generate random input data for the test cases. This is the only supported option at the moment.

#### `data_generator_seed`

:   <span class="inline-box" title="Default Value">:material-water: `10`</span> Seed of the test case data generator. If set to zero, a random seed will be used for each run.

    === "Syntax"
        ```yaml
        data_generator_seed: <seed>
        ```

#### `data_generator_entropy_bits`

:   <span class="inline-box" title="Default Value">:material-water: `31`</span> Entropy of the random values created by the data generator.

    === "Syntax"
        ```yaml
        data_generator_entropy_bits: <bits>
        ```
    === "Allowed Values"
        Integer in the range `[1, 31]`

#### `input_gen_probability_of_special_value`

:   <span class="inline-box" title="Default Value">:material-water: `0.05`</span> When set to a non-zero value, the data generator will occasionally produce special values (such as zero or MAX_INT) alongside random values, with the frequency controlled by this probability. These special values help exercise fast-path optimizations in the microarchitecture.

    === "Syntax"
        ```yaml
        input_gen_probability_of_special_value: <probability>
        ```
    === "Allowed Values"
        Float in the range `[0.0, 1.0]`

#### `inputs_per_class`

:   <span class="inline-box" title="Default Value">:material-water: `2`</span> Number of inputs generated for each input class via input boosting (aka Contract-Driven Input Generation). For the explanation of the input classes and the generation algorithm, see [this paper](https://arxiv.org/pdf/2301.07642), Section 4.D. Contract-driven Input Generator.

    === "Syntax"
        ```yaml
        inputs_per_class: <count>
        ```


## <a name="contract"></a> Contract Configuration

#### `contract_execution_clause`

:   <span class="inline-box" title="Default Value">:material-water: `['seq']`</span> The execution clause of the contract. Multiple clauses can be combined to form a more permissive contract.

    === "Syntax"
        ```yaml
        contract_execution_clause:
          - <clause>
        ```
    === "Available Options"
        `seq` | `no_speculation` | `seq-assist` | `cond` | `conditional_br_misprediction` | `bpas` | `nullinj-fault` | `nullinj-assist` | `delayed-exception-handling` | `div-zero` | `div-overflow` | `meltdown` | `fault-skip` | `noncanonical` | `vspec-ops-div` | `vspec-ops-memory-faults` | `vspec-ops-memory-assists` | `vspec-ops-gp` | `vspec-all-div` | `vspec-all-memory-faults` | `vspec-all-memory-assists`
    === "Options Explained"
        * `seq` - sequential execution.
        * `no_speculation` - sequential execution. Synonym for `seq`.
        * `seq-assist` - sequential execution with possible microcode assists.
        * `cond` - permitted misprediction of conditional branches.
        * `conditional_br_misprediction` - permitted misprediction of conditional branches. Synonym for `cond`.
        * `bpas` - permitted speculative store bypass
        * `nullinj-fault` - page faults are permitted to speculatively return zero.
        * `nullinj-assist` - microcode assists are permitted to speculatively return zero.
        * `delayed-exception-handling` - upon an exception or a fault, data-independent instructions that follow the exception are allowed to execute speculatively.
        * `meltdown` - permission-based page faults are permitted to speculatively return the value in the memory.
        * `fault-skip` - upon a fault, the faulting instruction is speculatively skipped.
        * `noncanonical` - permitted speculative non-canonical memory accesses.
        * `vspec*` - experimental contracts for value speculation. See [this paper](https://www.usenix.org/system/files/usenixsecurity23-hofmann.pdf) for details.
        * `div-zero` - experimental contract; do not use.
        * `div-overflow` - experimental contract; do not use.

#### `contract_observation_clause`

:   <span class="inline-box" title="Default Value">:material-water: `ct`</span> The observation clause of the contract. In most cases, the default value should be used.

    === "Syntax"
        ```yaml
        contract_observation_clause: <clause>
        ```
    === "Available Options"
        `none` | `l1d` | `memory` | `pc` | `ct` | `loads+stores+pc` | `ct-nonspecstore` | `ctr` | `arch` | `tct` | `tcto` | `ct-ni`
    === "Options Explained"
        * `none` - the model observes nothing. Useful for testing the fuzzer.
        * `l1d` - the model observes the addresses of data accesses, adjusted to imitate the L1D cache trace. Has very few real applications, and should be generally avoided.
        * `memory` - the model observes the addresses of data accesses.
        * `ct` (constant time tracer) - the model observes the addresses of data accesses and the control flow.
        * `loads+stores+pc` - the model observes the addresses of data accesses and the control flow. Synonym for `ct`.
        * `ct-nonspecstore` - the model observes the addresses of data accesses and the control flow, but does not observe the addresses of stores during speculation.
        * `ctr` - the model observes the addresses of data accesses and the control flow, as well as the values of the general-purpose registers.
        * `arch` - the model observes the addresses of data accesses and the control flow, as well as the values loaded from memory. This clause imitates the security guarantees provided by secure speculation mechanisms like STT.
        * `tct` (truncated constant time tracer) - the model observes the addresses of memory accesses and of the program counter at cache line granularity.
        * `tcto` (truncated constant time tracer with overflows) - the model observes the addresses of memory accesses and of the program counter at cache line granularity, and additionally observes cache line overflows.
        * `ct-ni` - (only available in multi-actor context) when executing actors with `observer: false`, the model observes the same data as with `ct`. When executing actors with `observer: true`, the model observes complete memory of the actor as well as their register values.

#### `model_backend`

:   <span class="inline-box" title="Default Value">:material-water: `unicorn`</span> The backend used to implement the contract model.

    === "Syntax"
        ```yaml
        model_backend: <backend>
        ```
    === "Available Options"
        `dummy` | `unicorn` | `dynamorio`
    === "Options Explained"
        * `unicorn` - use Unicorn-based implementation of the model. This backend is more mature and feature-rich, but it supports a considerably smaller set of instructions than DynamoRIO (essentially, only the base x86 or ARM instruction sets, without any extensions).
        * `dynamorio` - use DynamoRIO-based implementation of the model. This backend is less mature and supports fewer contracts and features than Unicorn, but it can handle a much larger set of instructions, including complex extensions like AVX-512 on x86-64. It is also generally faster than Unicorn, especially when testing large test cases or running with many inputs per test case.
        * `dummy` - use a dummy model. This model always returns the same (empty) contract trace, and as such will not produce meaningful results. This option is useful, however, when root-causing violations, because it allows collecting hardware traces without running the model, hence making it possible to trace instructions that are not supported by any of the backends.

#### `model_min_nesting`

:   <span class="inline-box" title="Default Value">:material-water: `1`</span> Minimum number of nested mispredictions in the model. This value is used to generate the contract traces on the fast path of the fuzzer. Choose a small value when speculation is rare, and a larger value when speculation is common.

:   This option is a pure performance optimization. It only impacts the speed of fuzzing, and not its correctness.

    === "Syntax"
        ```yaml
        model_min_nesting: <depth>
        ```

#### `model_max_nesting`

:   <span class="inline-box" title="Default Value">:material-water: `30`</span> Maximum number of nested mispredictions in the model. This value is used to generate the contract traces on the slow path of the fuzzer, i.e., when a potential violation is detected and the fuzzer tries to check if it is a true positive.

:   In contrast to `model_min_nesting`, this option could cause false positives if set too low. Thus, it is advisable to set it to a sufficiently high value to cover all possible nested mispredictions in the test cases. Leave the default unless you are sure that a lower value is sufficient.

    === "Syntax"
        ```yaml
        model_max_nesting: <depth>
        ```

#### `model_max_spec_window`

:   <span class="inline-box" title="Default Value">:material-water: `250`</span> Size of the speculation window in the model.

:    This option sets a trade-off between accuracy and performance. A larger speculation window avoids potential false positives due to inaccurate modelling of the speculation, but it also slows down the model execution. Leave the default unless you are sure that a different value is needed.

    === "Syntax"
        ```yaml
        model_max_spec_window: <size>
        ```

## <a name="executor"></a> Executor Configuration

#### `executor`

:   <span class="inline-box" title="Default Value is Chosen Automatically Based on the Target CPU">:octicons-cpu-24:</span> ISA-specific version of the executor to use. The default value is auto-detected based on `cpuinfo`. Should be changed only if the auto-detection fails.

    === "Syntax"
        ```yaml
        executor: <type>
        ```
    === "Available Options"
        `x86-64-intel` | `x86-64-amd` | `arm64`

#### `executor_mode`

:   <span class="inline-box" title="Default Value">:material-water: `P+P`</span> Method of collecting hardware traces in the executor. The method determines the contents of hardware traces.

    === "Syntax"
        ```yaml
        executor_mode: <mode>
        ```
    === "Available Options"
        `P+P` | `F+R` | `E+R` | `PP+P` | `TSC`
    === "Options Explained"
        * `P+P` - prime and probe side-channel attack. The hardware traces contain the cache sets that were accessed during the execution of the test case.
        * `F+R` - flush and reload side-channel attack. The hardware traces contain the memory addresses that were accessed during the execution of the test case.
        * `E+R` - evict and reload side-channel attack. The hardware traces contain the cache sets that were accessed during the execution of the test case.
        * `PP+P` - partial prime and probe (i.e., leave a subset of cache lines unprimed). The hardware traces contain the cache sets that were accessed during the execution of the test case.
        * `TSC` - use `RDTSCP` instruction to measure the execution time of test cases. The hardware traces contain the execution time, in cycles.

#### `executor_warmups`

:   <span class="inline-box" title="Default Value">:material-water: `5`</span> Number of warmup rounds executed before starting to collect hardware traces.

    === "Syntax"
        ```yaml
        executor_warmups: <count>
        ```

#### `executor_sample_sizes`

:   <span class="inline-box" title="Default Value">:material-water: `[10, 50, 100, 500]`</span> A list of sample sizes to be used during the measurements.

    !!! info "Clarification"
        Executor normally performs measurements multiple times for each test case in order to collect a sample of hardware traces. This allows Revizor to tolerate noise and non-determinism in the measurements by applying statistical methods for comparing the traces.

        For performance reasons, Revizor does not immediately use a large sample size. Instead, it starts with a small sample, collects the traces, and checks if a violation is detected. If no violation is detected, the executor assumes that the test case is safe, and moves on to the next one. If a violation is detected, however, the executor tries to reproduce it with larger sample sizes.

        This option defines the list of sample sizes through which Revizor will iterate in this process. To make it sensible, the list should be sorted in ascending order with a reasonable gap between the sizes.

    === "Syntax"
        ```yaml
        executor_sample_sizes:
          - <sample_size1>
          - <sample_size2>
          ...
        ```

#### `executor_filtering_repetitions`

:   <span class="inline-box" title="Default Value">:material-water: `10`</span> The sample size to be used by the speculation and observation filters.

    === "Syntax"
        ```yaml
        executor_filtering_repetitions: <count>
        ```

#### `executor_taskset`

:   <span class="inline-box" title="Default Value">:material-water: `0`</span> The CPU core ID which the executor will use for running test cases. That is, the executor process will be pinned to this core.

    === "Syntax"
        ```yaml
        executor_taskset: <core_id>
        ```

#### `enable_pre_run_flush`

:   <span class="inline-box" title="Default Value">:material-water: `True`</span> If enabled, the executor will do its best to flush the microarchitectural state before running test cases.

    === "Syntax"
        ```yaml
        enable_pre_run_flush: <True|False>
        ```

## <a name="analyser"></a> Analyser Configuration

#### `analyser`

:   <span class="inline-box" title="Default Value">:material-water: `chi2`</span> The type of the analyser that is used to compare hardware traces against contract traces.

    === "Syntax"
        ```yaml
        analyser: <type>
        ```
    === "Available Options"
        `chi2` | `mwu` | `sets` | `bitmaps`
    === "Options Explained"
        * `sets` - combine the hardware traces for each input into a set. A violation is reported if two inputs in the same contract-equivalence class have different sets of hardware traces.
        * `bitmaps` - combine the hardware traces for each input into a bitmap. A violation is reported if two inputs in the same contract-equivalence class have different bitmaps of hardware traces.
        * `chi2` - use the chi-squared homogeneity test to compare the hardware traces of inputs in the same contract-equivalence class. This test effectively checks if the hardware traces from two different inputs come from the same distribution. A violation is reported if the test fails.
        * `mwu` - [experimental; both false positives and negatives are possible] use the Mann-Whitney U test to compare the hardware traces of inputs in the same contract-equivalence class. This test effectively checks if the hardware traces from two different inputs come from the same distribution. A violation is reported if the test fails.

#### `analyser_subsets_is_violation`

:   <span class="inline-box" title="Default Value">:material-water: `False`</span> This option is relevant only for the `sets` and `bitmaps` analysers. If enabled, the analyser will label hardware traces as mismatching even if they form a subset relation. If disabled (the default), hardware traces that form a subset relation are not labeled as mismatching.

    === "Syntax"
        ```yaml
        analyser_subsets_is_violation: <True|False>
        ```

#### `analyser_outliers_threshold`

:   <span class="inline-box" title="Default Value">:material-water: `0.1`</span> This option is relevant only for the `sets` and `bitmaps` analysers. The analyser will ignore the hardware traces that appear in less than this percentage of the sampled traces.

    === "Syntax"
        ```yaml
        analyser_outliers_threshold: <threshold>
        ```

#### `analyser_stat_threshold`

:   <span class="inline-box" title="Default Value">:material-water: `0.5`</span> This option is relevant only for the `chi2` and `mwu` analysers. The threshold for the statistical tests. If a pair of hardware traces has a (normalized) test statistic below the threshold, then the traces are considered equivalent.

:   For the chi2 test, the threshold is applied to the `statistics / (len(htrace1) + len(htrace2))`.

:   For the mwu test, the threshold is applied to the p-value.

    === "Syntax"
        ```yaml
        analyser_stat_threshold: <threshold>
        ```

## <a name="misc"></a> Miscellaneous Configuration

#### `coverage_type`

:   <span class="inline-box" title="Default Value">:material-water: `none`</span> The type of coverage tracking.

    === "Syntax"
        ```yaml
        coverage_type: <type>
        ```
    === "Available Options"
        `none` | `model_instructions`
    === "Options Explained"
        * `none` - disable coverage tracking.
        * `model_instructions` - track how many times the model executed each instruction in the target ISA.

#### `minimizer_retries`

:   <span class="inline-box" title="Default Value">:material-water: `1`</span> Number of minimization retries. When the minimizer performs a check to reduce a test case, each check is attempted this number of times and it succeeds if at least one check is successful.

    === "Syntax"
        ```yaml
        minimizer_retries: <count>
        ```

## Unique x86-64 Options


#### `x86_executor_enable_ssbp_patch`

:   <span class="inline-box" title="Default Value">:material-water: `True`</span> Enable a microcode patch against Speculative Store Bypass, if available.

    === "Syntax"
        ```yaml
        x86_executor_enable_ssbp_patch: <True|False>
        ```

#### `x86_executor_enable_prefetcher`

:   <span class="inline-box" title="Default Value">:material-water: `False`</span> Enable all prefetchers, if the software controls are available.

    === "Syntax"
        ```yaml
        x86_executor_enable_prefetcher: <True|False>
        ```

#### `x86_disable_div64`

:   <span class="inline-box" title="Default Value">:material-water: `True`</span> Do not generate 64-bit division instructions. Useful for avoiding certain types of speculation that are specific to 64-bit division.

    === "Syntax"
        ```yaml
        x86_disable_div64: <True|False>
        ```

#### `x86_enable_hpa_gpa_collisions`

:   <span class="inline-box" title="Default Value">:material-water: `False`</span> When a test case contains at least one guest actor, allocate its memory in the guest physical address space to match the corresponding host physical addresses of the main actor. Useful for testing Foreshadow-like leaks.

    === "Syntax"
        ```yaml
        x86_enable_hpa_gpa_collisions: <True|False>
        ```

#### `x86_generator_align_locks`

:   <span class="inline-box" title="Default Value">:material-water: `True`</span> When generating memory accesses with locks, apply instrumentation to align the locks to 8 bytes. Useful for avoiding faults on unaligned accesses.

    === "Syntax"
        ```yaml
        x86_generator_align_locks: <True|False>
        ```

---

## What's Next?

- [Command Line Interface](cli.md) - CLI options and modes
- [demo/big-fuzz.yaml](https://github.com/microsoft/side-channel-fuzzer/tree/main/demo/big-fuzz.yaml) - Comprehensive example configuration
- [demo/](https://github.com/microsoft/side-channel-fuzzer/tree/main/demo/) - Example configurations for various scenarios


================================================
FILE: docs/ref/index.md
================================================
# Reference Documentation

Complete technical reference for all Revizor components, commands, configuration options, and formats.

## User-Facing Components

* [Command Line Interface](cli.md)
Complete reference for all `rvzr` command-line options and arguments. Covers common options and mode-specific parameters.
* [Execution Modes](modes.md)
Detailed specifications for all execution modes: fuzzing, template fuzzing, reproduce, minimize, analyse, generate, and download_spec.

* [Configuration Options](config.md)
Complete reference for all configuration file parameters organized by component: fuzzer, generator, executor, model, analyser, and actors.

* [Macros Reference](macros.md)
Complete reference for all template macros including measurement control, fault handling, code generation, and actor transitions.

* [Minimization Passes](minimization-passes.md)
Complete list of available minimization passes for reducing test case complexity while preserving violations.

## Architecture & Internals

Low-level technical references for Revizor's internal components.

* [Binary Formats](binary-formats.md)
Specifications for Revizor's binary file formats: RCBF (Revizor Contract Binary Format) and RDBF (Revizor DynamoRIO Binary Format).

* [Registers](registers.md)
Register specifications and conventions for x86-64 and ARM64 architectures.

* [Sandbox](sandbox.md)
Memory layout and sandboxing mechanisms used during test execution.


================================================
FILE: docs/ref/macros.md
================================================
# Macros

This document provides a complete reference for all macros available in Revizor.

!!! note "Related Documentation"
    This document is intended as a reference; if you're looking for a practical guide on how to use the `macros`, please refer to [How-To: Use Macros](../howto/use-macros.md).

## Overview

Macros are special pseudo-instructions in assembly test cases that appear as labels with the `.macro` prefix. They are dynamically expanded into actual implementations during execution by the model and executor. Macros enable complex operations like domain transitions, measurement control, and random code generation within test cases.

Macros accept up to four static arguments. Arguments are strictly static (either a constant integer or a string); dynamic values (registers, memory addresses) are not supported.

=== "Syntax"

    ```assembly
    .macro.<macro_name>.<argument1>.<argument2>.<argument3>.<argument4>:
    ```

=== "Example"

    ```assembly
    ; Macro to switch execution to
    ; a function called `function_user_0` that belongs to the actor `user`
    .macro.switch.user.function_user_0:
    ```

## Measurement Macros

Control the start and end of hardware and contract trace collection.

#### <a name="measurement_start"></a> `measurement_start`

:   Begins hardware and contract trace collection. Instructions before this macro are executed but not included in the contract/hardware traces.

    === "Syntax"
        ```assembly
        .macro.measurement_start:

        ; alternative
        .macro.measurement_start.<label>:
        ```

    === "Arguments"
        1. `label` (optional): Unique identifier if the macro is used multiple times


#### <a name="measurement_end"></a> `measurement_end`

:   Ends hardware and contract trace collection. Instructions after this macro are executed but not included in the contract/hardware traces.

    === "Syntax"
        ```assembly
        .macro.measurement_end:

        ; alternative
        .macro.measurement_end.<label>:
        ```

    === "Arguments"
        1. `label` (optional): Unique identifier if the macro is used multiple times


## Transition Macros

Switch between different actors and privilege levels, including kernel-user and host-guest transitions.

#### <a name="set_h2g_target"></a> `set_h2g_target`

:   Sets the VM entry point for host-to-guest transitions.

    === "Syntax"
        ```assembly
        .macro.set_h2g_target.<actor_name>.<function_name>:
        ```

    === "Arguments"
        - `actor_name`: Target guest actor identifier
        - `function_name`: Entry point function in guest actor

#### <a name="set_g2h_target"></a> `set_g2h_target`

:   Sets the VM exit point for guest-to-host transitions.

    === "Syntax"
        ```assembly
        .macro.set_g2h_target.<actor_name>.<function_name>:
        ```

    === "Arguments"
        - `actor_name`: Target host actor identifier
        - `function_name`: Landing point function in host actor

#### <a name="switch_h2g"></a> `switch_h2g`

:   Performs host-to-guest transition (VM entry). The entry and exit points must be set beforehand using `set_h2g_target` and `set_g2h_target` macros.

    === "Syntax"
        ```assembly
        .macro.switch_h2g.<actor_name>.<label>:
        ```

    === "Arguments"
        - `actor_name`: Target guest actor identifier
        - `label` (optional): Unique identifier if the macro is used multiple times


#### <a name="landing_h2g"></a> `landing_h2g`

:   Marks the guest landing point after host-to-guest transition. This macro works together with `switch_h2g` to ensure complete restoration of the execution context.

    === "Syntax"
        ```assembly
        .macro.landing_h2g.<label>:
        ```

    === "Arguments"
        - `label` (optional): Unique identifier if the macro is used multiple times


#### <a name="switch_g2h"></a> `switch_g2h`

:   Performs guest-to-host transition (VM exit). The entry and exit points must be set beforehand using `set_h2g_target` and `set_g2h_target` macros.

    === "Syntax"
        ```assembly
        .macro.switch_g2h.<actor_name>.<label>:
        ```

    === "Arguments"
        - `actor_name`: Target host actor identifier
        - `label` (optional): Unique identifier if the macro is used multiple times


#### <a name="landing_g2h"></a> `landing_g2h`

:   Marks the host landing point after guest-to-host transition. This macro works together with `switch_g2h` to ensure complete restoration of the execution context.

    === "Syntax"
        ```assembly
        .macro.landing_g2h.<label>:
        ```

    === "Arguments"
        - `label` (optional): Unique identifier if the macro is used multiple times


#### <a name="set_k2u_target"></a> `set_k2u_target`

:   Sets the user mode entry point for kernel-to-user transitions.

    === "Syntax"
        ```assembly
        .macro.set_k2u_target.<actor_name>.<function_name>:
        ```

    === "Arguments"
        - `actor_name`: Target user-mode actor identifier
        - `function_name`: Entry point function in user actor


#### <a name="set_u2k_target"></a> `set_u2k_target`

:   Sets the kernel mode entry point for user-to-kernel transitions.

    === "Syntax"
        ```assembly
        .macro.set_u2k_target.<actor_name>.<function_name>:
        ```

    === "Arguments"
        - `actor_name`: Target kernel-mode actor identifier
        - `function_name`: Entry point function in kernel actor


#### <a name="switch_k2u"></a> `switch_k2u`

:   Performs kernel-to-user transition (privilege level drop). The entry and exit points must be set beforehand using `set_k2u_target` and `set_u2k_target` macros.

    === "Syntax"
        ```assembly
        .macro.switch_k2u.<actor_name>.<label>:
        ```

    === "Arguments"
        - `actor_name`: Target user actor identifier
        - `label` (optional): Unique identifier if the macro is used multiple times


#### <a name="switch_u2k"></a> `switch_u2k`

:   Performs user-to-kernel transition (privilege level escalation). The entry and exit points must be set beforehand using `set_k2u_target` and `set_u2k_target` macros.

    === "Syntax"
        ```assembly
        .macro.switch_u2k.<actor_name>.<label>:
        ```

    === "Arguments"
        - `actor_name`: Target kernel actor identifier
        - `label` (optional): Unique identifier if the macro is used multiple times


#### <a name="landing_k2u"></a> `landing_k2u`

:   Marks the user-mode landing point after kernel-to-user transition.  This macro works together with `switch_k2u` to ensure complete restoration of the execution context.

    === "Syntax"
        ```assembly
        .macro.landing_k2u.<label>:
        ```

    === "Arguments"
        - `label` (optional): Unique identifier if the macro is used multiple times


#### <a name="landing_u2k"></a> `landing_u2k`

:   Marks the kernel-mode landing point after user-to-kernel transition.  This macro works together with `switch_u2k` to ensure complete restoration of the execution context.

    === "Syntax"
        ```assembly
        .macro.landing_u2k.<label>:
        ```

    === "Arguments"
        - `label` (optional): Unique identifier if the macro is used multiple times

## Fault Handling Macros

Define exception and interrupt handlers within test cases.

#### <a name="fault_handler"></a> `fault_handler`

:   Specifies the control flow target for exceptions and interrupts. When an exception occurs, control transfers to this location. If not defined, the executor uses a default handler that jumps to the test case exit point.

    === "Syntax"
        ```assembly
        .macro.fault_handler:
        ```

    === "Arguments"
        - None


## Environment Configuration Macros

Change the execution environment from within a test case.

#### <a name="set_data_permissions"></a> `set_data_permissions`

:   Configures data permissions on the faulty page of the current actor by modifying the page table entry (PTE) permissions.

    === "Syntax"
        ```assembly
        .macro.set_data_permissions.<set_mask>.<clear_mask>:
        ```
    === "Arguments"
        - `set_mask`: 16-bit bitmask specifying which permission bits to set (ORed with the faulty page's PTE)
        - `clear_mask`: 16-bit bitmask specifying which permission bits to clear (ANDed with the faulty page's PTE)


## Generation Macros

Define automatically-generated points within a template. Available only in the [Template Fuzzing Mode](modes.md#tfuzz).

In contrast to the rest of the macros, generation macros are used by the generator instead of the executor or model. By the time the executor or the model runs the test case, these macros are expected to have already been expanded into actual code.

#### <a name="random_instructions"></a> `random_instructions`

:   Generates N random instructions during template expansion. Used in template fuzzing mode to insert randomized code sequences.

    === "Syntax"
        ```assembly
        .macro.random_instructions.<num_instructions>.<avg_mem_accesses>.<label>:
        ```

    === "Arguments"
        - `num_instructions`: Number of random instructions to generate
        - `avg_mem_accesses`: Average number of memory accesses. Average means that when a large-enough number of test cases are generated, the mean number of memory accesses per expansion of this macro will approximate this value.
        - `label` (optional): Unique identifier if the macro is used multiple times

---

## What's Next?

- [How to Use Macros](../howto/use-macros.md) - Detailed usage guide and implementation details
- [How to Use Templates](../howto/use-templates.md) - Template-based testing
- [Actors](../topics/actors.md) - Multi-domain testing concepts

**Examples:**

- [demo/tsa-l1d/template.asm](https://github.com/microsoft/side-channel-fuzzer/tree/main/demo/tsa-l1d/template.asm) - TSA-L1D attack template with actor transitions
- [demo/tsa-sq/template.asm](https://github.com/microsoft/side-channel-fuzzer/tree/main/demo/tsa-sq/template.asm) - TSA-SQ attack template with actor transitions


================================================
FILE: docs/ref/minimization-passes.md
================================================
# Minimization Passes

This document provides a detailed list of all available minimization features (passes) supported in the `minimize` execution mode of Revizor. These passes are used to simplify randomly generated violation artifacts to enable human analysis.

!!! note "Related Documentation"
    This document is intended as a reference; if you're looking for a practical guide on how to use the `minimize` mode, please refer to [How-To: Minimize Violation](../howto/minimize.md).

## Types of Passes

`minimize` mode supports three types of passes:

* program passes modify the program
* input passes modify the input sequence
* analysis passes provide additional information about the violation, usually by adding comments to the program.

## Program Passes

#### <a name="enable-instruction-pass"></a>`--enable-instruction-pass`

:   Enables the instruction minimization pass that iteratively removes instructions from the program while preserving the violation.

#### <a name="enable-simplification-pass"></a>`--enable-simplification-pass`

:   Enables the instruction simplification pass that replaces complex instructions with simpler ones while preserving the violation.

#### <a name="enable-nop-pass"></a>`--enable-nop-pass`

:   Enables the NOP replacement pass that iteratively replaces instructions with NOPs of the same size while preserving the violation.

#### <a name="enable-constant-pass"></a>`--enable-constant-pass`

:   Enables the constant simplification pass that replaces immediate arguments of instructions with 0s while preserving the violation.

#### <a name="enable-mask-pass"></a>`--enable-mask-pass`

:   Enables the mask simplification pass that reduces the size of the instrumentation masks while preserving the violation.

#### <a name="enable-label-pass"></a>`--enable-label-pass`

:   Enables the label removal pass that removes unused labels from the assembly file.

#### <a name="enable-fence-pass"></a>`--enable-fence-pass`

:   Enables the fence insertion pass that adds LFENCEs after instructions while preserving the violation.

## Input Passes

#### <a name="enable-input-seq-pass"></a>`--enable-input-seq-pass`

:   Enables the input sequence minimization pass that removes inputs from the original generated sequence while preserving the violation.

#### <a name="enable-input-diff-pass"></a>`--enable-input-diff-pass`

:   Enables the violating input difference minimization pass that operates on the pair of (contract-equivalent) inputs that triggered the violation and attempts to minimize the difference between the two inputs.
It does so by iterating over all bytes in the inputs, and (1) attempting to replace each byte with zero, and if it fails, (2) copying the byte from the first input to the second input.

## Analysis Passes

#### <a name="enable-source-analysis"></a>`--enable-source-analysis`

:   Enables the speculation source identification pass that analyzes the program to identify suspected sources of speculation, and adds the corresponding comments to the assembly file.
Note that the analysis is not guaranteed to be correct, and it may produce false results.

#### <a name="enable-comment-pass"></a>`--enable-comment-pass`

:   Enables the violation comment pass that adds comments to the assembly file with details about the violation.


================================================
FILE: docs/ref/modes.md
================================================
# Execution Modes

Revizor supports several modes of operation, each targeting a different use case.
The selection of the mode is described in the [CLI documentation](cli.md).
Below is a brief description of each mode.

## Overview

| Mode             | CLI Key       | Use Case                      | Description                                                                                                |
| ---------------- | ------------- | ----------------------------- | ---------------------------------------------------------------------------------------------------------- |
| Fuzzing          | fuzz          | General Testing               | Test a CPU against a contract model. Test cases generated randomly                                         |
| Template Fuzzing | tfuzz         | Targeted Testing              | Test a CPU against a contract model. Test cases generated based on a template                              |
| Reproduce        | reproduce     | Reproducing a Violation       | Reproduce a violation found by fuzzing OR run a manually-written test case                                 |
| Minimization     | minimize      | Simplification of a Violation | Simplify a test case by applying a series of simplification passes to the test case program and its inputs |
| Trace Analysis   | analyse       | External Integration          | Analyze pre-recorded traces for violations                                                                 |
| Generation       | generate      | External Integration          | Only generate test cases, without testing them                                                             |
| ISA Spec Install | download_spec | Tool Installation             | Call a script that downloads the instruction set specification                                             |


## <a name="fuzz"></a> `fuzz`

=== "Syntax"
```bash
$ rvzr fuzz [OPTIONS]
```

:   Main fuzzing mode of Revizor.
In this mode, Revizor randomly generates test cases and executes them on the target CPU and the model, records the corresponding traces, and checks if the hardware traces contain the same (or less) information as the contract traces. That is, it implements the [Model-Based Relational Testing](../intro/03-primer.md#model-based-relational-testing-and-revizor) approach.

:   **Use case:** Broad testing of CPU behavior against contract specifications.


## <a name="tfuzz"></a> `tfuzz`

=== "Syntax"
```bash
$ rvzr tfuzz [OPTIONS]
```

:   Similar to the fuzzing mode, but test cases are generated based on a template. For details on templates, see the [template fuzzing how-to guide](../howto/use-templates.md).

:   **Use case:** Targeted testing of specific scenarios, microarchitectural patches, or actor interactions.


## <a name="reproduce"></a> `reproduce`

=== "Syntax"
```bash
$ rvzr reproduce [OPTIONS]
```
:   In this mode, Revizor loads a specific test case and its inputs from files. It performs a single fuzzing round with the provided test case and inputs, and reports the results.

:   Test cases can be violations from previous fuzzing runs or manually-written test programs.

:   **Use cases:**

    - Checking reproducibility: Testing if a violation artifact can be consistently reproduced on other CPUs or configurations.
    - Verification of a violation: Confirming that a violation is genuine and not a false positive.
    - Manual testing: Executing a custom test case written by the user.
    - Root-causing: Checking the impact of manual modifications to a test case.


## <a name="minimize"></a> `minimize`

=== "Syntax"
```bash
$ rvzr minimize [OPTIONS]
```

:   In this mode, Revizor applies simplification passes to a violation test case, reducing program and input complexity while preserving the violation behavior.

:   **Use case:** Simplify violations for root cause analysis.


## <a name="analyse"></a> `analyse`

=== "Syntax"
```bash
$ rvzr analyse [OPTIONS]
```

:   In this mode, Revizor analyzes pre-recorded contract and hardware traces for violations without executing test cases.
Accepts trace files as input and applies the configured analyser to detect contract violations.

:   **Use case:** Integration with external tools that perform trace collection separately from Revizor.


## <a name="generate"></a> `generate`

=== "Syntax"
```bash
$ rvzr generate [OPTIONS]
```
:   Generates test cases without execution. Outputs test programs and inputs to them.

:   **Use case:** Integration with external tools that use Revizor's test case generation capabilities.


## <a name="download_spec"></a> `download_spec`

=== "Syntax"
```bash
$ rvzr download_spec [OPTIONS]
```
:   This mode is only used when Revizor is being set up. Downloads, parses, and stores instruction set specifications in JSON format.

:   **Use case:** Tool installation and ISA specification management.


## What's Next?

* [Command Line Interface](cli.md) - How to run Revizor in different modes
* [Minimization Passes](minimization-passes.md) - Available passes for the `minimize` mode


================================================
FILE: docs/ref/papers.md
================================================
# Research Papers

Revizor is a result of extensive academic research in the field of hardware security and microarchitectural side-channel analysis. Below is a list of key research papers related to Revizor, its underlying concepts, and methodologies:


=== "Main Papers"

    If you use Revizor in your research or work, please consider citing some of the following papers:

    * Original paper that introduced the concept of Model-based Relational Testing as well as the Revizor tool:

        > Oleksii Oleksenko, Christof Fetzer, Boris Köpf, Mark Silberstein. "[Revizor: Testing Black-box CPUs against Speculation Contracts](https://www.microsoft.com/en-us/research/publication/revizor-testing-black-box-cpus-against-speculation-contracts/)" in Proceedings of the 27th ACM International Conference on Architectural Support for Programming Languages and Operating Systems (ASPLOS), 2022.

    * Theoretical foundations of leakage contracts:

        > Marco Guarnieri, Boris Köpf, Jan Reineke, and Pepe Vila. "[Hardware-software contracts for secure speculation](https://www.microsoft.com/en-us/research/publication/hardware-software-contracts-for-secure-speculation/)" in Proceedings of the 2021 IEEE Symposium on Security and Privacy (S&P), 2021.

=== "Extensions to Revizor"

    The following papers present significant extensions and improvements to Revizor:

    * Paper that introduced speculation filtering, observation filtering, and contract-based input generation:

        > Oleksii Oleksenko, Marco Guarnieri, Boris Köpf, and Mark Silberstein. "[Hide and Seek with Spectres: Efficient discovery of speculative information leaks with random testing](https://www.microsoft.com/en-us/research/publication/hide-and-seek-with-spectres-efficient-discovery-of-speculative-information-leaks-with-random-testing/)" in Proceedings of the 2023 IEEE Symposium on Security and Privacy (SP), 2023.

    * Paper that introduced exception-based testing (i.e., focus on Meltdown, Foreshadow) into Revizor:

        > Jana Hofmann, Emanuele Vannacci, Cédric Fournet, Boris Köpf, and Oleksii Oleksenko. "[Speculation at Fault: Modeling and Testing Microarchitectural Leakage of CPU Exceptions.](https://www.usenix.org/conference/usenixsecurity23/presentation/hofmann)" in Proceedings of 32nd USENIX Security Symposium (USENIX Security), 2023.

    * Paper that introduced testing of cross-VM and user-kernel leaks in Revizor, as well as presented TSA attacks on AMD CPUs:

        > Oleksii Oleksenko, Flavien Solt, Cédric Fournet, Jana Hofmann, Boris Köpf, Stavros Volos. "[Enter, Exit, Page Fault, Leak: Testing Isolation Boundaries for Microarchitectural Leaks](https://www.microsoft.com/en-us/research/wp-content/uploads/2025/07/Enter-Exit-SP26.pdf)" in Proceedings of the 2026 IEEE Symposium on Security and Privacy (SP), 2026.

=== "Using Revizor"

    The following papers present case studies and practical applications of (parts of) Revizor:

    * **AMuLeT, 2025**: Ported Revizor to test Gem5 models of secure speculation mechanisms

        > Bo Fu, Leo Tenenbaum, David Adler, Assaf Klein, Arpit Gogia, Alaa R. Alameldeen, Marco Guarnieri, Mark Silberstein, Oleksii Oleksenko, and Gururaj Saileshwar. "[AMuLeT: Automated Design-Time Testing of Secure Speculation Countermeasures](https://arxiv.org/pdf/2503.00145)". In Proceedings of the 30th ACM International Conference on Architectural Support for Programming Languages and Operating Systems, Volume 2 (ASPLOS '25). Association for Computing Machinery, New York, NY, USA, 32–47. https://doi.org/10.1145/3676641.3716247

    * **LmTest, 2024**: Used a modified version of Revizor's leakage model to test cryptographic libraries against speculation contracts

        > Gilles Barthe, Marcel Böhme, Sunjay Cauligi, Chitchanok Chuengsatiansup, Daniel Genkin, Marco Guarnieri, David Mateos Romero, Peter Schwabe, David Wu, and Yuval Yarom. 2024. Testing Side-channel Security of Cryptographic Implementations against Future Microarchitectures. In Proceedings of the 2024 on ACM SIGSAC Conference on Computer and Communications Security (CCS '24). Association for Computing Machinery, New York, NY, USA, 1076–1090. https://doi.org/10.1145/3658644.3670319


================================================
FILE: docs/ref/registers.md
================================================
# Register Allocation

The test cases are executed in a sandboxed environment, where some of the registers are reserved for internal use, and some are available for use in the test cases.
Below is a list of registers and their purpose.

!!! info "Advanced Topic"
    This is an advanced topic describing internal implementation details of Revizor. You are unlikely to need this information unless you are extending or modifying Revizor's core components.

#### `R15`

Contains the base address of the UTILITY area in the [sandbox](sandbox.md).

If the test case does not enter a VM, the register value remains constant during the execution of the test cases.
Otherwise, the register value is updated to point to the UTILITY area of the currently active VM when the `switch_h2g` macro is called, and it is restored to the original value when the `switch_g2h` macro is called.

The register is used by internal functions, such as the implementation of Prime+Probe.

#### `R14`

Contains the base address of the current actor's [sandbox](sandbox.md) (namely, it points to the base of the actor's MAIN area).

At the beginning of the test case execution, the register is set to the base address of the MAIN area of the first actor (actor `main`). The register value is updated to point to the MAIN area of the currently active actor when a macro from the `landing_*` group of macros is called. It is also updated by the `fault_handler` macro.

The register is used in test cases as a part of the sandboxing mechanism.
For example, all generated memory accesses are relative to the value stored in `R14`, and have the form of `[R14 + offset]`.


#### `R13` (`HTRACE_REGISTER` constant in the kernel module)

Contains either intermediate or final result of the hardware trace measurements.

Before entering the test case, the register is set to 0.
When a `measurement_start` macro is executed, the register is (optionally) set to the starting value,
such as the initial reading of the time stamp counter when the `TSC` mode is used.
When a `measurement_end` macro is executed, the register is updated with the final value of the measurement and contains the resulting hardware trace.

#### `R12` (`STATUS_REGISTER` constant in the kernel module)

Contains a compressed status of the test case execution:

Bits[0:7] contain a measurement status.
At the beginning of the test case execution, the bits are set to 0.
When `measurement_start` macro is executed, the bits are set to 1.
When `measurement_end` macro is executed, the bits are set to 2.
If the measurement status is not 2 at the end of the test case execution, the kernel module will report an error.

Bits[8:31] are unused.

Bits[32:63] contain a counter of SMI (System Management Interrupt) events.
The counter is set automatically before entering the test case (`READ_SMI_START`), and updated when the test case finishes (`READ_SMI_END`).
If the difference between the readings is not 0, the kernel module will report an error.

#### `R11`

The register is used as a temporary buffer by some of the macros.

Before entering the test case, the register is set to 0.
When certain macros are executed (e.g., `set_k2u_target`), the register will contain temporary values.
The register should not be used in the test case, as the temporary value may be consumed by later macros.

#### `R10, R9, R8`

Store the values of performance counters.
`R10` stores the value of performance counter #1, `R9` stores the value of performance counter #2, and `R8` stores the value of performance counter #3.

Before entering the test case, the registers are set to 0.
When a `measurement_start` macro is executed, the registers are (optionally) set to the starting values.
When a `measurement_end` macro is executed, the registers are updated with the final values of the measurements.


#### Other General Purpose Registers

The remaining registers (`rax`, `rbx`, `rcx`, `rdx`, `rsi`, `rdi`, `rflags`) are available for use in the test cases and can be modified freely.
Special cases are `rsp` and `rbp`, which can be used in the test cases, but their values must always remain within the sandbox (see [Sandbox](sandbox.md)).

#### Vector Registers

Vector registers (`xmm0`-`xmm15`) are also available for use in the test cases.
However, only `xmm0-xmm7` are initialized with input-based values, and the remaining registers are always zero-initialized.

Large-size vector registers (`ymm` and `zmm`) are not supported.


================================================
FILE: docs/ref/runtime-statistic.md
================================================
# Fuzzing Statistics

This document provides a complete reference on how to interpret the runtime statistics output of Revizor. These statistics are generated during fuzzing campaigns and provide insights into the performance and behavior of the fuzzer.

The runtime statistics are essentially printed twice: once during the fuzzing campaign, in the form of a continuously-updated progress log, and once at the end of the campaign, in a summarized report. The statistics in both places have the same meaning, but the final report includes cumulative totals for the entire campaign.

## Runtime Statistics Fields

A typical runtime statistics output looks like this:

```
17    ( 2%)| Stats: Cls:100/100,In:200,R:7,SF:10,OF:7,Fst:0,CN:0,CT:0,P1:0,CS:0,P2:0,V:0> Priming  27
```

This line is continuously updated on each iteration of the fuzzer (after each test case is executed).

The fields are as follows:

* `17    ( 2%)` - The current test case number and progress towards the total number of test cases.
* `Cls:100/100` - The average number of unique equivalence classes per test case. The left number is the number of "effective" classes (those that have at least two hardware inputs), while the right number is the total number of classes observed. In a well-functioning campaign, these numbers should be equal. See [contract equivalence class](../glossary.md#contract-equivalence-class) in the glossary.
* `In:200` - The number of inputs per test case. Normally, this number is equal to the value of the `-i` parameter multiplied by the `inputs_per_class` configuration option.
* `R:7` - Average number of hardware tracing samples per input. See [Trace Analysis - Statistical Comparison](../topics/trace-analysis.md) for more details.
* `SF:10,OF:7,Fst:0,CN:0,CT:0,P1:0,CS:0,P2:0` - The number of test cases that have been filtered by each stage of the false-positive elimination pipeline.
    * `SF` - Number of test cases filtered by the speculation filter.
    * `OF` - Number of test cases filtered by the observation filter.
    * `Fst` - Number of test cases filtered after fast-path execution.
    * `CN` - Number of test cases filtered out when model nesting was increased from 1 (fast path) to `max_model_nesting`.
    * `CT` - Number of test cases that had taint mistakes.
    * `P1` - Number of test cases filtered out by priming stage with the minimal sample size.
    * `CS` - Number of test cases filtered out when the sample size was increased to a non-minimal value.
    * `P2` - Number of test cases filtered out by priming stage with the non-minimal sample size.
* `V:0` - The number of detected violations so far (can be non-zero when running with `--nonstop` flag).
* `Priming  27             ` - Current stage of the false-positive elimination pipeline.

## Final Summary Report

A typical final summary report looks like this:

```
================================ Statistics ===================================

Test Cases: 18
Inputs per test case: 200.0
Violations: 1
Effectiveness:
  Total Cls: 98.0
  Effective Cls: 98.0
Discarded Test Cases:
  Speculation Filter: 10
  Observation Filter: 7
  Fast Path: 0
  Max Nesting Check: 0
  Tainting Check: 0
  Early Priming Check: 0
  Large Sample Check: 0
  Priming Check: 0

Duration: 40.5
Finished at 15:40:23
```

This section summarizes overall statistics from the fuzzing campaign. The fields are similar to those explained in the runtime output section above:

* `Test Cases` - Total number of test cases executed during the campaign.
* `Inputs per test case` - Average number of inputs executed per test case.
* `Violations` - Total number of violations detected during the campaign (may be greater than 1 when running with `--nonstop` flag).
* `Effectiveness` - The average number of unique equivalence classes per test case. `Effective Cls` is the number of "effective" classes (those that have at least two hardware inputs), while `Total Cls` is the total number of classes observed. In a well-functioning campaign, these numbers should be equal. See [contract equivalence class](../glossary.md#contract-equivalence-class) in the glossary.
* `Discarded Test Cases` - The number of test cases that have been filtered by each stage of the false-positive elimination pipeline.
* `Duration` - Total duration of the fuzzing campaign in seconds.
* `Finished at` - Timestamp when the fuzzing campaign completed.


================================================
FILE: docs/ref/sandbox.md
================================================
# Test Case Sandbox

This document describes the isolated environment for executing test cases, which is referred to as the *sandbox*. The sandbox contains the test case code and data, and the test case code is confined to access memory only within the sandbox.

The sandbox is implemented by all modules that execute test cases, including the executor (kernel module) and all model backends (Unicorn, DynamoRIO).
To ensure that the executions are consistent across all modules, the sandbox is structured in the same way in all the modules.

This document describes the memory layout of the sandbox, the initialization of the sandbox memory, and the fault isolation mechanism.

## Memory Layout

The sandbox memory is divided into two main areas: the data sandbox and the code sandbox.
Each actor in the test case has its own sub-area for its data and code, and the layout of these areas is the same for all actors.

### Data Layout

The data area of a test case in a sandbox is organized as follows:


| Offset | Actor ID | Area Name     | Size, B |
| ------ | -------- | ------------- | ------- |
| 0x0    | ACTOR 0  | Macro Stack   | 0x40    |
| 0x40   |          | Underflow Pad | 0xfc0   |
| 0x1000 |          | Main Area     | 0x1000  |
| 0x2000 |          | Faulty Area   | 0x1000  |
| 0x3000 |          | GPR Area      | 0x40    |
| 0x3040 |          | SIMD Area     | 0x100   |
| 0x3140 |          | Overflow Pad  | 0xec0   |
| 0x4000 | ACTOR 1  | Macro Stack   | 0x40    |
| 0x4040 |          | Underflow Pad | 0xfc0   |
| 0x5000 |          | Main Area     | 0x1000  |
| 0x6000 |          | Faulty Area   | 0x1000  |
| 0x7000 |          | GPR Area      | 0x40    |
| 0x7040 |          | SIMD Area     | 0x100   |
| 0x7140 |          | Overflow Pad  | 0xec0   |
| ...    | ...      | ...           | ...     |


The data area is divided into the following regions:

* **Main and Faulty Areas**: These are the two regions of memory that are accessible by the test case code.
  This is enforced by the test case generator, which instruments all memory accesses to ensure that they fall within these regions (see [code-generation](../internals/architecture/code.md) for more details).
  Both areas are initialized with the input data from the [RDBF](binary-formats.md).
  The main area always has default permissions (RW), while the faulty area has permissions that can be configured to cause a fault when accessed.
  This configuration originates from the [config file](config.md).
* **GPR and SIMD Areas**: These regions store the values that will be used by the modules to initialize the general-purpose registers (GPR) and SIMD registers before executing the test case and when switching between actors. Both areas are initialized with the input data from the [RDBF](binary-formats.md).
  The order of registers is: `rax`, `rbx`, `rcx`, `rdx`, `rsi`, `rdi`, `flags`, `rsp` for GPRs, and `xmm0` to `xmm7` for SIMD registers.
* **Over- and Underflow Pads**: These two zero-initialized regions surround the actors' data areas, and their purpose is to determinize the hardware traces on the executor.
  Namely, they are needed for the cases when the CPU speculatively bypasses the sandboxing instrumentation inserted by the test case generator, and the bypass leads to an out-of-bounds memory access.
  As the pads are zero-initialized, the bypassed memory accesses will produce deterministic results.
* **Macro stack**: This region is used to implement complex macros (e.g., VMENTER) that need to save and restore data on the stack with a guarantee that this data won't be corrupted by the following (randomly-generated) instructions (see [macros](macros.md) for more details.)

### Code Layout

The code area of a test case in a sandbox is organized as follows:

| Offset | Actor ID | Area Name       | Size, B |
| ------ | -------- | --------------- | ------- |
| 0x0    | ACTOR 0  | Main Code Area  | 0x2000  |
| 0x2000 |          | Macro Code Area | 0x1000  |
| 0x3000 | ACTOR 1  | Main Code Area  | 0x2000  |
| 0x5000 |          | Macro Code Area | 0x1000  |
| ...    | ...      | ...             | ...     |

The code area is divided into two regions:

* **Main Code Area**: This region contains the binary of the actor's code.
  The code comes from the [RCBF](binary-formats.md) file.
  The first instruction in the code area of actor 0 is the entry point of the test case, and the last instruction of actor 0 is the exit point of the test case.
* **Macro Code Area**: This region contains code of the expanded macros for each actor.
  (see [macros](macros.md) for more details on the macro expansion process.)

### References

* Executor: [rvzr/executor_km/include/sandbox_manager.h](https://github.com/microsoft/side-channel-fuzzer/tree/main/rvzr/executor_km/include/sandbox_manager.h)
* Unicorn backend: [rvzr/sandbox.py](https://github.com/microsoft/side-channel-fuzzer/tree/main/rvzr/sandbox.py)

## Sandbox Initialization

The sandbox is initialized based on the test case code (normally in RCBF format) and the input data (normally in RDBF format).
The following diagram shows the mapping between the RCBF/RDBF files and the sandbox memory layout:

```plaintext
                                        |--------------------|
                   zero initialized ->  | MACRO STACK        |
                                        |--------------------|
                   zero initialized ->  | UNDERFLOW PAD      |
                                        |--------------------|
      RDBF.data[actor_id].main_area ->  | MAIN AREA          |
                                        |--------------------|
    RDBF.data[actor_id].faulty_area ->  | FAULTY AREA        |
                                        |--------------------|
RDBF.data[actor_id].reg_init_region ->  | GPR AREA           |
                                        |--------------------|
RDBF.data[actor_id].reg_init_region ->  | SIMD AREA          |
                                        |--------------------|
                   zero initialized ->  | OVERFLOW PAD       |
                                        |--------------------|


     RCBF.tc_section[actor_id].code ->  | MAIN CODE AREA     |
                                        |--------------------|
     expanded macro code (executor) ->  | MACRO CODE AREA    |
```

## Fault Isolation

UNDER CONSTRUCTION


================================================
FILE: docs/structure.md
================================================
# Revizor Documentation

Everything you need to know about using, understanding, and contributing to Revizor.

## First Steps

Are you new to Revizor? Start here:

* [Revizor at a Glance](intro/01-overview.md): Understand what Revizor is, what problems it solves, and see a quick example of violation detection.
* [Installation Guide](intro/02-install.md): Get Revizor installed on your system and verify your setup.
* [Your First Fuzzing Campaign](intro/tutorials/01-first-fuzz.md): Follow a hands-on tutorial that walks you through running your first test, detecting a violation, and understanding the results.
* [Core Concepts](intro/03-primer.md): Learn about contracts, traces, speculation, and other fundamental concepts needed to use Revizor effectively.
* [Glossary](glossary.md): A quick reference for key terms used throughout the documentation.

---

## Getting Help

Stuck? Need clarification? Here's where to get help.

* [FAQ](faq/general.md) - What is Revizor? How does it work? What's a contract?
* [GitHub Discussions](https://github.com/microsoft/side-channel-fuzzer/discussions) - Ask questions, share experiences, discuss ideas
* [GitHub Issues](https://github.com/microsoft/side-channel-fuzzer/issues) - Report bugs or request features
* [Contributing Guide](https://github.com/microsoft/side-channel-fuzzer/blob/main/CONTRIBUTING.md) - Help improve Revizor
* [Zulip Chat](https://rvzr.zulipchat.com/) - Real-time community support

---

## How the Documentation is Organized

Revizor's documentation is organized into five distinct categories based on your needs:

### Learning-Oriented: Tutorials

Tutorials take you by the hand through a series of steps to complete a project. They are designed for newcomers who want to get started with Revizor. Start here if you're learning.

* [Main Tutorial Series](intro/04-tutorials.md): Follow a series of hands-on tutorials that walk you through running your first tests, detecting violations, and ramp up all the way to root-cause analysis and design of custom campaigns.
* [How TSA-SQ Was Detected](intro/tutorials/tsa-sq.md): A practical case study showing how Revizor was used to discover the TSA-SQ vulnerability. For those interested in how Revizor is used in the real world.

---

### Task-Oriented: How-To Guides

How-to guides are recipes that guide you through steps to solve specific problems. They assume you have basic knowledge and want to accomplish something particular.

* [How to Choose a Contract](howto/choose-contract.md) - Select appropriate reference model
* [How to Design a Fuzzing Campaign](howto/design-campaign.md) - Plan effective testing strategies
* [How to Interpret Results](howto/interpret-results.md) - Understand what the outputs mean
* [How to Minimize Violations](howto/minimize.md) - Reduce test cases to essentials
* [How to Root-Cause a Violation](howto/root-cause-a-violation.md) - Analyze and understand detected leaks
* [How to Use Macros](howto/use-macros.md) - Leverage macros for customizing test cases
* [How to Use Templates](howto/use-templates.md) - Create structured test cases with templates

---

### Understanding-Oriented: Topic Guides

Topic guides provide background and explanation to help you understand how Revizor works. They don't contain step-by-step instructions but explain key concepts in depth.

* [Leakage Contracts](topics/contracts.md) - Understanding security specifications
* [Actors and Isolation](topics/actors.md) - Multi-domain testing concepts
* [Leakage Models](topics/models.md) - How the model predicts CPU behavior
* [Test Case Generation](topics/test-case-generation.md) - Code and data generation explained
* [Trace Analysis](topics/trace-analysis.md) - How violations are detected

---

### Information-Oriented: Reference

Reference guides contain technical descriptions of Revizor's components. They're like a dictionary—useful when you know what you're looking for.

* [Command Line Interface](ref/cli.md) - Complete CLI reference
* [Configuration Options](ref/config.md) - All configuration parameters
* [Execution Modes](ref/modes.md) - Fuzz, reproduce, analyze, minimize
* [Macros Reference](ref/macros.md) - Template macro system
* [Minimization Passes](ref/minimization-passes.md) - Available minimization techniques
* [Runtime Statistics](ref/runtime-statistic.md) - Runtime metrics printed during execution
* [Binary Format](ref/binary-formats.md) - (advanced) Revizor's custom binary format
* [Allocated Registers](ref/registers.md) - (advanced) Register allocation details
* [Sandbox](ref/sandbox.md) - (advanced) Sandbox for executing test cases

---

### Contributor-Oriented: Development Guides

Development guides help contributors understand the codebase, architecture, and development practices.

* [Developer Index](internals/index.md)
* [Architecture Overview](internals/architecture/overview.md)
* [Code Style Guidelines](internals/contributing/code-style.md)
* [Git Conventions](internals/contributing/git.md)

---

## Research and Background

Revizor is built on peer-reviewed research in hardware security and formal methods. All papers related to Revizor are listed in the [Research Papers](ref/papers.md) section.

---

## Documentation Feedback

If you find errors, confusing explanations, or missing information in the documentation, please let us know:

* Open an issue with the "documentation" label
* Suggest improvements via pull request
* Discuss on GitHub Discussions


================================================
FILE: docs/stylesheets/extra.css
================================================
/* Custom styles for mkdocs-material */

/* Inline box for default values and highlighted inline content.
   Colors are taken from CSS custom properties instead of hard-coded values
   (presumably the mkdocs-material theme variables, so the box follows the
   active color scheme - TODO confirm). */
.inline-box {
    /* Background comes from the --md-code-bg-color variable */
    background-color: var(--md-code-bg-color);
    /* Thin outline using the --md-default-fg-color--lightest variable */
    border: 1px solid var(--md-default-fg-color--lightest);
    padding: 2px 6px;
    border-radius: 2px;
    /* Stay in the text flow while still rendering as a padded, bordered box */
    display: inline-block;
}


================================================
FILE: docs/topics/actors.md
================================================
# Actors

Actors represent distinct security domains within a test case. They can be thought of as sub-test-cases, each with its own code, data, execution context, and privilege level.

The main use case for actors is to test interactions and isolation boundaries between security domains. A typical example would be testing kernel-to-user isolation by defining a two-actor test case: one actor runs in kernel mode (the "main" actor), and the other runs in user mode (the "user" actor). The user actor attempts to observe information about the main actor's execution, simulating an attacker trying to leak sensitive kernel data.

By using this mechanism, Revizor can stress-test isolation boundaries by executing lots of randomly generated code on both sides of the boundary and checking for secret-dependent observations on the attacker side.
This mechanism discovered several critical vulnerabilities in production CPUs, most notably Transient Scheduler Attacks in AMD processors, and enables testing of mitigations for Meltdown, Foreshadow, and MDS.

## What is an Actor?

An actor consists of three components:

- Code region associated with a specific execution context
- Private data memory with configurable permissions and properties
- Execution context defined by CPU mode (host/guest), privilege level (kernel/user), and system configuration

Every test case starts with a default actor called `main` that runs in host kernel mode. This actor can transition to other actors using dedicated `switch_*` macros.

## Actor Configuration

Actors are defined in the configuration file under the `actors` section:

```yaml
actors:
  - main:                       # Default main actor
    - mode: "host"              # Always host for main;
                                # changing to "guest" will produce an error
    - privilege_level: "kernel" # Always kernel for main;
                                # changing to "user" will produce an error

  - user:                       # Example user-mode actor
    - mode: "host"
    - privilege_level: "user"
    - data_properties:          # Custom page table properties of the faulty page
      - writable: false         # Faulty page of the user actor is read-only
```


!!! note "Related Documentation"
    See the [configuration documentation](../ref/config.md#actor) for a full list of available options.

## Actor Templates

Multi-actor execution requires template-based mode. Templates define actors along with their code and data sections.

Transitions between actors use dedicated macros for setting entry and exit points, switching contexts, and defining landing locations. Macros are available for kernel-user transitions (`.set_k2u_target`, `.switch_k2u`, etc.) and host-guest transitions (`.set_h2g_target`, `.switch_h2g`, etc.).

!!! note "Related Documentation"
    See [Macro Reference](../ref/macros.md#transition-macros) for detailed descriptions of all transition macros.


## Actor Non-Interference Contract

Revizor uses the Actor Non-Interference contract to verify isolation between security domains. The contract designates one or more actors as observers (attackers) and verifies that observer execution does not depend on data from victim actors.

The contract permits leakage of victim memory access addresses and control flow, but prohibits leakage of data values. This design filters cache-based leakage typically considered benign in modern systems while detecting unexpected microarchitectural leaks. Victim actors follow the ct-seq contract, while observers can expose all their own data.

A violation occurs when observer traces depend on victim data beyond permitted address and control-flow information.

!!! note "Additional Reading"
    The Actor Non-Interference contract is explained in detail in the paper called [Enter, Exit, Page Fault, Leak: Testing Isolation Boundaries for Microarchitectural Leaks](https://www.microsoft.com/en-us/research/wp-content/uploads/2025/07/Enter-Exit-SP26.pdf).


## Example Usage

The following example demonstrates kernel-to-user isolation testing with the Actor Non-Interference contract.

Template with kernel and user actors:

```asm
.intel_syntax noprefix

# ---------------- Main (Kernel) Actor ---------
.section .data.main
.function_main_0:
    # Set up user transition
    .macro.set_k2u_target.user.function_user_0:
    .macro.set_u2k_target.main.function_main_1:

    # Generate random kernel code
    .macro.random_instructions.32.0:

    # Transition to user mode
    .macro.switch_k2u.user.0:

.function_main_1:
    .macro.landing_u2k.main_1:
    # Back in kernel, clean up and exit
    nop

.test_case_exit:

# ---------------- User Actor -----------------
.section .data.user
.function_user_0:
    .macro.landing_k2u.user_0:

    # Start measurement in user mode
    .macro.measurement_start:

    # Generate random user code
    .macro.random_instructions.16.1:

    # End measurement
    .macro.measurement_end:

    # Return to kernel
    .macro.switch_u2k.main.0:

```

Configuration file:

```yaml
actors:
  - main:
      mode: host
      privilege_level: kernel
  - user:
      mode: host
      privilege_level: user
      observer: true              # User is the attacker
      data_properties:
        writable: false           # Trigger page faults on writes

contract_observation_clause: load+store+pc
contract_execution_clause: noninterference
```

In this configuration, the user actor attempts to observe information from the kernel (main actor). The contract specifies that the user can observe memory addresses and control flow (load+store+pc) but not data values. Any leakage beyond this triggers a violation.


================================================
FILE: docs/topics/contracts.md
================================================
# Contracts

A speculation contract is a formal specification of known microarchitectural leakage in CPUs.
A contract serves to provide precise and unambiguous documentation of all known sources of
side-channel leaks on a given CPU (or a family of CPUs). For example, if a contract targets
a modern Intel or AMD CPU, it will typically include a specification of the leaks caused by
cache side channels and by various speculative vulnerabilities such as Spectre and Meltdown.

Contracts emerged as a solution to a fundamental problem: modern CPUs have complex
microarchitectural optimizations that create side channels, but these mechanisms are often
proprietary and poorly documented. Contracts provide a systematic way to reason about these leaks
without requiring complete knowledge of the underlying hardware.

In the context of Revizor, contracts serve as a reference model against which the actual CPU
behavior is compared; any deviation from the contract indicates a previously-unknown
microarchitectural behavior, which may represent a security vulnerability.

## Contract Structure

A speculation contract consists of two types of clauses that together describe the information a
program exposes during execution.

The *observation clause* specifies what data becomes observable for each instruction. For example, a
contract might declare that load and store instructions expose their target addresses. This models
the information an attacker could learn by monitoring a cache-based side channel such as
Prime+Probe. The observation clause captures side effects without specifying the attack mechanism.

The *execution clause* specifies how hardware optimizations affect program execution. For
speculative execution, the clause describes which instructions execute transiently even when they
should not execute architecturally. For instance, the clause might specify that conditional
branches temporarily take the wrong target. The execution clause models optimization behavior
without describing the implementation details.

Contracts intentionally overestimate leakage. Rather than precisely modeling what leaks occur,
contracts capture everything that could potentially leak given the specified hardware behaviors.
This conservative approach ensures that contracts remain valid even when the exact timing or
conditions of leaks are unknown.

## Example Contracts

The `CT-SEQ` contract models a CPU with caching but no speculation. It represents a baseline level
of leakage present in any cached architecture where memory operations leave observable traces but
instructions execute in program order.

Below is a pseudo-code representation of the `CT-SEQ` contract:

``` yaml
CT-SEQ:
  observation_clause:
    load(address)  -> expose(address)
    store(address) -> expose(address)
    * -> none  # all other instructions expose no information
  execution_clause:
    * -> none  # no optimizations; all instructions execute in program order
```

The `CT-COND` contract extends `CT-SEQ` by adding speculative execution of branches. The observation
clause remains the same, but the execution clause permits conditional jumps to mispredict their
targets and speculatively execute wrong-path instructions. This contract models Spectre-style
vulnerabilities where misprediction causes transient execution that leaves observable cache
footprints.

``` yaml
CT-COND:
  observation_clause:
    load(address)  -> expose(address)
    store(address) -> expose(address)
    * -> none
  execution_clause:
    jump.cond(target) ->  # emulate branch misprediction
        jump.inverted_cond(target)
    * -> none
```

More complex contracts can model other optimizations. A contract for exception handling might allow
faulting user-to-kernel loads to transiently return privileged values before the fault
is architecturally recognized, thus modelling Meltdown-style vulnerabilities:

``` yaml
CT-MELTDOWN:
  observation_clause:
    load(address)  -> expose(address)
    store(address) -> expose(address)
    * -> none
  execution_clause:
    jump.cond(target) ->
        jump.inverted_cond(target)
    load(address) ->  # transiently return kernel data thus emulating Meltdown
        if (in_user_mode() && is_kernel_address(address)) {
            return load_privileged(address)
        }
    * -> none
```

## Contract Traces

When a program executes according to a contract, it produces a contract trace. The trace is a
sequence of all observations specified by the observation clause during the execution path
determined by the execution clause. For `CT-SEQ`, the trace contains load and store addresses in
program order. For `CT-COND`, the trace includes addresses from speculatively executed instructions
on mispredicted paths.

Contract traces are deterministic and noise-free, unlike actual hardware measurements. This
property makes them suitable as a reference for comparison. A program executed repeatedly with the
same inputs always produces the same contract trace, even though real hardware traces may vary due
to timing effects and concurrent activity.

For example, consider the following program:

``` asm  linenums="1"
# addr1 = 0x100; addr2 = 0x200;
# *addr1 = 0;    *addr2 = 2
load rax, [addr1]  # expose(0x100)
cmp rax, 0         # 0 == 0, so the branch is architecturally taken
je label_zero      # speculatively mispredicted (not taken) under CT-COND
    load rbx, [addr2]  # expose(0x200) under CT-COND (but not under CT-SEQ)
label_zero:
```

When this program is executed under `CT-SEQ`, only one load occurs (line 3), producing the trace:

```
ctrace_seq = [ mem:0x100 ]
```

However, under `CT-COND`, the mispredicted branch causes the second load (line 6) to execute,
thus producing a trace with two observations:

```
ctrace_cond = [ mem:0x100, mem:0x200 ]
```


## Contract Compliance

A CPU complies with a contract when the information it leaks never exceeds what the contract
permits. More formally, compliance means that whenever two inputs produce identical contract
traces, they must also produce indistinguishable hardware traces given the same initial
microarchitectural state. This definition ensures that an attacker observing hardware cannot learn
more than the contract allows.

Compliance does not require that hardware traces match contract traces exactly. The contract might
expose complete addresses while hardware only leaks cache set indices. The contract might include
data from speculative paths that hardware does not actually execute. These differences are
acceptable as long as the information content of hardware traces does not exceed contract traces.

A violation occurs when two inputs produce identical contract traces but distinguishable hardware
traces. This indicates that hardware leaks information not captured by the contract, revealing an
unexpected microarchitectural behavior. The violating program serves as evidence of a potential
security vulnerability.


## Contract Evolution

Contracts are not static specifications. When Revizor discovers a violation, the user is free to
update the contract to reflect the newly observed behavior. This way a contract serves as a "filter"
that allows us to automatically distinguish between the leaks that we already know about (and thus
aren't interested in detecting) versus the leaks that are genuinely new and that we may want to
investigate further.

Moreover, the process may go both ways: if the hardware behavior is determined to be a bug,
and the vendor issues a patch, the contract may be updated to remove the previously-allowed leakage,
which in turn will allow Revizor to detect regressions if the patch is later undone or
incompletely applied.

This iterative process gradually refines contracts to match actual hardware behavior. Initial
contracts are based on public documentation and known vulnerabilities. Testing reveals gaps where
hardware leaks more than expected. After investigation, either the contract expands or the
hardware receives a patch. Over time, the contract converges toward a complete specification of
the CPU's microarchitectural leakage.

The contract framework also enables testing of proposed mitigations. Before deploying a patch,
vendors can verify its effectiveness by running Revizor with the updated configuration. If
violations persist, the mitigation is incomplete. This proactive approach helps prevent the
deployment of ineffective patches that provide false security.

## What's Next?

* See the [primer](../intro/03-primer.md) for a deeper dive into non-interference and contract-based testing.
* See the [model documentation](models.md) for details on how Revizor implements contracts.


================================================
FILE: docs/topics/models.md
================================================
# Leakage Models

A leakage model is an executable implementation of a speculation contract. The model takes a
program and inputs, executes them according to contract rules, and produces contract traces that
represent the information expected to leak. Models enable automated testing by providing a
reference against which real hardware behavior can be compared.

```mermaid
flowchart LR
    P[Program]
    I[Input 1 ... N]
    M[Model]
    CT[CTrace 1 ... N]

    P --> M
    I --> M
    M --> CT

    style M fill:#e1f5ff,stroke:#333,stroke-width:2px
    style P fill:#ffe1e1,stroke:#333,stroke-width:1px
    style I fill:#ffe1e1,stroke:#333,stroke-width:1px
    style CT fill:#e1ffe1,stroke:#333,stroke-width:1px
```

Models solve a practical problem in security testing. Contracts specify what should leak in
abstract terms, but to test hardware, we need concrete predictions for specific programs. The
model bridges this gap by simulating program execution under contract assumptions and recording
observable effects as they occur.


## Implementing Contracts

A model implements contracts through two specialized components: the Tracer and the Speculator.
These components monitor instruction execution through hook functions and modify behavior according
to contract rules.

```mermaid
flowchart LR
    A0[Start<br/>Program<br/>Execution] --> A
    A[Next<br/>Instruction] -->B{Select Hook}
    B -->|Instruction has<br/>observation clause?| D[Tracer]
    B -->|Instruction has<br/>execution clause?| E[Speculator]
    B -->|Model in<br/>speculative mode?| F[Speculator]
    D -->G[Record<br/>observations] --> Z
    E -->H1[Checkpoint]-->H[Emulate<br/>speculation] --> I[Enter<br/>speculative<br/>mode] --> Z
    F -->J{Termination<br/>condition<br/>met?}
    J -->|Yes| X[Rollback] --> Z
    J -->|No| Z
    Z[Execute<br/>Instruction] -->A

    style D fill:#e1ffe1,stroke:#333
    style G fill:#e1ffe1,stroke:#333
    style E fill:#ffe1e1,stroke:#333
    style F fill:#ffe1e1,stroke:#333
    style H1 fill:#ffe1e1,stroke:#333
    style H fill:#ffe1e1,stroke:#333
    style I fill:#ffe1e1,stroke:#333
    style X fill:#fff4e1,stroke:#333
    style Z fill:#e1f5ff,stroke:#333
```

The Tracer implements the observation clause. It monitors execution of each instruction and records
contract-relevant information. When an instruction with a non-trivial observation clause executes,
the model invokes the corresponding Tracer hook. For example, when a load instruction executes
under a contract that exposes memory addresses, the Tracer hook records the target address. The
Tracer accumulates these observations into a contract trace that represents all information exposed
during execution.

The Speculator implements the execution clause. It modifies the behavior of instructions with
non-trivial execution clauses to simulate microarchitectural optimizations. When such an
instruction executes, the model invokes the Speculator hook, which takes a checkpoint of the
program state and modifies the instruction's behavior. This puts the model into speculative mode.
For example, when a conditional branch executes under a contract that permits misprediction, the
Speculator checkpoints the state, flips the branch condition, and continues on the wrong path.

While in speculative mode, the model checks for termination conditions after each instruction. When
a condition is met, such as the speculation window expiring or encountering a serializing
instruction, the model exits speculative mode and rolls back to the most recent checkpoint. This
restores architectural state and resumes correct execution. Speculation can be nested, with one
speculative region triggering another before the first completes. The Speculator manages a stack of
checkpoints to handle nested speculation correctly.

The hook-based architecture allows models to implement contracts without modifying the core
execution engine. Whenever the model executes an instruction, it checks whether the instruction has
non-trivial observation or execution clauses. If observation clauses are present, Tracer hooks are
invoked. If execution clauses are present, Speculator hooks are invoked. The model also calls hooks
to check speculation termination conditions when in speculative mode. This separation of concerns
makes it straightforward to implement different contracts by providing different Tracer and
Speculator implementations.

## Model Backends

Revizor supports two model backends that implement contracts using different techniques. Both
provide the same interface and produce equivalent contract traces, but they differ in
implementation approach and performance characteristics.

The Unicorn backend uses CPU emulation to execute programs. Unicorn is a CPU emulator derived from
QEMU that supports multiple architectures. The model extends Unicorn with hooks that intercept
instruction execution and memory accesses. When an instruction executes, the hook checks whether
the contract requires recording an observation or triggering speculation. For speculation, the
model uses Unicorn's snapshot and restore capabilities to implement checkpoint-rollback.

The DynamoRIO backend uses dynamic binary instrumentation to execute programs. DynamoRIO inserts
instrumentation code directly into the program at runtime. Before each instruction, the model
injects a callback that checks contract rules. For speculation, the model manipulates register
state to simulate wrong-path execution and uses checkpoints to restore architectural state when
speculation ends. Because the program runs natively on the host CPU, execution is faster than
emulation.

The choice between backends involves trade-offs. The DynamoRIO backend is generally preferable as
it offers better performance and it inherently supports all instructions that can be executed on
the host CPU. However, this backend is more recent and may not support all contract features and
platforms as robustly as the Unicorn backend. Therefore, the Unicorn backend remains available for
use cases where the DynamoRIO backend is not yet suitable.

## Trace Representation

Contract traces are sequences of typed observations. Each observation records one piece of
information that leaked during execution. The trace preserves the order in which observations
occurred, capturing temporal aspects of information flow (although this could be overridden by
the Tracer if the contract prescribes so).

An observation has a type and a value. Types include memory addresses, branch targets, load/store
values, register contents, or any other observable information. The contract determines which types
appear in traces. CT-SEQ traces contain only memory addresses and branch targets. A contract
modeling MDS might include data values. The type system allows precise specification of what
information the contract permits.

## Accuracy and Limitations

Models approximate real hardware behavior, and this approximation introduces both capabilities and
limitations. Understanding these boundaries is important for interpreting test results.

Models implement contracts conservatively but not precisely. The contract specifies bounds on
leakage, and the model respects these bounds while making implementation choices. For branch
speculation, the contract might say branches can mispredict, but not specify when or how often. A
model that speculatively executes every branch overapproximates reality but remains consistent
with the contract. This conservatism means models may predict leakage that never occurs, but they
should not miss leakage that does occur.

Instruction support varies between backends and real hardware. Some instructions are complex or
poorly documented, making them difficult to emulate correctly. Unicorn covers most common
instructions but may have gaps or emulation bugs. When the model encounters unsupported
instructions, it typically halts with an error. This conservative behavior prevents incorrect
predictions but limits which test cases can be executed.

Models do not aim to capture all microarchitectural details. Real CPUs have dozens of optimizations
including out-of-order execution, store buffers, prefetchers, and speculative memory
disambiguation. Contracts and models abstract away most of these details and focus instead on
the information observable through side channels, rather than trying to describe the mechanisms
that produce the leakage. This abstraction simplifies model implementation and focuses testing on
the most relevant aspects.

## Performance Considerations

Model performance directly affects testing throughput. Revizor must execute thousands or millions
of test cases to achieve good coverage, and model execution dominates the time budget. Faster
models enable more comprehensive testing within a given time frame.

The highest impact on performance comes from the complexity of the execution clause in the contract.
Simple contracts with minimal speculation (e.g., `CT-SEQ`) execute quickly, while contracts with
extensive speculation incur significant overhead due to the increase in the number of executed
instructions.

Backend choice also impacts performance. DynamoRIO typically outperforms Unicorn, especially for
larger test cases or when executing with many inputs per test case (hundreds or more). However,
DynamoRIO has a higher startup overhead, making it less efficient for very small test cases or
when executing with few inputs per test case (fewer than about ten). The performance crossover
point depends on the specific fuzzing scenario.

## What's Next?

* See the [contracts documentation](contracts.md) for details on contract specifications.
* See the [internals documentation](../internals/architecture/model.md) for implementation details.
* See [Unicorn backend](../internals/model-backends/model-unicorn.md) and [DynamoRIO backend](../internals/model-backends/model-dr.md) for backend-specific information.


================================================
FILE: docs/topics/test-case-generation.md
================================================
# Test Case Generation

[Test case](../glossary.md#test-case-program) generation is the process of creating executable programs that probe CPU microarchitectural behavior. Revizor generates test cases either randomly or from user-defined templates, then instruments them to prevent unwanted faults, and finally compiles them into binaries suitable for execution. The test cases serve as inputs to both the leakage model and the hardware executor, enabling comparison of expected and observed microarchitectural behavior.

The generator must balance two competing requirements. First, it needs to produce diverse test cases that explore many different microarchitectural conditions and instruction sequences. This diversity is essential for thorough coverage of the CPU's behavior space. Second, when testing specific scenarios like domain transitions or mitigation effectiveness, it must generate programs with precise structures while still varying the surrounding context. This balance distinguishes Revizor's approach from simple random testing.

## Generation Modes

Revizor supports two distinct modes of test case generation, each suited to different testing scenarios.

Random generation creates test cases from scratch without any predefined structure. The generator builds a program by selecting instructions randomly from a configured pool, creating control flow by inserting conditional and unconditional branches, and allocating memory accesses to random addresses. This mode maximizes exploration of the instruction space and frequently discovers unexpected interactions between instructions. Random generation excels at finding vulnerabilities in single execution domains where no specific instruction sequence is required. However, it struggles with scenarios requiring precise setup, such as triggering specific page faults or transitioning between security domains.

Template-based generation starts from a user-written assembly file that defines the overall structure of the test case. The template specifies where random code should be inserted, which domain transitions to perform, and how [actors](../glossary.md#actor) should interact. The generator parses the template, expands special macros that mark randomization points, fills those points with random instructions, and instruments the result. Templates enable testing of specific scenarios while maintaining randomization where it matters. For example, a template can ensure that a kernel-to-user transition occurs at a specific point while randomizing the instructions executed in each domain.

The distinction matters because microarchitectural vulnerabilities often depend on precise conditions. Consider testing whether a CPU leaks kernel data to user space. Random generation might occasionally produce programs that transition to user mode, but the probability is low and the surrounding context may not trigger the vulnerability. A [template](../glossary.md#template) guarantees the transition occurs and controls the operations performed before and after it, dramatically increasing the likelihood of discovering leakage.

## Instrumentation Passes

Generated test cases, whether random or template-based, are not immediately ready for execution. They may contain instruction sequences that trigger unwanted faults, use undefined register values, or violate architectural constraints. Instrumentation passes transform test cases into safe, executable forms while preserving the properties being tested.

Instrumentation operates on the [structured representation of test cases](#test-case-structure). Each pass implements a specific transformation by walking the instruction hierarchy and modifying it according to its rules. Passes run in sequence, with each pass seeing the output of previous passes. This pipeline architecture allows complex transformations to be built from simple components.

One critical example of a pass is the sandboxing pass, which instruments memory accesses to ensure they target valid addresses within the test case's allocated memory. Accesses to unmapped addresses cause page faults. While some test cases intentionally trigger faults, most do not, and random generation can easily produce invalid addresses. The pass analyzes memory operands, identifies potentially invalid accesses, and masks the instruction operands to bound them within the sandbox.

Another example is a pass that prevents division by zero. Divisions by zero and division overflows trigger exceptions on x86-64, which may be undesirable in a fuzzing campaign that does not focus on this specific type of exception. Yet the random generator will commonly trigger them, especially the division overflows. This pass mitigates the issue by scanning the instruction stream for division instructions and instrumenting their operands to ensure they are non-zero and within safe ranges.

The passes are designed to introduce minimal microarchitectural side effects, to avoid interfering with the properties being tested. For example, the instrumentation code primarily uses arithmetic and logical operations that do not have any known speculative effects, and the instructions operate primarily on registers rather than memory. This careful design ensures that the instrumentation does not inadvertently create or mask vulnerabilities (or at least minimizes the chances of doing so).

## <a name="test-case-structure"></a> Test Case Structure

A test case is represented internally as a hierarchy of nested components. The following diagram illustrates this hierarchical structure:

```mermaid
graph TD
    TC[TestCaseProgram]
    TC --> CS1[CodeSection: main]
    TC --> CS2[CodeSection: user]

    CS1 --> F1[Function: .function_0]
    CS2 --> F2[Function: .function_user_0]

    F1 --> BB1[BasicBlock: entry]
    F1 --> BB2[BasicBlock: .label_1]
    F1 --> BB3[BasicBlock: exit]

    BB1 --> I1[Instruction: mov rax, rbx]
    BB1 --> I2[Instruction: add rax, 1]
    BB1 --> T1[Terminator: jmp .label_1]

    BB2 --> I3[Instruction: ...]
    BB2 --> T2[Terminator: ret]

    F2 --> BB4[BasicBlock: entry]
    BB4 --> I4[Instruction: ...]

    style TC fill:#e1f5ff
    style CS1 fill:#ffe1e1
    style CS2 fill:#ffe1e1
    style F1 fill:#fff4e1
    style F2 fill:#fff4e1
    style BB1 fill:#e1ffe1
    style BB2 fill:#e1ffe1
    style BB3 fill:#e1ffe1
    style BB4 fill:#e1ffe1
```

At the top level, a TestCaseProgram contains one or more CodeSections. Each CodeSection belongs to a single Actor and holds the code that executes in that actor's context. In single-actor fuzzing, only one section exists. In multi-actor testing, each actor gets its own section with its own code and data.

Within each CodeSection, code is organized into Functions. A Function consists of multiple BasicBlocks connected by control flow. The first block is the entry point, and execution proceeds through the blocks following branches and jumps. This structure mirrors conventional compiler intermediate representations, making it straightforward to apply standard analysis and transformation techniques.

Each BasicBlock contains a sequence of Instructions terminated by zero or more control flow instructions. Regular instructions execute sequentially, while terminators (branches, jumps, returns) determine which block executes next. Instructions themselves are high-level representations that capture the operation, operands, and dependencies. They are not raw bytes but structured objects that can be analyzed and modified by instrumentation passes.

This hierarchical design serves several purposes. It allows instrumentation passes to operate at different levels of granularity, from modifying individual instructions to restructuring entire functions. It makes the structure explicit, eliminating the need to repeatedly parse assembly text. It enables efficient copying and modification when expanding templates. Most importantly, it provides a common representation used throughout the fuzzing pipeline, from generation through model execution to hardware measurement.


## Macro Placeholders

[Macro placeholders](../glossary.md#macro) are the key mechanism for combining fixed structure with randomization. They appear in templates as special labels that get expanded during test case generation. A macro looks like an assembly label but carries semantic meaning. For example, `.macro.random_instructions.64:` tells the generator to insert 64 randomly chosen instructions at that point.

```mermaid
graph LR
    subgraph "Template (Before Expansion)"
        T1[".section .main<br/>.function_0:"]
        T2[".macro.random_instructions.3:"]
        T3["mov rax, [rbx]"]
    end

    subgraph "Expanded Test Case"
        E1[".section .main<br/>.function_0:"]
        E2["add rax, rbx"]
        E3["mov [rdi], rcx"]
        E4["cmp rax, 0"]
        E5["mov rax, [rbx]"]
    end

    T1 --> E1
    T2 -.expands to.-> E2
    T2 -.expands to.-> E3
    T2 -.expands to.-> E4
    T3 --> E5

    style T2 fill:#ffe1e1
    style E2 fill:#e1ffe1
    style E3 fill:#e1ffe1
    style E4 fill:#e1ffe1
```

The critical insight is that macros defer decisions. A template author specifies where randomization should occur without specifying the exact instructions. This preserves the ability to test many different instruction sequences while maintaining the overall structure.

Macros also enable progressive refinement of test cases. An initial template might use a single random macro to generate a large instruction sequence. If that discovers a [violation](../glossary.md#violation), the user can refine the template to add more structure around the violation, narrowing the search space. The macro system makes this iteration efficient because templates remain concise and readable.

!!! note "Related Documentation"
    For a complete list of available macros and their specifications, refer to the [Macro Reference](../ref/macros.md).

    For a how-to guide on using macros, see [How-To: Use Macros](../howto/use-macros.md).

## Template Structure and Expansion

```mermaid
flowchart LR
    T[Template File] --> P[Parse Template]
    C[Config File] --> P
    P --> R[Fill Random<br/>Instructions]
    R --> IP[Instrumentation<br/>Passes]
    IP --> PR[Print to<br/>Assembly]
    PR --> AS[Assemble]
    AS --> B[Binary<br/>Test Case]

    style T fill:#e1f5ff
    style C fill:#e1f5ff
    style R fill:#ffe1e1
    style IP fill:#fff4e1
    style B fill:#e1ffe1
```

Templates use standard assembly syntax with macro extensions. This design choice means templates are valid assembly files that can be processed by conventional tools. Comments, labels, directives, and instructions follow normal assembly conventions. Only the macro pseudo-instructions are specific to Revizor.

Template expansion proceeds in several phases. First, the generator parses the template using a standard assembly parser extended to recognize macros. Parsing produces the hierarchical test case structure described earlier, with macros represented as special instruction types. Next, the generator walks the structure and expands the `random_instructions` macro placeholders into random instruction sequences. Finally, instrumentation passes run, the test case is printed back to assembly, and the assembler produces an object file.


!!! note "Related Documentation"
    For detailed instructions on writing and using templates, refer to [How-To: Use Templates](../howto/use-templates.md).

## Generation Performance

Generation performance affects overall fuzzing throughput, although it usually has a low impact on the overall process compared to the executor and the model. Generation may dominate the execution time only in the rare case where the other components are extremely fast, such as when testing very small test cases with a small (<10) number of inputs.

Both random and template-based generation modes have similar performance as the template is re-used across all generation requests after the first expansion.


## What's Next?

- [Configuration Reference](../ref/config.md): Generator configuration options
- [Actors](actors.md): Security domains represented in test cases
- [Binary Formats](../ref/binary-formats.md): File formats for test case binaries
- [How-To: Use Macros](../howto/use-macros.md): Guide on using macros in templates
- [How-To: Use Templates](../howto/use-templates.md): Guide on writing and using templates
- [Code Generation](../internals/architecture/code.md): Implementation details of code generation and instrumentation


================================================
FILE: docs/topics/trace-analysis.md
================================================
# Trace Analysis

This document describes Revizor's trace analysis techniques for detecting microarchitectural
contract violations by comparing contract traces with hardware traces.

Trace analysis is the core mechanism of Model-Based Relational Testing. It compares
[contract traces](../glossary.md#contract-trace) (predicted leakage from the model) with
[hardware traces](../glossary.md#hardware-trace) (observed leakage from real CPU) to detect
microarchitectural [contract violations](../glossary.md#violation).

## Contract Compliance Property

The fundamental property being tested is [contract compliance](../glossary.md#contract-compliance):
if two inputs produce the same contract trace, they must produce the same hardware trace for all
microarchitectural states.

Formally, a CPU complies with a speculation contract if, for all possible programs P, all input pairs (I₁, I₂), and all initial microarchitectural states Ctx:

```
ContractTrace(P, I₁) = ContractTrace(P, I₂)
  ⟹
HardwareTrace(P, I₁, Ctx) = HardwareTrace(P, I₂, Ctx)
```

If this property is violated, the CPU is leaking information beyond what the contract predicts.
A violation indicates that the contract is incomplete or that the CPU has an unexpected side
channel. See the [primer](../intro/03-primer.md#building-and-testing-speculation-contracts) for
theoretical foundations.

Revizor approximates this property by randomly sampling the space of programs, inputs, and microarchitectural states, and checking for violations based on collected traces.
The following sections describe how this check is implemented in practice.

## Problem Statement

The trace analysis task boils down to the following problem:

=== "Given"

:   - A test program P
    - A sequence of inputs I₁ … Iₙ
    - A sequence of contract traces CTrace₁ … CTraceₙ (one per input, produced by the model)
    - A sequence of hardware traces HTrace₁ … HTraceₙ (one per input, produced by the executor)

<div></div> <!-- empty line for spacing -->

=== "Objective"

:    Detect if there exist any input pairs (Iᵢ, Iⱼ) such that
    ```
    CTraceᵢ = CTraceⱼ but HTraceᵢ ≠ HTraceⱼ
    ```

## Deterministic Trace Comparison

To detect contract violations, we need to check the above property for all tested inputs.
Checking each input pair separately would be extremely inefficient (O(N²) complexity). Instead,
we use an equivalence-class-based algorithm that groups inputs by their contract traces and
checks hardware trace consistency within each group:

1. **Bundle measurements**: Create tuples `(Input ID, Input, CTrace, HTrace)` for each execution
2. **Group by contract trace**: Partition measurements into contract equivalence classes where
   all measurements share the same `CTrace`
3. **Check hardware traces**: Within each contract equivalence class, verify all hardware traces
   are identical
4. **Report violations**: If a contract equivalence class contains different hardware traces,
   report a violation

```mermaid
flowchart LR
    B[Bundle measurements]
    B --> C[Group by CTrace<br/>]
    C --> D{For each EqClass}
    D --> E[Compare hardware traces]
    E --> F{All identical?}
    F -->|Yes| G[Mark class OK]
    F -->|No| H[Record violation]
    G --> I{More classes?}
    H --> I
    I -->|Yes| D
    I -->|No| J[End]

    classDef good fill:#c3f3d9,stroke:#2b7b4b,color:#000;
    classDef bad fill:#f9d5d5,stroke:#b61b1b,color:#000;
    class G good
    class H bad

```

=== "Example"

    Suppose we test 4 inputs and get:

    ```
    I0: CTrace=A, HTrace=X
    I1: CTrace=A, HTrace=X
    I2: CTrace=B, HTrace=Y
    I3: CTrace=A, HTrace=Z
    ```

    Contract equivalence classes:

    ```
    - Class [CTrace=A]: I0, I1, I3
    - Class [CTrace=B]: I2
    ```

    Analysis:

    - Class `[CTrace=A]` contains three measurements with HTraces `{X, X, Z}`
    - Since X ≠ Z, this is a **violation**
    - Inputs `I0` and `I1` behaved identically (`HTrace=X`) but input `I3` behaved differently (`HTrace=Z`),
    despite having the same contract trace=A
    - Accordingly, we found a violation: `I0` and `I3` have the same contract trace (`A = A`) while
    the hardware traces differ (`X ≠ Z`)

## Statistical Trace Comparison

### The Problem of Noise

Real hardware measurements are noisy. Even if we execute the same program with the same input
repeatedly, we might get different hardware traces each time, due to factors like timing variations
 in microcode execution, cache state changes from uncontrollable sources, non-controlled
 hardware optimizations, etc.

These discrepancies may cause false positives if we directly use the deterministic algorithm,
because the differences between the hardware traces may be caused by noise, not by genuine
information leakage.

=== "Example"
    Suppose we test only two of the inputs from the previous example, but the second
    measurement produces a slightly different hardware trace due to noise:

    ```
    I0: CTrace=A, HTrace=X
    I1: CTrace=A, HTrace=X'
    ```

    The resulting analysis will produce a false violation:

    - Contract equivalence class `[CTrace=A]: I0, I1`
    - Hardware traces: `{X, X'}`
    - Since `X ≠ X'`, we incorrectly report a violation, even though both inputs are actually safe
    and the difference is just noise.

### Solution: Sampling and Statistical Analysis

To address this, we treat hardware traces as samples from a distribution rather than single
deterministic values. Instead of comparing individual hardware traces, we compare the distributions
of hardware traces produced by each input. This replaces the deterministic equality check
`HardwareTrace(P, I₁, Ctx) = HardwareTrace(P, I₂, Ctx)` with a statistical test that
determines if two samples are drawn from the same distribution.

To implement this, we modify the measurement process: instead of collecting one hardware trace
per input, Revizor collects **multiple samples** per input. Each `HTrace` object contains an
array of measurement samples. For example, with sample size N=10:

```
I0: CTrace=A, HTrace=[X, X, X', X, X, X', X, X, X, X]
I1: CTrace=A, HTrace=[X, X', X, X, X, X, X', X, X, X]
```

Now we must compare **distributions** rather than individual values, and the question becomes: "Are these two samples drawn from the same distribution?"

### Chi-Squared Test for Categorical Data

Hardware traces are categorical data (no natural ordering), so Revizor uses Pearson's χ²
homogeneity test.

Given two samples `t₁` and `t₂` of hardware traces, the test computes:

```
χ² = Σ (obs₁(t) - expected(t))² / expected(t)
   + Σ (obs₂(t) - expected(t))² / expected(t)
```

where:

- `obs₁(t)` = count of trace `t` in sample 1
- `obs₂(t)` = count of trace `t` in sample 2
- `expected(t) = (obs₁(t) + obs₂(t)) / 2` = average count

The χ² statistic is normalized by total sample size to make it comparable across different
sample sizes.

**Decision rule**: If `χ²/N < threshold`, accept that the samples come from the same
distribution (no violation).

The threshold is configurable (default 0.05) and can be tuned based on expected noise levels via [`analyser_stat_threshold`](../ref/config.md#analyser_stat_threshold) config parameter.

The following examples illustrate how the χ² test distinguishes between noise and real violations.

=== "No violation"

    ```
    I0: CTrace=A, HTrace=[X(8 times), X'(2 times)]
    I1: CTrace=A, HTrace=[X(7 times), X'(3 times)]
    ```

    The distributions are similar (mostly X with some noise X'). χ² test will show they're
    equivalent:

    ```
    obs₁(X) = 8, obs₁(X') = 2
    obs₂(X) = 7, obs₂(X') = 3
    expected(X) = (8 + 7) / 2 = 7.5
    expected(X') = (2 + 3) / 2 = 2.5
    χ² = (8 - 7.5)²/7.5 + (2 - 2.5)²/2.5 + (7 - 7.5)²/7.5 + (3 - 2.5)²/2.5
       = 0.2666
    χ²/N = 0.2666/20 = 0.01333    (N = 10 + 10 = 20 samples in total)
    χ²/N < 0.05 → accept equivalence (no violation)
    ```


=== "Real violation"

    ```
    I0: CTrace=A, HTrace=[X(5 times), X'(1 time), Y(4 times)]
    I1: CTrace=A, HTrace=[X(5 times), X'(1 time), Z(4 times)]
    ```

    The distributions are clearly different (Y vs Z). χ² test will reject equivalence → violation:
    ```
    obs₁(X) = 5, obs₁(X') = 1, obs₁(Y) = 4
    obs₂(X) = 5, obs₂(X') = 1, obs₂(Z) = 4
    expected(X) = (5 + 5) / 2 = 5
    expected(X') = (1 + 1) / 2 = 1
    expected(Y) = (4 + 0) / 2 = 2
    expected(Z) = (0 + 4) / 2 = 2
    χ² = (5 - 5)²/5 + (1 - 1)²/1 + (4 - 2)²/2 + (0 - 2)²/2
       + (5 - 5)²/5 + (1 - 1)²/1 + (0 - 2)²/2 + (4 - 2)²/2
       = 8
    χ²/N = 8/20 = 0.4    (N = 10 + 10 = 20 samples in total)
    χ²/N > 0.05 → reject equivalence (violation)
    ```

### Adaptive Sample Sizing

For performance reasons, Revizor does not immediately use a large sample size. Instead, it
starts with a small sample, collects the traces, and checks if a violation is detected. If no
violation is detected, the executor assumes that the test case is safe, and moves on to the next
one. If a violation is detected, however, the executor tries to reproduce it with larger sample
sizes.

Example adaptive strategy:

``` python
for N in [15, 40, 160, 320]:
    collect N samples per input
    if violation detected:
        continue
    else:
        return "no violation"
return "violation detected"
```

The exact sample sizes and thresholds are configurable via [`executor_sample_sizes`](../ref/config.md#executor_sample_sizes) config parameter.

## What's Next?

- [Configuration Options](../ref/config.md) - Configure analyzer parameters
- [Model-Based Relational Testing](../intro/03-primer.md) - Theoretical foundations
- [Analyser Architecture](../internals/architecture/analysis.md) - Implementation
  details


================================================
FILE: mkdocs.yml
================================================
---
site_name: Revizor
site_url: https://github.com/microsoft/side-channel-fuzzer
site_author: Microsoft
site_description: A security-oriented tool for testing CPUs and detecting microarchitectural leaks like Spectre and Meltdown
copyright: 'Copyright &copy; 2025 Microsoft'

repo_name: microsoft/side-channel-fuzzer
repo_url: https://github.com/microsoft/side-channel-fuzzer

docs_dir: docs

theme:
  name: material
  palette:
    - media: "(prefers-color-scheme: light)"
      scheme: default
      primary: indigo
      accent: indigo
      toggle:
        icon: material/brightness-7
        name: Switch to dark mode
    - media: "(prefers-color-scheme: dark)"
      scheme: slate
      primary: indigo
      accent: indigo
      toggle:
        icon: material/brightness-4
        name: Switch to light mode
  font:
    text: Roboto
    code: Roboto Mono
  features:
    - navigation.instant
    - navigation.tracking
    - navigation.indexes
    - navigation.tabs
    - toc.integrate
    - search.suggest
    - search.highlight
  logo: assets/icon.svg
  favicon: assets/favicon.svg

extra_css:
  - stylesheets/extra.css

plugins:
  - search

markdown_extensions:
  - toc:
      toc_depth: 2

  # diagrams
  - pymdownx.superfences:
      custom_fences:
        - name: mermaid
          class: mermaid
          format: !!python/name:pymdownx.superfences.fence_code_format

  # Better typography and formatting
  - abbr
  - admonition
  - attr_list
  - md_in_html
  - def_list
  - footnotes
  - meta
  - tables
  - pymdownx.caret
  - pymdownx.keys
  - pymdownx.mark
  - pymdownx.details

  # Code highlighting (must be before tabbed)
  - pymdownx.highlight:
      anchor_linenums: true

  - pymdownx.snippets

  # Tabbed content blocks
  - pymdownx.tabbed:
      alternate_style: true
      combine_header_slug: true

  # Other extensions
  - pymdownx.pathconverter
  - pymdownx.tasklist:
      custom_checkbox: true

  # Enhanced formatting
  - pymdownx.betterem:
      smart_enable: all
  - pymdownx.tilde
  - pymdownx.smartsymbols

  - pymdownx.emoji:
      emoji_index: !!python/name:material.extensions.emoji.twemoji
      emoji_generator: !!python/name:material.extensions.emoji.to_svg


nav:
  - Start Here: intro/start-here.md
  - Documentation:
    - Documentation Structure: structure.md
    - Getting Started:
      - Revizor at a Glance: intro/01-overview.md
      - Installation: intro/02-install.md
      - Deep Dive into Concepts: intro/03-primer.md
      - Overview of Tutorials: intro/04-tutorials.md
      - Tutorial 1 - First Campaign: intro/tutorials/01-first-fuzz.md
      - Tutorial 2 - First Vulnerability: intro/tutorials/02-first-vuln.md
      - Tutorial 3 - Testing Faults: intro/tutorials/03-faults.md
      - Tutorial 4 - Testing Isolation: intro/tutorials/04-isolation.md
      - Tutorial 5 - Extending Revizor: intro/tutorials/05-extending.md
      - Extra Tutorial - Detecting TSA-SQ: intro/tutorials/tsa-sq.md
    - How-To Guides:
      - Ask a Question: howto/ask-a-question.md
      - Choose a Contract: howto/choose-contract.md
      - Design a Campaign: howto/design-campaign.md
      - Interpret Output: howto/interpret-results.md
      - Minimize Violations: howto/minimize.md
      - Root-Cause a Violation: howto/root-cause-a-violation.md
      - Use Templates: howto/use-templates.md
      - Use Macros: howto/use-macros.md
    - Topics:
      - Contracts: topics/contracts.md
      - Leakage Models: topics/models.md
      - Trace Analysis: topics/trace-analysis.md
      - Test Case Generation: topics/test-case-generation.md
      - Actors: topics/actors.md
    - Reference:
      - Modes of Operation: ref/modes.md
      - Command Line Interface: ref/cli.md
      - Configuration Options: ref/config.md
      - Runtime Statistics: ref/runtime-statistic.md
      - Minimization Passes: ref/minimization-passes.md
      - Macros: ref/macros.md
      - Artifact File Formats: ref/artifact-file-formats.md
      - Internal Binary Formats: ref/binary-formats.md
      - Registers: ref/registers.md
      - Sandbox: ref/sandbox.md
    - Glossary: glossary.md
    - Academic Research: ref/papers.md
  - FAQ:
    - General Questions: faq/general.md
  - Contribute:
    - Index: internals/index.md
    - Guide to Contributing: internals/contributing/overview.md
    - Guidelines:
      - General Guidelines: internals/contributing/general.md
      - Code Style: internals/contributing/code-style.md
      - Git Workflow: internals/contributing/git.md
    - Code Structure: internals/code-structure.md
    - Architecture:
      - Overview: internals/architecture/overview.md
      - Orchestration: internals/architecture/fuzz.md
      - ISA Specification: internals/architecture/isa.md
      - Test Case Code Generation: internals/architecture/code.md
      - Test Case Data Generation: internals/architecture/data.md
      - Hardware Tracing: internals/architecture/exec.md
      - Contract Tracing: internals/architecture/model.md
      - Trace Analysis: internals/architecture/analysis.md
      - Minimization: internals/architecture/mini.md
      - Logging: internals/architecture/logging.md
    - Model Backends:
      - Unicorn Backend: internals/model-backends/model-unicorn.md
      - DynamoRIO Backend: internals/model-backends/model-dr.md


================================================
FILE: pyproject.toml
================================================
[build-system]
requires = ["hatchling"]
build-backend = "hatchling.build"

[project]
name = "revizor-fuzzer"
version = "2.0.0"
description = "A fuzzer to search for microarchitectural leaks in CPUs"
readme = "README.md"
requires-python = ">=3.9"
classifiers = [
    "Programming Language :: Python :: 3",
    "Programming Language :: Python :: 3 :: Only",
    "License :: OSI Approved :: MIT License",
    "Operating System :: POSIX :: Linux",
    "Typing :: Typed",
]
dependencies = [
    "unicorn==1.0.3; platform_machine == 'x86_64'",
    "unicorn; platform_machine == 'aarch64'",
    "pyyaml",
    "types-pyyaml",
    "numpy",
    "pyelftools",
    "xxhash",
    "scipy",
    "mypy",
    "pylint",
    "flake8",
    "setuptools<80",  # To avoid deprecation warnings cased by Unicorn
    "cffi",
    "types-cffi",
]
maintainers = [{name = "Oleksii Oleksenko", email = ""}]

[project.urls]
"Homepage" = "https://microsoft.github.io/side-channel-fuzzer/"
"Source code" = "https://github.com/microsoft/side-channel-fuzzer"
"Bug Tracker" = "https://github.com/microsoft/side-channel-fuzzer/issues"
"Changelog" = "https://github.com/microsoft/side-channel-fuzzer/releases"

[tool.hatch.build]
exclude = [
  "demo/",
  "docs/",
  "mkdocs-overrides/",
  "rvzr/executor_km/",
  "tests/",
  "tests/x86_tests/",
  "tests/x86_tests/",
  "base.json",
  "site/",
  "dbg/",
  "revizor.code-workspace",
]

[tool.hatch.build.targets.wheel]
packages = ["rvzr"]

[project.scripts]
rvzr = "rvzr.cli:main"


================================================
FILE: revizor.py
================================================
#!/usr/bin/env python3
"""
File: Command Line Interface to Revizor

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""

from rvzr.cli import main

if __name__ == '__main__':
    # Terminate with the status code returned by the CLI entry point.
    # NOTE: the `exit()` builtin is injected by the `site` module for interactive sessions
    # and is not guaranteed to exist (e.g., under `python -S` or in frozen builds), so we
    # raise SystemExit directly; this is exactly what `sys.exit()` does under the hood.
    raise SystemExit(main())


================================================
FILE: rvzr/__init__.py
================================================
# flake8: noqa
# pylint: skip-file

from .isa_spec import *
from .executor import *
from .analyser import *
from .data_generator import *
from .code_generator import *
from .cli import *
from .logs import *

from .model import *
from .fuzzer import *
from .factory import *
from .config import *

from .asm_parser import *

from .arch.x86 import *
from .model_unicorn import *
from .postprocessing import *

__version__ = "2.0.0"


================================================
FILE: rvzr/analyser.py
================================================
"""
File: various ways to compare collected ctraces with htraces

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from __future__ import annotations
from collections import Counter
from typing import List, Dict, TYPE_CHECKING, Union, Final
from abc import ABC, abstractmethod
from scipy import stats  # type: ignore

import numpy.typing as npt
import numpy as np

from .traces import HTrace, CTrace, TraceBundle, Violation, ContractEqClass, HardwareEqClass
from .config import CONF, ConfigException
from .stats import FuzzingStats
from .logs import warning, error

if TYPE_CHECKING:
    from .tc_components.test_case_data import InputData
    from .tc_components.test_case_code import TestCaseProgram

IntArrayLike = Union[List[int], npt.NDArray[np.uint64]]

STAT = FuzzingStats()


# ==================================================================================================
# Abstract Analyser Interface
# ==================================================================================================
class Analyser(ABC):
    """ Common interface that every trace analyser has to implement """

    @abstractmethod
    def filter_violations(self,
                          ctraces: List[CTrace],
                          htraces: List[HTrace],
                          test_case_code: TestCaseProgram,
                          inputs: List[InputData],
                          stats_: bool = False) -> List[Violation]:
        """
        Check the given contract traces against the given hardware traces and collect
        the contract violations that they expose.

        :param ctraces: contract traces to be checked
        :param htraces: hardware traces to be checked
        :param test_case_code: program that was executed to collect the traces
        :param inputs: inputs that were used to collect the traces (one per trace)
        :param stats_: if True, the global fuzzing statistics are updated with the results
        :return: list of the detected violations; empty if none were found
        """

    @abstractmethod
    def htraces_are_equivalent(self, htrace1: HTrace, htrace2: HTrace) -> bool:
        """
        Decide whether two hardware traces are equivalent under the rules of this analyser.

        :param htrace1: first hardware trace to compare
        :param htrace2: second hardware trace to compare
        :return: True when the traces are considered equivalent, False otherwise
        """


# ==================================================================================================
# Equivalence class-based Analysers
# ==================================================================================================
class EquivalenceAnalyserCommon(Analyser):
    """
    Abstract base for the analysers that detect contract violations by means of
    equivalence classes.

    The algorithm checks whether any of the traces match the definition of a contract
    violation, which is:
       Given two pairs of traces (ctrace1, htrace1) and (ctrace2, htrace2),
       where ctrace1 and htrace1 are the contract and hardware traces of input1
       (and likewise for input2),
       the traces violate the contract if
            ctrace1 == ctrace2 and
            htrace1 NOT EQUIVALENT htrace2

    The meaning of EQUIVALENT is supplied by the concrete analyser through
    its implementation of htraces_are_equivalent (see subclasses).
    """

    def filter_violations(self,
                          ctraces: List[CTrace],
                          htraces: List[HTrace],
                          test_case_code: TestCaseProgram,
                          inputs: List[InputData],
                          stats_: bool = False) -> List[Violation]:
        # --------
        # NOTE: This is the violation check shared by all equivalence class-based analysers.
        # Subclasses customize it only through the htraces_are_equivalent method.
        #
        # Steps:
        #   1. bundle every usable measurement (input ID, input, ctrace, htrace);
        #      measurements with empty or corrupted/ignored htraces are dropped
        #      to avoid false positives
        #   2. group the bundles by their contract trace
        #   3. split every group into hardware equivalence classes
        #   4. report a violation for every group with two or more hardware classes
        # --------

        # Nothing to analyse
        if not htraces:
            return []

        # Step 1: bundle the measurements, skipping the unusable htraces
        bundles = [
            TraceBundle(idx, inputs[idx], ctraces[idx], htrace)
            for idx, htrace in enumerate(htraces)
            if not (htrace.is_empty() or htrace.is_corrupted_or_ignored())
        ]
        if not bundles:
            return []

        # Step 2: contract equivalence classes; a class with a single measurement has nothing
        # to be compared against, hence only classes with 2+ measurements are kept.
        # The remaining classes are ordered by ctrace
        contract_classes = ContractEqClass.build_contract_classes(bundles)
        candidates = sorted(
            (group for group in contract_classes if len(group.measurements) >= 2),
            key=lambda group: group.ctrace)

        # Step 3: hardware equivalence classes within each contract class
        for group in candidates:
            group.set_hw_classes(
                HardwareEqClass.build_hw_classes(
                    group.measurements, equivalence_function=self.htraces_are_equivalent))

        # Step 4: a contract class that splits into several hardware classes
        # is a contract counterexample
        violations: List[Violation] = [
            Violation.from_contract_eq_class(group, inputs, test_case_code)
            for group in candidates
            if len(group.get_hw_classes()) >= 2
        ]

        # Bookkeeping for the global statistics
        if stats_:
            STAT.eff_classes += len(candidates)
            STAT.single_entry_classes += len(contract_classes) - len(candidates)
            STAT.analysed_test_cases += 1

        return violations


class MergedBitmapAnalyser(EquivalenceAnalyserCommon):
    """ Analyser that compares htraces in the form of merged bitmaps: all samples of
    an htrace are OR-ed together into a single bitmap, and the two bitmaps are compared.

    Samples that occur fewer times than CONF.analyser_outliers_threshold * sample size
    are treated as outliers and are left out of the bitmap.
    """

    _bitmap_cache: Final[Dict[int, int]]  # hash of an htrace -> its merged bitmap
    _MASK: Final[int]  # mask with the lower 64 bits set

    def __init__(self) -> None:
        super().__init__()
        self._bitmap_cache = {}
        self._MASK = (1 << 64) - 1

    def htraces_are_equivalent(self, htrace1: HTrace, htrace2: HTrace) -> bool:
        sample_size = htrace1.sample_size()
        assert sample_size == htrace2.sample_size(), "htraces have different sizes"
        min_count = CONF.analyser_outliers_threshold * sample_size

        merged: List[int] = []
        for trace in (htrace1, htrace2):
            key = hash(trace)
            samples = trace.get_raw_traces()

            # build the bitmap only if it was not built (and cached) before
            if key not in self._bitmap_cache:
                occurrences = Counter(samples)
                bitmap = 0
                for sample in samples:
                    # rare samples are outliers and do not contribute to the bitmap
                    if occurrences[sample] >= min_count:
                        bitmap |= int(sample)
                self._bitmap_cache[key] = bitmap

            merged.append(self._bitmap_cache[key])

        first, second = merged

        # strict mode: the bitmaps must match exactly
        if CONF.analyser_subsets_is_violation:
            return first == second

        # relaxed mode: the traces are equivalent if one bitmap is a subset of the other,
        # i.e., if one of them has no bits that are missing from the other
        only_in_first = first & (~second & self._MASK)
        only_in_second = second & (~first & self._MASK)
        return bool((only_in_first == 0) or (only_in_second == 0))


class SetAnalyser(EquivalenceAnalyserCommon):
    """ A variant of the analyser that compares the htraces as sets. I.e., it squashes
    the htrace lists into sets and compares the results.

    It also applies filtering of outliers according to CONF.analyser_outliers_threshold:
    a trace value is kept only if it occurs at least
    CONF.analyser_outliers_threshold * sample_size times in the htrace.
    """

    def htraces_are_equivalent(self, htrace1: HTrace, htrace2: HTrace) -> bool:
        """ Squash the htrace lists into sets and compare the results.

        :param htrace1: first hardware trace
        :param htrace2: second hardware trace
        :return: True if the outlier-free sets of trace values are equal
                 (when CONF.analyser_subsets_is_violation is set), or if one of the sets
                 is a subset of the other (otherwise); False in all other cases
        """
        sample_size = htrace1.sample_size()
        assert sample_size == htrace2.sample_size(), "htraces have different sizes"
        threshold = CONF.analyser_outliers_threshold * sample_size

        # Remove outliers. The filter must be applied to the number of occurrences of
        # a trace value, not to the value itself (same rule as in MergedBitmapAnalyser)
        trace_sets = []
        for htrace in (htrace1, htrace2):
            counter = Counter(htrace.get_raw_traces())
            trace_sets.append({trace for trace, count in counter.items() if count >= threshold})
        trace_set1, trace_set2 = trace_sets

        if CONF.analyser_subsets_is_violation:
            return trace_set1 == trace_set2

        return trace_set1.issubset(trace_set2) or trace_set2.issubset(trace_set1)


class MWUAnalyser(EquivalenceAnalyserCommon):
    """
    A variant of the analyser that uses the Mann-Whitney U test to compare htraces.

    WARNING: this is an experimental analyser and it may not work well for all cases.
    """

    def __init__(self) -> None:
        """
        Print a warning about the experimental status of the analyser and validate
        the configured threshold against the first configured sample size.

        :raises ConfigException: if CONF.analyser_stat_threshold is so low that even two
                completely separated samples would be considered equivalent
        """
        super().__init__()
        warning("analyser",
                "MWUAnalyser is an experimental analyser and may not work well for all cases. ")

        # Sanity check: compare two completely separated samples of the initial sample size.
        # htraces_are_equivalent treats the traces as equivalent when p_value > threshold,
        # hence if the threshold is below the p-value of these samples, the analyser would
        # not be able to tell them apart, i.e., the threshold is too low for this sample size
        a = [1] * CONF.executor_sample_sizes[0]
        b = [2] * CONF.executor_sample_sizes[0]
        _, p_value = stats.mannwhitneyu(a, b)
        if CONF.analyser_stat_threshold < p_value:
            raise ConfigException("analyser_stat_threshold is too low for the given sample size")

    def htraces_are_equivalent(self, htrace1: HTrace, htrace2: HTrace) -> bool:
        """ Use the Mann-Whitney U test to compare htraces.

        :param htrace1: first hardware trace
        :param htrace2: second hardware trace
        :return: True if the p-value of the test is above CONF.analyser_stat_threshold
        """
        _, p_value = stats.mannwhitneyu(htrace1.get_raw_traces(), htrace2.get_raw_traces())
        return bool(p_value > CONF.analyser_stat_threshold)


class ChiSquaredAnalyser(EquivalenceAnalyserCommon):
    """
    A variant of the analyser that uses the chi-squared test to compare htraces.

    Two htraces are considered equivalent if their normalized chi-squared statistic
    is below CONF.analyser_stat_threshold.
    """

    def __init__(self) -> None:
        """ Validate the configured threshold against the first configured sample size """
        super().__init__()

        # Sanity check: compute the statistic for two samples that have no values in common.
        # htraces_are_equivalent treats the traces as equivalent when stat < threshold,
        # hence if the threshold is above the statistic of these samples, the analyser would
        # not be able to tell them apart, i.e., the threshold is too high
        a = [1] * CONF.executor_sample_sizes[0]
        b = [2] * CONF.executor_sample_sizes[0]
        stat = self.homogeneity_test(a, b)
        if CONF.analyser_stat_threshold > stat:
            error("analyser_stat_threshold is too high for the given sample size")

    def homogeneity_test(self, x: IntArrayLike, y: IntArrayLike) -> float:
        """ Use the chi-squared test to compare two samples of equal size.

        :param x: first sample
        :param y: second sample (must have the same length as x)
        :return: chi-squared statistic divided by the total number of elements in x and y
        """
        assert len(x) == len(y)
        counter1 = Counter(x)
        counter2 = Counter(y)
        keys = set(counter1.keys()) | set(counter2.keys())

        # observed: per-value counts of the first sample followed by those of the second;
        # expected: the average of the two counts for every value, repeated for both samples
        observed = [counter1[k] for k in keys] + [counter2[k] for k in keys]
        expected = [(counter1[k] + counter2[k]) / 2 for k in keys] * 2
        ddof = len(keys) - 1
        stat, _ = stats.chisquare(observed, expected, ddof=ddof)

        # normalize by the total number of samples; convert to the builtin float
        # so that the return value matches the annotation
        return float(stat) / (len(x) + len(y))

    def htraces_are_equivalent(self, htrace1: HTrace, htrace2: HTrace) -> bool:
        """ Compare the htraces with the chi-squared homogeneity test.

        :param htrace1: first hardware trace
        :param htrace2: second hardware trace
        :return: True if the normalized statistic is below CONF.analyser_stat_threshold
        """
        stat = self.homogeneity_test(htrace1.get_raw_traces(), htrace2.get_raw_traces())
        return bool(stat < CONF.analyser_stat_threshold)


================================================
FILE: rvzr/arch/__init__.py
================================================


================================================
FILE: rvzr/arch/arm64/__init__.py
================================================


================================================
FILE: rvzr/arch/arm64/asm_parser.py
================================================
"""
File: Parsing of assembly files into our internal representation (TestCaseCode).
      This file contains arm64-specific code.

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
# FIXME: this implementation is quite brittle; rewrite it using a proper parser (keystone ?)

from __future__ import annotations
import re
from typing import TYPE_CHECKING, List

from rvzr.asm_parser import AsmParser, AsmLineParser, AsmParserError
from rvzr.instruction_spec import OT, InstructionSpec

from .target_desc import ARM64TargetDesc

if TYPE_CHECKING:
    from rvzr.isa_spec import InstructionSet
    from rvzr.target_desc import TargetDesc


# ==================================================================================================
# Private: Parser of assembly lines in ARM64 syntax
# ==================================================================================================
class _ARM646LineParser(AsmLineParser):
    """
    Parser of assembly lines in ARM64 syntax.

    Implements the ISA-specific hooks of AsmLineParser: tokenization of a line,
    extraction of the instruction name and operands, and matching of the operands
    against candidate instruction specs.
    """
    _target_desc: ARM64TargetDesc
    _curr_ln: int

    def __init__(self, isa_spec: InstructionSet, target_desc: ARM64TargetDesc) -> None:
        super().__init__(isa_spec, target_desc)
        self._comment_char = "//"
        # Groups: mnemonic up to (and including) an optional '.', the rest of the first word
        # (e.g., the condition code in `b.eq`), up to four comma-separated operands,
        # and an optional trailing comment
        self._re_tokenize = re.compile(
            r"^([^ .]+\.?)([^ ]+)? ([^ ,]+)(,[^,]+)?(,[^,]+)?(,[^,]+)?( //.*)?")
        # Fallback for lines that consist of a single word (no operands)
        self._re_tokenize_nops = re.compile(r"^([^ .]+\.?)([^ ]+)?")
        self._condition_code = list(target_desc.branch_conditions.keys())

    # ----------------------------------------------------------------------------------------------
    # Implementation of ISA-specific hooks
    def _tokenize(self, line: str) -> List[str]:
        """
        Split an assembly line into tokens: the instruction name followed by its operands.

        :param line: the assembly line to tokenize
        :return: list of tokens; a memory operand (`[...]`) is always returned as one token
        :raises AsmParserError: if the line matches neither tokenizer regex, or if a memory
                operand is opened with `[` but no later token ends with `]`
        """
        matches = self._re_tokenize.findall(line) or self._re_tokenize_nops.findall(line)
        if not matches:
            raise AsmParserError(self._curr_ln, "Could not tokenize the line")
        tokens = [t.removeprefix(",") for t in matches[0] if t]

        # the regex above splits memory address operands into multiple tokens
        # we need to merge them back
        tokens_merged = []
        mem_started = False
        mem_token = ""
        for token in tokens:
            if not token:
                continue
            if token[0] == "[" and token[-1] == "]":
                # the memory operand was not split; keep it as is
                tokens_merged.append(token)
                continue
            if token[0] == "[":
                mem_started = True
                mem_token = token
                continue
            if token[-1] == "]":
                tokens_merged.append(mem_token + "," + token)
                mem_started = False
                mem_token = ""
                continue
            if mem_started:
                mem_token += "," + token
                continue
            tokens_merged.append(token)

        # a memory operand that was opened but never closed would otherwise be dropped silently,
        # producing a misleading operand list; report it at the point where it is detected
        if mem_started:
            raise AsmParserError(self._curr_ln,
                                 "Could not tokenize the line: unterminated memory operand")

        return tokens_merged

    def _get_instruction_name(self, line: str, tokens: List[str]) -> str:
        """ Get the instruction name, which is always the first token """
        return tokens[0]

    def _get_instruction_operands(self, _: str, __: str, tokens: List[str]) -> List[str]:
        """ Get the list of operand strings from the tokens """
        return tokens[1:]

    def _get_initial_candidate_specs(self, _: str, name: str) -> List[InstructionSpec]:
        """ Get the list of candidate specs for an instruction with the given name  """
        return self._instruction_map.get(name, [])

    def _check_if_spec_matches(self, spec: InstructionSpec, operands_raw: List[str]) -> bool:
        """
        Check if the given spec matches the given list of operand strings

        :param spec: candidate instruction spec
        :param operands_raw: operand strings as returned by _get_instruction_operands
        :return: True if the operand count matches and every operand string is compatible
                 with the type (and, for registers and keyword immediates, the allowed values)
                 of the spec operand at the same position
        """
        # pylint: disable=too-many-return-statements  # justified for selectors
        # pylint: disable=too-many-branches  # justified for selectors

        if len(spec.operands) != len(operands_raw):
            return False

        for op_spec, op_raw in zip(spec.operands, operands_raw):
            # match condition
            if op_spec.type == OT.COND:
                if op_raw not in self._condition_code:
                    return False
                continue

            # match label
            if op_raw.startswith("."):
                if op_spec.type != OT.LABEL:
                    return False
                continue

            # match address
            if "[" in op_raw:
                if op_spec.type not in [OT.AGEN, OT.MEM]:
                    return False
                continue

            # match immediate value
            if op_raw.startswith("#"):
                if op_spec.type != OT.IMM:
                    return False
                continue

            # match register
            if op_spec.type == OT.REG:
                if op_raw not in op_spec.values:
                    return False
                continue

            # match keyword immediate
            if op_spec.type == OT.IMM:
                if op_raw not in op_spec.values:
                    return False
                continue

            # no match
            return False
        return True


# ==================================================================================================
# Public Interface: Parser of ARM64 assembly files
# ==================================================================================================
class ARM64AsmParser(AsmParser):
    """
    Implementation of the AsmParser interface for ARM64 assembly files.

    Plugs the ARM64 line parser into the generic AsmParser and configures the
    placeholder that stands in for macros in the assembly.
    """

    def __init__(self, isa_spec: InstructionSet, target_desc: TargetDesc) -> None:
        """
        :param isa_spec: instruction set specification used to match parsed instructions
        :param target_desc: target description; must be an ARM64TargetDesc
        """
        super().__init__(isa_spec, target_desc)
        assert isinstance(target_desc, ARM64TargetDesc)
        self._line_parser = _ARM646LineParser(isa_spec, target_desc)
        # must stay in sync with the placeholder emitted when macros are printed as assembly
        self._asm_patcher.set_macro_placeholder("nop; nop; nop")


================================================
FILE: rvzr/arch/arm64/config.py
================================================
"""
File: arm64-specific Configuration Options

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from typing import List, Dict

# Values accepted for the ARM64-specific configuration options, keyed by option name.
# NOTE(review): presumably consumed by the generic config validation code - confirm.
_option_values = {
    # keys that may appear in an actor definition
    'actor': [
        'name',
        'mode',
        'privilege_level',
        'data_properties',
        'data_ept_properties',
        'observer',
        'instruction_blocklist',
        'fault_blocklist',
    ],
    # only a single mode and a single privilege level are listed for ARM64
    "actor_mode": ['host',],
    "actor_privilege_level": ['kernel',],
    "actor_data_properties": [
        'present',
        'writable',
        'user',
        'accessed',
        'dirty',
        'executable',
        'reserved_bit',
        'randomized',
    ],
    "actor_data_ept_properties": [
        "present",
        "writable",
        "executable",
        "accessed",
        "dirty",
        'reserved_bit',
        'randomized',
    ],
    'unicorn_instruction_categories': [
        "general-arithmetic",
        "general-barrier",
        "general-bitwise",
        "general-uncond_branch",
        "general-cond_branch",
        "general-comparison",
        "general-condsel",
        "general-dataxfer",
        "general-misc",
    ],
    "dr_instruction_categories": [
        # DynamoRIO backend is not yet supported on ARM
    ],
}

# in contrast to x86, on ARM64, we handle all fault types by default
# (every fault name is listed exactly once)
_handled_faults: List[str] = ["PF", "DE", "DB", "BP", "BR", "UD", "GP"]

instruction_categories: List[str] = [
    "general-arithmetic",
    "general-dataxfer",
]
""" instruction_categories: a default list of tested instruction categories """

# instructions in this list are always added to the blocklist below
_buggy_instructions: List[str] = []

instruction_blocklist: List[str] = [
    # no explicitly blocked instructions so far
    *_buggy_instructions,
]  # yapf: disable


# Registers excluded from use: everything except x0 .. x5 (and the matching w0 .. w5)
register_blocklist: List[str] = [
    *(f"x{idx}" for idx in range(6, 32)),
    'sp',
    *(f"w{idx}" for idx in range(6, 32)),
    'wsp', 'wpc',
    'xzr', 'wzr',
]  # yapf: disable


# FIXME: this is copied from x86, needs to be adapted for ARM64
# Maps a generator-level fault description to the short fault name
# (the short names are the ones that also appear in _handled_faults)
_generator_fault_to_fault_name: Dict[str, str] = {
    'div-by-zero': "DE",
    'div-overflow': "DE",
    'opcode-undefined': "UD",
    'breakpoint': "BP",
    'debug-register': "DB",
    'non-canonical-access': "GP",
    'user-to-kernel-access': "PF",
}

# Default definition of an actor; the keys mirror the 'actor' entry of _option_values.
# NOTE(review): 'data_ept_properties' below contains a 'user' key, which is not listed under
# 'actor_data_ept_properties' in _option_values - confirm whether this is intentional.
_actor_default = {
    'name': "main",
    'mode': "host",
    'privilege_level': "kernel",
    'observer': False,
    'data_properties': {
        'present': True,
        'writable': True,
        'user': False,
        'accessed': True,
        'executable': False,
        'randomized': False,
    },
    'data_ept_properties': {
        'present': True,
        'writable': True,
        'executable': False,
        'accessed': True,
        'user': False,
        'randomized': False,
    },
    'instruction_blocklist': set(),
    'fault_blocklist': set(),
}


================================================
FILE: rvzr/arch/arm64/executor.py
================================================
"""
File: Implementation of executor for arm64 architecture

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""

from rvzr.executor import Executor
from rvzr.config import ConfigException
from rvzr.target_desc import TargetDesc


class ARM64Executor(Executor):
    """ Executor for ARM64 targets; it refuses to be created on CPUs of any other vendor """

    def __init__(self, enable_mismatch_check_mode: bool = False):
        """
        :param enable_mismatch_check_mode: forwarded unchanged to the generic Executor
        :raises ConfigException: if the vendor reported by TargetDesc is not "ARM"
        """
        super().__init__(enable_mismatch_check_mode)
        self._vendor = TargetDesc.get_vendor()
        running_on_arm = self._vendor == "ARM"
        if not running_on_arm:
            message = "Attempting to run ARM64Executor executor on a non-ARM CPUs!\n" \
                "Change the `executor` configuration option to the appropriate vendor value."
            raise ConfigException(message)

    def _set_vendor_specific_features(self) -> None:
        """ Nothing to configure: this executor has no vendor-specific features """


================================================
FILE: rvzr/arch/arm64/fuzzer.py
================================================
"""
File: arm64 implementation of the fuzzer

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from __future__ import annotations

from typing import TYPE_CHECKING, List, Generator
from contextlib import contextmanager
import tempfile
import os

from rvzr.fuzzer import Fuzzer, ArchitecturalFuzzer, ArchDiffFuzzer
from rvzr.traces import HTrace
from rvzr.tc_components.test_case_data import InputData
from rvzr.tc_components.test_case_code import TestCaseProgram
from rvzr.stats import FuzzingStats
from rvzr.config import CONF
from .executor import ARM64Executor

if TYPE_CHECKING:
    from rvzr.asm_parser import AsmParser
    from rvzr.elf_parser import ELFParser
    from rvzr.code_generator import CodeGenerator
    from rvzr.executor import Executor

# Handle to the fuzzing statistics; the observation filter below counts filtered test cases in it
STAT = FuzzingStats()


# ==================================================================================================
# ARM64-specific Implementation of the Fuzzer
# ==================================================================================================
class ARM64Fuzzer(Fuzzer):
    """
    Implementation of the standard fuzzing mode for the arm64 architecture.

    Extends the generic Fuzzer class with filtering of non-useful test cases
    by means of an Observation Filter: a test case is dropped when adding fences
    after its instructions does not change the collected hardware traces.
    """

    executor: ARM64Executor

    # ----------------------------------------------------------------------------------------------
    # Private Methods
    def _filter(self, test_case: TestCaseProgram, inputs: List[InputData]) -> bool:
        """
        This function implements a multi-stage algorithm that gradually filters out
        uninteresting test cases

        :param test_case: the target test case
        :param inputs: list of inputs to be tested
        :return: True if the test case should be filtered out; False otherwise
        """
        # Exit if all filters are disabled
        if not CONF.enable_observation_filter:
            return False

        # Number of repetitions for each input
        reps = CONF.executor_filtering_repetitions

        with _quick_and_dirty_mode(self.executor):  # Speed up the execution by disabling checks
            # Collect hardware traces for the test case
            try:
                self.executor.load_test_case(test_case)
                org_htraces = self.executor.trace_test_case(inputs, reps)
            except IOError:
                return True  # a test case that cannot be traced is not worth keeping

            return self._observation_filter(test_case, inputs, reps, org_htraces)

    def _observation_filter(self, test_case: TestCaseProgram, inputs: List[InputData], reps: int,
                            org_htraces: List[HTrace]) -> bool:
        """
        Check if any of the htraces contain a speculative cache eviction
        for this create a fenced version of the test case and collect traces for it

        The fenced version is written to a temporary file, which is removed again
        before this method returns, regardless of whether tracing succeeded.

        :param test_case: the target test case
        :param inputs: list of inputs to be tested
        :param reps: number of repetitions for each input
        :param org_htraces: list of HTrace objects collected while executing the test case
        :return: True if the test case should be filtered out; False otherwise
        """
        if not CONF.enable_observation_filter:
            return False

        # only the name is needed; the file is re-opened for writing when the fences are added
        with tempfile.NamedTemporaryFile(delete=False) as fenced:
            fenced_name = fenced.name

        try:
            fenced_test_case = _create_fenced_test_case(test_case.asm_path(), fenced_name,
                                                        self.asm_parser, self.code_gen,
                                                        self.elf_parser)
            try:
                self.executor.load_test_case(fenced_test_case)
                fenced_htraces = self.executor.trace_test_case(inputs, reps)
            except IOError:
                return True  # skip the test case if there is an error
        finally:
            # delete=False above makes us responsible for the cleanup on every exit path
            if os.path.exists(fenced_name):
                os.remove(fenced_name)

        # the test case is uninteresting if fencing did not change the trace of any input
        traces_match = all(
            self.analyser.htraces_are_equivalent(fenced_htraces[i], org_htraces[i])
            for i, _ in enumerate(inputs))
        if traces_match:
            STAT.observ_filter += 1
            return True

        return False


# ==================================================================================================
# Non-standard Fuzzers
# ==================================================================================================
class ARM64ArchitecturalFuzzer(ArchitecturalFuzzer):
    """
    ARM64-specific implementation of the ArchitecturalFuzzer.

    The class adds no members of its own; all behavior comes from ArchitecturalFuzzer.
    """
    # No ARM64-specific implementation is needed


class ARM64ArchDiffFuzzer(ArchDiffFuzzer):
    """
    ArchDiffFuzzer for ARM64: supplies the ARM64 way of building a fenced test case.
    """

    @staticmethod
    def _create_fenced_test_case(original_asm: str, fenced_asm: str, asm_parser: AsmParser,
                                 generator: CodeGenerator,
                                 elf_parser: ELFParser) -> TestCaseProgram:
        """ Delegate to the module-level helper that inserts the ARM64 fences """
        return _create_fenced_test_case(
            original_asm=original_asm,
            fenced_asm=fenced_asm,
            asm_parser=asm_parser,
            generator=generator,
            elf_parser=elf_parser,
        )


# ==================================================================================================
# Helper functions
# ==================================================================================================
@contextmanager
def _quick_and_dirty_mode(executor: Executor) -> Generator[None, None, None]:
    """
    Run the body of a `with` statement while the executor is in quick and dirty mode.

    The mode is switched on when the block is entered and switched off when it is left,
    including when the block exits with an exception.
    """
    toggle = executor.set_quick_and_dirty
    try:
        toggle(True)
        yield None
    finally:
        toggle(False)


def _create_fenced_test_case(original_asm: str, fenced_asm: str, asm_parser: AsmParser,
                             generator: CodeGenerator, elf_parser: ELFParser) -> TestCaseProgram:
    """
    Write a fenced copy of an assembly file and parse it into a test case.

    Every line of `original_asm` is copied to `fenced_asm`. A `dsb SY` / `isb` pair is
    appended after each line that is non-empty, does not mention "macro", and does not
    start with "/", "." or "b" (all checks are done on the stripped, lower-cased line).
    NOTE(review): the "b" prefix presumably targets branches, but it also matches any
    other mnemonic starting with "b" - confirm that this is intended.

    :param original_asm: path to the assembly file to read
    :param fenced_asm: path of the file to (over)write with the fenced copy
    :param asm_parser: parser used to load the fenced file
    :param generator: passed through to `asm_parser.parse_file`
    :param elf_parser: passed through to `asm_parser.parse_file`
    :return: the result of parsing the fenced file
    """
    unfenced_prefixes = ("/", ".", "b")
    with open(original_asm, 'r') as source, open(fenced_asm, 'w') as target:
        for raw_line in source:
            target.write(raw_line)
            normalized = raw_line.strip().lower()
            if not normalized or "macro" in normalized:
                continue
            if normalized[0] in unfenced_prefixes:
                continue
            target.write('dsb SY\n isb\n')
    return asm_parser.parse_file(fenced_asm, generator, elf_parser)


================================================
FILE: rvzr/arch/arm64/generator.py
================================================
"""
File: arm64 implementation of the test case generator

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from __future__ import annotations

import math
import random
from typing import List, Dict, TYPE_CHECKING, Tuple, Callable, Literal

from rvzr.code_generator import CodeGenerator, Pass, Printer
from rvzr.sandbox import SandboxLayout, DataArea
from rvzr.instruction_spec import InstructionSpec
from rvzr.tc_components.instruction import Instruction, Operand, RegisterOp, FlagsOp, \
    MemoryOp, ImmediateOp, AgenOp, CondOp
from rvzr.tc_components.test_case_code import TestCaseProgram, BasicBlock, InstructionNode

from .target_desc import ARM64TargetDesc

if TYPE_CHECKING:
    from rvzr.elf_parser import ELFParser
    from rvzr.asm_parser import AsmParser
    from rvzr.isa_spec import InstructionSet
    from rvzr.target_desc import TargetDesc


# ==================================================================================================
# Private: Assembly Printing
# ==================================================================================================
class _ARM64Printer(Printer):
    """ Printer that renders instructions, operands and macros in ARM64 assembly syntax """

    def __init__(self, target_desc: ARM64TargetDesc) -> None:
        super().__init__(target_desc)
        self.prologue_template = [""]
        self.epilogue_template = [
            ".section .data.main\n",
            ".test_case_exit:nop\n",
        ]

    def _instruction_to_str(self, inst: Instruction) -> str:
        """
        Override to handle ARM64 conditional operands.

        A leading condition operand is glued directly to the instruction name (the condition
        is part of the mnemonic); the remaining operands are printed as a comma-separated list.
        Instrumentation and noremove instructions are tagged with a trailing comment.
        """
        if inst.name == "macro":
            return self._macro_to_str(inst)

        # Handle conditional operands specially for ARM64
        cond_op_str = ""
        operands = list(inst.operands)
        if operands and isinstance(operands[0], CondOp):
            cond_op_str = operands[0].value
            operands = operands[1:]

        operands_str = ", ".join(self._operand_to_str(op) for op in operands)
        if inst.is_instrumentation:
            comment = "// instrumentation"
        elif inst.is_noremove:
            comment = "// noremove"
        else:
            comment = ""
        return f"{inst.name}{cond_op_str} {operands_str} {comment}"

    def _operand_to_str(self, op: Operand) -> str:
        """
        Convert an operand to its assembly form: memory and address-generation operands are
        wrapped in brackets, numeric immediates get a `#` prefix, everything else is printed
        verbatim.
        """
        if isinstance(op, (MemoryOp, AgenOp)):
            return f"[{op.value}]"
        if isinstance(op, ImmediateOp):
            if self._is_digit_extended(op.value):
                return f"#{op.value}"
            # keyword immediates and values that already carry their own prefix
            return f"{op.value}"

        return op.value

    def _macro_to_str(self, inst: Instruction) -> str:
        """ Print a macro as a `.macro<name><args>:` label followed by the macro placeholder """
        macro_placeholder = "nop; nop; nop"
        if inst.operands[1].value.lower() == ".noarg":
            return f".macro{inst.operands[0].value}: {macro_placeholder}"
        return f".macro{inst.operands[0].value}{inst.operands[1].value}: {macro_placeholder}"

    @staticmethod
    def _is_digit_extended(s: str) -> bool:
        """
        An extended version of the is_digit function. The difference is that is_digit
        handles only decimal numbers, while this function can handle hex and binary
        numbers as well.

        The `0x` / `0b` prefix is recognized case-insensitively and may be preceded by a sign,
        so that values such as "-0x10" are classified as numbers, too.

        :param s: the string to classify
        :return: True if `s` is a decimal, hexadecimal or binary integer literal
        """
        unsigned = s[1:] if s[:1] in ("+", "-") else s
        prefix = unsigned[:2].lower()
        if prefix == "0x":
            base = 16
        elif prefix == "0b":
            base = 2
        else:
            base = 10
        try:
            # int() itself accepts the sign and the prefix that matches the base
            int(s, base)
            return True
        except ValueError:
            return False


# ==================================================================================================
# Private: Collection of Instrumentation Passes
# ==================================================================================================

# Kinds of instrumentation handled by the sandbox pass; only memory accesses so far
_DispatcherKey = Literal["memory"]
# For every kind: (nodes collected for sandboxing, function that sandboxes one node of a block)
_SandboxDispatcher = Dict[_DispatcherKey, Tuple[List[InstructionNode],
                                                Callable[[InstructionNode, BasicBlock], None]]]


class _ARM64SandboxPass(Pass):
    """
    A pass that instruments the test case to prevent certain types of faults,
    including:
    - out-of-sandbox memory accesses
    - ... (more to be added in the future)

    NOTE: in contrast to x86, arm64 does not fault on div by zero, so no need to
    sandbox division instructions
    """

    # pylint: disable=R0801
    # NOTE: there's an overlap between this class and it's equivalent in x86/generator.py
    # This is acceptable for now as functions are different enough so that deduplication
    # would hurt readability

    def __init__(self, target_desc: TargetDesc) -> None:
        super().__init__()
        self.target_desc = target_desc

        size_of_directly_accessible_memory = SandboxLayout.data_area_size(DataArea.MAIN) \
            + SandboxLayout.data_area_size(DataArea.FAULTY)
        # log2 is used instead of log(x, 2): the latter goes through a floating-point division
        # and is less accurate, which matters because the result is truncated to an integer
        mask_width = int(math.log2(size_of_directly_accessible_memory))
        # binary immediate with `mask_width` low bits set
        self.sandbox_address_mask = "#0b" + "1" * mask_width

    def run_on_test_case(self, test_case: TestCaseProgram) -> None:
        """
        Instrument all instructions of the test case that access memory explicitly.
        Instrumentation and template instructions are left untouched.
        """
        dispatcher: _SandboxDispatcher = {
            "memory": ([], self._sandbox_memory_access),
        }

        for bb in test_case.iter_basic_blocks():
            dispatcher["memory"][0].clear()

            # collect all instructions that require sandboxing
            # (collected first, because sandboxing inserts new nodes into the block)
            for node in bb.iter_nodes():
                inst = node.instruction
                if inst.is_instrumentation or inst.is_from_template:
                    continue

                if inst.has_mem_operand(True):
                    dispatcher["memory"][0].append(node)

            # sandbox them
            for nodes, sandbox_func in dispatcher.values():
                for node in nodes:
                    sandbox_func(node, bb)

    def _sandbox_memory_access(self, node: InstructionNode, parent: BasicBlock) -> None:
        """
        Force the memory accesses into the page starting from x20

        Two instrumentation instructions are inserted before the node: an `and` that masks
        the address register with the sandbox mask, and an `add` that adds x20 to it.

        :param node: the node with the memory-accessing instruction
        :param parent: the basic block that contains the node
        :raises NotImplementedError: if the instruction has implicit memory operands
                (or no memory operands at all)
        """
        instr = node.instruction

        mem_operands = instr.get_mem_operands(True)
        implicit_mem_operands = \
            instr.get_mem_operands(include_explicit=False, include_implicit=True)
        mask = self.sandbox_address_mask

        if mem_operands and not implicit_mem_operands:
            assert len(mem_operands) == 1, \
                f"Instructions with multiple memory accesses are not yet supported: {instr.name}"
            mem_operand = mem_operands[0]
            address_reg = mem_operand.value
            # the width of the immediate is capped at 32 bits
            imm_width = min(mem_operand.width, 32)
            apply_mask = Instruction("and", is_instrumentation=True) \
                .add_op(RegisterOp(address_reg, mem_operand.width, False, True)) \
                .add_op(RegisterOp(address_reg, mem_operand.width, True, False)) \
                .add_op(ImmediateOp(mask, imm_width)) \
                .add_op(FlagsOp(("w", "", "", "w", "w", "", "", "", "w")), True)
            parent.insert_before(node, apply_mask)
            add_base = Instruction("add", is_instrumentation=True) \
                .add_op(RegisterOp(address_reg, mem_operand.width, False, True)) \
                .add_op(RegisterOp(address_reg, mem_operand.width, True, False)) \
                .add_op(RegisterOp("x20", 64, True, False)) \
                .add_op(FlagsOp(("w", "", "", "w", "w", "", "", "", "w")), True)
            parent.insert_before(node, add_base)
            return

        raise NotImplementedError("Implicit memory accesses are not yet supported")

    @staticmethod
    def requires_sandbox(inst: InstructionSpec) -> bool:
        """ Check if the instruction requires instrumentation to prevent faults """
        return bool(inst.has_mem_operand)


class _ARM64PatchUndefinedLoadsPass(Pass):
    """
    A pass that replaces the first register operand of `ldr`/`str`-like instructions
    when the same register also shows up in the memory operand of an instruction that
    carries an immediate operand.
    NOTE(review): presumably this avoids forms whose behavior is not defined when the
    transferred register and the written-back base register coincide - confirm.
    """

    def __init__(self, target_desc: TargetDesc) -> None:
        super().__init__()
        self.target_desc = target_desc

    def run_on_test_case(self, test_case: TestCaseProgram) -> None:
        """ Patch the affected instructions in every basic block of the test case """
        for bb in test_case.iter_basic_blocks():
            # first pick the instructions, then rewrite them;
            # instrumentation and template instructions are never touched
            to_patch: List[Instruction] = [
                node.instruction
                for node in bb.iter_nodes()
                if not (node.instruction.is_instrumentation or node.instruction.is_from_template)
                and self._is_post_index(node.instruction)
            ]

            for inst in to_patch:
                self._replace_first_operand(inst)

    def _replace_first_operand(self, inst: Instruction) -> None:
        """ Swap the first operand for a randomly chosen different register of the same width """
        current = inst.operands[0]
        assert isinstance(current, RegisterOp)
        by_size = self.target_desc.registers_by_size
        assert current.width in by_size
        candidates = [reg for reg in by_size[current.width] if reg != current.value]
        inst.operands[0].value = random.choice(candidates)

    def _is_post_index(self, inst: Instruction) -> bool:
        """
        Check whether the instruction needs patching.

        :return: True if the name contains "ldr" or "str", the instruction has at least one
                 immediate operand, and the 64-bit name of its first (register) operand
                 occurs in the value of its second (memory) operand
        """
        name = inst.name
        if not ("ldr" in name or "str" in name):
            return False
        if inst.get_imm_operands() == []:
            return False

        ops = inst.operands
        first = ops[0]
        assert isinstance(first, RegisterOp)
        second = ops[1]
        assert isinstance(second, MemoryOp)

        # compare on the 64-bit register name, regardless of the width used by the first operand
        canonical = self.target_desc.reg_normalized[first.value]
        wide_name = self.target_desc.reg_denormalized[canonical][64]
        return wide_name in second.value


# ==================================================================================================
# Public Interface
# ==================================================================================================
class ARM64Generator(CodeGenerator):
    """ Test case program generator specialized for arm64 """

    def __init__(self, seed: int, instruction_set: InstructionSet, target_desc: TargetDesc,
                 asm_parser: AsmParser, elf_parser: ELFParser) -> None:
        """
        Set up the generic generator and attach the arm64 passes and printer.

        All arguments are forwarded unchanged to CodeGenerator; the target description
        held by the generator must be an ARM64TargetDesc.
        """
        super().__init__(seed, instruction_set, target_desc, asm_parser, elf_parser)
        arm64_desc = self._target_desc
        assert isinstance(arm64_desc, ARM64TargetDesc)

        # instrumentation passes, in the order in which they are listed
        sandbox_pass = _ARM64SandboxPass(arm64_desc)
        patch_pass = _ARM64PatchUndefinedLoadsPass(arm64_desc)
        self._passes = [sandbox_pass, patch_pass]

        self._printer = _ARM64Printer(arm64_desc)


================================================
FILE: rvzr/arch/arm64/get_spec.py
================================================
"""
File: A script that downloads the ARM64 instruction set
      and parses it into a JSON file that can be used by the generator.

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from typing import List
import shutil

from rvzr.logs import warning, inform


class Downloader:
    """
    Stand-in for the ARM64 instruction set downloader.

    No download happens: `run` copies a spec file that ships with the tests.
    """

    def __init__(self, extensions: List[str], out_file: str) -> None:
        """
        :param extensions: requested ISA extensions (stored, but not used by `run`)
        :param out_file: path where the spec file will be written
        """
        self._extensions = extensions
        self._out_file = out_file
        notice = "The ARM64 spec retrieval is not implemented yet, \n" \
            "and this script will just copy a spec file from tests/arm64/min_arm64.json"
        warning("downloader", notice)

    def run(self) -> None:
        """ Copy the bundled spec file to the output path and report it """
        destination = self._out_file
        # the source path is relative to the current working directory
        shutil.copy("tests/arm64/min_arm64.json", destination)
        inform("downloader", f"ARM64 spec is copied to {self._out_file}")


================================================
FILE: rvzr/arch/arm64/target_desc.py
================================================
"""
File: arm64-specific constants and lists

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from typing import List
import re
import unicorn.arm64_const as ucc  # type: ignore

from rvzr.tc_components.instruction import Instruction
from rvzr.target_desc import TargetDesc, CPUDesc, UnicornTargetDesc


class ARM64TargetDesc(TargetDesc):
    """
    Target description for arm64 architecture.

    Holds the lookup tables that describe registers, page table bits and branch conditions,
    and builds a description of the CPU under test from /proc/cpuinfo.
    """

    # register name -> width in bits
    register_sizes = {
        "w0": 32, "w1": 32, "w2": 32, "w3": 32, "w4": 32, "w5": 32, "w6": 32, "w7": 32,
        "wsp": 32, "wzr": 32,
        "x0": 64, "x1": 64, "x2": 64, "x3": 64, "x4": 64, "x5": 64, "x6": 64, "x7": 64,
        "sp": 64, "xsp": 64, "xzr": 64,
    }  # yapf: disable

    # width in bits -> register names of that width
    # (replaced in __init__ by the result of _filter_blocked_registers())
    registers_by_size = {
        32: ["w0", "w1", "w2", "w3", "w4", "w5", "w6", "w7"],
        64: ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7"],
    }  # yapf: disable

    # register name -> width-independent name; the 32- and 64-bit views of a register
    # map to the same name
    reg_normalized = {
        "w0": "R0", "x0": "R0",
        "w1": "R1", "x1": "R1",
        "w2": "R2", "x2": "R2",
        "w3": "R3", "x3": "R3",
        "w4": "R4", "x4": "R4",
        "w5": "R5", "x5": "R5",
        "w6": "R6", "x6": "R6",
        "w7": "R7", "x7": "R7",
        "w8": "R8", "x8": "R8",
        "w9": "R9", "x9": "R9",
        "w10": "R10", "x10": "R10",
        "w20": "R20", "x20": "R20",
        "w30": "R30", "x30": "R30",
        "CF": "CF", "ZF": "ZF", "SF": "SF", "OF": "OF",
        "pc": "RIP",
        "sp": "RSP", "wsp": "RSP", "xsp": "RSP",
    }  # yapf: disable

    # width-independent name -> {width in bits: register name}
    # NOTE(review): there are no entries for R8, R9 and R10 (nor for the flags), although
    # reg_normalized can produce these names - confirm that no caller looks them up here
    reg_denormalized = {
        "R0": {64: "x0", 32: "w0"},
        "R1": {64: "x1", 32: "w1"},
        "R2": {64: "x2", 32: "w2"},
        "R3": {64: "x3", 32: "w3"},
        "R4": {64: "x4", 32: "w4"},
        "R5": {64: "x5", 32: "w5"},
        "R6": {64: "x6", 32: "w6"},
        "R7": {64: "x7", 32: "w7"},
        "R20": {64: "x20", 32: "w20"},
        "R30": {64: "x30", 32: "w30"},
        "RIP": {64: "pc"},
        "RSP": {64: "sp", 32: "wsp"},
    }  # yapf: disable

    mem_index_registers = ["x0", "x1", "x2", "x3", "x4", "x5"]

    # page property -> (name of the PTE bit, flag)
    # NOTE(review): the flag is True exactly for the bits named "non_*", so it presumably
    # marks bits whose meaning is inverted w.r.t. the property - confirm
    page_property_to_pte_bit_name = {
        "present": ("valid", False),
        "writable": ("non_writable", True),
        "user": ("user", False),
        "accessed": ("accessed", False),
        "executable": ("non_executable", True),
    }

    # name of the PTE bit -> (bit position, flag)
    # NOTE(review): the flag is presumably the default value of the bit - confirm
    pte_bits = {
        "valid": (0, True),
        "user": (6, False),
        "non_writable": (7, False),
        "accessed": (10, True),
        "non_executable": (53, True),
    }

    # FIXME: EPTE is not yet supported on ARM64; this is a placeholder
    page_property_to_vm_pte_bit_name = {
        "present": ("valid", False),
        "writable": ("non_writable", True),
        "user": ("user", False),
        "accessed": ("accessed", False),
        "executable": ("non_executable", True),
    }

    # FIXME: EPTE is not yet supported on ARM64; this is a placeholder
    vm_pte_bits = {
        "valid": (0, True),
        "user": (0, False),
        "non_writable": (0, False),
        "accessed": (0, True),
        "non_executable": (0, True),
    }

    # condition code -> 9-element list in which "r" marks a position read by the condition
    # NOTE(review): the positions presumably follow the flag order used by FlagsOp - confirm
    branch_conditions = {
        "eq": ["", "", "", "r", "", "", "", "", ""],
        "ne": ["", "", "", "r", "", "", "", "", ""],
        "cs": ["r", "", "", "", "", "", "", "", ""],
        "cc": ["r", "", "", "", "", "", "", "", ""],
        "mi": ["", "", "", "", "r", "", "", "", ""],
        "pl": ["", "", "", "", "r", "", "", "", ""],
        "vs": ["", "", "", "", "", "", "", "", "r"],
        "vc": ["", "", "", "", "", "", "", "", "r"],
        "hi": ["r", "", "", "r", "", "", "", "", ""],
        "ls": ["r", "", "", "r", "", "", "", "", ""],
        "ge": ["", "", "", "", "r", "", "", "", "r"],
        "lt": ["", "", "", "", "r", "", "", "", "r"],
        "gt": ["", "", "", "r", "r", "", "", "", "r"],
        "le": ["", "", "", "r", "r", "", "", "", "r"],
        "al": ["", "", "", "", "", "", "", "", ""]
    }

    def __init__(self) -> None:
        """ Build the description for the machine on which the code is running """
        super().__init__()

        # modify/set target parameters based on the CPU under test and the configuration
        self.registers_by_size = self._filter_blocked_registers()
        self.cpu_desc = self._build_cpu_desc()

        # connect Unicorn TD
        self.uc_target_desc = ARM64UnicornTargetDesc()

    @staticmethod
    def is_unconditional_branch(inst: Instruction) -> bool:
        """ Return True if the instruction is named `b` """
        return inst.name == "b"

    @staticmethod
    def is_call(inst: Instruction) -> bool:
        """ Return True if the instruction is named `bl` """
        return inst.name == "bl"

    def _build_cpu_desc(self) -> CPUDesc:
        """
        Build the CPU description from the vendor and the fields of /proc/cpuinfo.

        The first match of "CPU architecture", "CPU variant" and "CPU part" is parsed as a
        hexadecimal number and used as family, model and stepping, respectively.

        :return: CPUDesc built from (vendor, model, family, stepping)
        :raises AssertionError: if one of the fields is missing from /proc/cpuinfo
        """
        vendor = self.get_vendor()

        with open("/proc/cpuinfo") as f:
            cpuinfo = f.read()

            family_match = re.search(r"CPU architecture\s*:\s+(.*)", cpuinfo)
            assert family_match, "Failed to find family in /proc/cpuinfo"
            family = int(family_match.group(1), 16)

            # "CPU variant" takes the role of the model
            model_match = re.search(r"CPU variant\s+:\s+(.*)", cpuinfo)
            assert model_match, "Failed to find model name in /proc/cpuinfo"
            model = int(model_match.group(1), 16)

            # "CPU part" takes the role of the stepping
            stepping_match = re.search(r"CPU part\s+:\s+(.*)", cpuinfo)
            assert stepping_match, "Failed to find stepping in /proc/cpuinfo"
            stepping = int(stepping_match.group(1), 16)

        return CPUDesc(vendor, model, family, stepping)


class ARM64UnicornTargetDesc(UnicornTargetDesc):  # pylint: disable=too-few-public-methods
    """
    Unicorn-specific part of the arm64 target description:
    tables that translate register names into Unicorn register constants,
    plus the constants of the special-purpose registers.
    """

    # registers listed as usable: x0-x5, the NZCV flags, and the stack pointer
    usable_registers: List[int] = [
        ucc.UC_ARM64_REG_X0,
        ucc.UC_ARM64_REG_X1,
        ucc.UC_ARM64_REG_X2,
        ucc.UC_ARM64_REG_X3,
        ucc.UC_ARM64_REG_X4,
        ucc.UC_ARM64_REG_X5,
        ucc.UC_ARM64_REG_NZCV,
        ucc.UC_ARM64_REG_SP,
    ]

    usable_simd128_registers: List[int] = []

    # "x0" ... "x30" -> UC_ARM64_REG_X0 ... UC_ARM64_REG_X30
    reg_str_to_constant = {
        f"x{idx}": getattr(ucc, f"UC_ARM64_REG_X{idx}") for idx in range(31)
    }

    # normalized register names -> Unicorn constants
    reg_norm_to_constant = {
        # general-purpose registers
        "R0": ucc.UC_ARM64_REG_X0,
        "R1": ucc.UC_ARM64_REG_X1,
        "R2": ucc.UC_ARM64_REG_X2,
        "R3": ucc.UC_ARM64_REG_X3,
        "R4": ucc.UC_ARM64_REG_X4,
        "R5": ucc.UC_ARM64_REG_X5,
        "R6": ucc.UC_ARM64_REG_X6,
        "R7": ucc.UC_ARM64_REG_X7,
        "R20": ucc.UC_ARM64_REG_X20,
        "R30": ucc.UC_ARM64_REG_X30,
        # the whole flags register and its individual flags (SF=N, ZF=Z, CF=C, OF=V)
        # all resolve to the same NZCV register
        **dict.fromkeys(("FLAGS", "SF", "ZF", "CF", "OF"), ucc.UC_ARM64_REG_NZCV),
        # these two names have no Unicorn constant assigned in this table
        "RIP": -1,
        "RSP": -1,
    }

    barriers: List[str] = ['dmb', 'dsb', 'isb']
    flags_register: int = ucc.UC_ARM64_REG_NZCV
    pc_register: int = ucc.UC_ARM64_REG_PC
    sp_register: int = ucc.UC_ARM64_REG_SP
    actor_base_register: int = ucc.UC_ARM64_REG_X20


================================================
FILE: rvzr/arch/x86/__init__.py
================================================


================================================
FILE: rvzr/arch/x86/asm_parser.py
================================================
"""
File: Parsing of assembly files into our internal representation (TestCaseCode).
      This file contains x86-specific code.

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from __future__ import annotations
import re
from typing import TYPE_CHECKING, List

from rvzr.asm_parser import AsmParser, AsmLineParser, asm_parser_assert
from rvzr.instruction_spec import OT, InstructionSpec

if TYPE_CHECKING:
    from rvzr.isa_spec import InstructionSet
    from rvzr.target_desc import TargetDesc

# ==================================================================================================
# Private: Parser of assembly lines in Intel syntax
# ==================================================================================================
# Patterns recognizing the textual forms of an immediate operand.
# All of them are anchored at both ends, i.e., the whole operand string must match.
_PATTERN_CONST_INT = re.compile("^-?[0-9]+$")  # decimal number
_PATTERN_CONST_HEX = re.compile("^-?0x[0-9abcdef]+$")  # hex number; lowercase digits only
_PATTERN_CONST_BIN = re.compile("^-?0b[01]+$")  # binary number
_PATTERN_CONST_SUM = re.compile("^-?[0-9]+ *[+-] *[0-9]+$")  # sum/difference of two decimals

# Words treated as instruction prefixes; the line parser keeps them
# (space-separated) as a part of the instruction name
_ASM_PREFIXES = ["lock", "rex", "rep", "repe", "repne"]

# Alternative mnemonics -> the mnemonic used to look up the instruction spec.
# NOTE(review): the rep* entries at the end map in both directions
# (repe <-> repz, repne <-> repnz); confirm that this is intended
_ASM_SYNONYMS = {
    "je": "jz",
    "jne": "jnz",
    "jnae": "jb",
    "jc": "jb",
    "jae": "jnb",
    "jnc": "jnb",
    "jna": "jbe",
    "ja": "jnbe",
    "jnge": "jl",
    "jge": "jnl",
    "jng": "jle",
    "jg": "jnle",
    "jpe": "jp",
    "jpo": "jnp",
    "cmove": "cmovz",
    "cmovne": "cmovnz",
    "cmovnae": "cmovb",
    "cmovc": "cmovb",
    "cmovae": "cmovnb",
    "cmovnc": "cmovnb",
    "cmovna": "cmovbe",
    "cmova": "cmovnbe",
    "cmovnge": "cmovl",
    "cmovge": "cmovnl",
    "cmovng": "cmovle",
    "cmovg": "cmovnle",
    "cmovpe": "cmovp",
    "cmovpo": "cmovnp",
    "sete": "setz",
    "setne": "setnz",
    "setnae": "setb",
    "setc": "setb",
    "setae": "setnb",
    "setnc": "setnb",
    "setna": "setbe",
    "seta": "setnbe",
    "setnge": "setl",
    "setge": "setnl",
    "setng": "setle",
    "setg": "setnle",
    "setpe": "setp",
    "setpo": "setnp",
    "movabs": "mov",
    "repe": "repz",
    "repne": "repnz",
    "repnz": "repne",
    "repz": "repe",
}

# Size keyword of a memory operand -> operand width;
# the width is compared against the width declared in the instruction spec
_MEMORY_SIZES = {
    "byte": 8,
    "word": 16,
    "dword": 32,
    "qword": 64,
    "tbyte": 80,
    "xmmword": 128,
    "ymmword": 256,
    "zmmword": 512
}


class _X86IntelLineParser(AsmLineParser):
    """
    Parser of a single line of x86 assembly in Intel syntax.

    Implements the ISA-specific hooks of AsmLineParser: extraction of the instruction name
    (including prefixes), extraction of the operand strings, and matching of an assembly line
    against candidate instruction specs.
    """
    _curr_ln: int

    def __init__(self, isa_spec: InstructionSet, target_desc: TargetDesc) -> None:
        super().__init__(isa_spec, target_desc)
        self._comment_char = "#"

    # ----------------------------------------------------------------------------------------------
    # Implementation of ISA-specific hooks
    def _tokenize(self, line: str) -> List[str]:
        """ Tokenization hook; unused here, so it always returns an empty list """
        return []  # no need to tokenize in this implementation

    def _get_instruction_name(self, line: str, _: List[str]) -> str:
        """
        Get the name of the instruction from an assembly line, including prefixes

        :param line: the assembly line
        :param _: unused (tokens)
        :return: all leading prefixes and the first non-prefix word, joined by single spaces;
                 if the line contains only prefixes, the result ends with a space
        """
        name = ""
        for word in line.split():
            if word in _ASM_PREFIXES:
                name += word + " "
                continue
            name += word
            break
        return name

    def _get_instruction_operands(self, line: str, name: str, tokens: List[str]) -> List[str]:
        """
        Get the list of operand strings from an assembly line

        :param line: the assembly line
        :param name: the instruction name as returned by `_get_instruction_name`
        :param tokens: unused
        :return: comma-separated operands with the surrounding spaces removed;
                 an empty list if nothing but whitespace follows the instruction name
        """
        remainder = line.removeprefix(name)
        # a blank remainder (e.g., trailing spaces after the mnemonic) means "no operands";
        # without this check it would be reported as a single empty operand
        if not remainder.strip():
            return []
        return [operand.strip() for operand in remainder.split(",")]

    def _get_initial_candidate_specs(self, line: str, _: str) -> List[InstructionSpec]:
        """
        Get the list of candidate specs for an instruction with the given name

        The lookup key is built from the prefixes (kept as-is) and the first non-prefix word,
        which is replaced by its canonical name if it is listed in _ASM_SYNONYMS.

        :param line: the assembly line
        :param _: unused (instruction name)
        :return: the specs registered under the key; an empty list if there are none
                 or if the line contains nothing but prefixes
        """
        key = ""
        for word in line.split():
            # include prefixes in the key
            if word in _ASM_PREFIXES:
                key += word + " "
                continue

            # fix jump name
            key += _ASM_SYNONYMS.get(word, word)
            return self._instruction_map.get(key, [])
        return []

    def _check_if_spec_matches(self, spec: InstructionSpec, operands_raw: List[str]) -> bool:
        """
        Check if the given spec matches the given list of operand strings

        Each operand string is classified by its shape (label, memory address, immediate,
        or - by exclusion - register) and compared with the operand spec at the same position.

        :param spec: the candidate instruction spec
        :param operands_raw: operand strings as returned by `_get_instruction_operands`
        :return: True if the number of operands and the type of every operand match
        :raises: whatever `asm_parser_assert` raises when a memory operand
                 starts with an unknown size keyword
        """
        # pylint: disable=too-many-return-statements  # justified for selectors

        if len(spec.operands) != len(operands_raw):
            return False

        for op_id, op_raw in enumerate(operands_raw):
            op_spec = spec.operands[op_id]

            # match label
            # (startswith instead of op_raw[0]: an empty operand, e.g., after a trailing comma,
            # must be rejected as a mismatch rather than crash with IndexError)
            if op_raw.startswith("."):
                if op_spec.type != OT.LABEL:
                    return False
                continue

            # match address
            if "[" in op_raw:
                if op_spec.type not in [OT.AGEN, OT.MEM]:
                    return False

                access_size = op_raw.split()[0]  # match address size
                if access_size == "ptr":
                    # our internal convention is that "ptr" prefix matches any size
                    continue

                asm_parser_assert(access_size in _MEMORY_SIZES, self._curr_ln,
                                  f"Pointer size must be declared explicitly: {op_raw}")
                if op_spec.width != _MEMORY_SIZES[access_size]:
                    return False
                continue

            # match immediate value
            if _PATTERN_CONST_BIN.match(op_raw) or \
                    _PATTERN_CONST_HEX.match(op_raw) or \
                    _PATTERN_CONST_INT.match(op_raw) or \
                    _PATTERN_CONST_SUM.match(op_raw):
                if op_spec.type != OT.IMM:
                    return False
                continue

            # match register
            if op_spec.type == OT.REG:
                if op_raw not in op_spec.values:
                    return False
                continue
            return False
        return True


# ==================================================================================================
# Public Interface: Parser of X86 assembly files
# ==================================================================================================
class X86AsmParser(AsmParser):
    """ AsmParser specialization for x86 assembly files; lines are parsed as Intel syntax """

    def __init__(self, isa_spec: InstructionSet, target_desc: TargetDesc) -> None:
        super().__init__(isa_spec, target_desc)

        # x86-specific line parser
        line_parser = _X86IntelLineParser(isa_spec, target_desc)
        self._line_parser = line_parser

        # x86 instruction handed to the asm patcher as the macro placeholder
        macro_placeholder = " nop qword ptr [rax + 0xff]"
        self._asm_patcher.set_macro_placeholder(macro_placeholder)


================================================
FILE: rvzr/arch/x86/config.py
================================================
"""
File: x86-specific Configuration Options

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from typing import List

# Allowed values of the x86-specific configuration options.
# Every list below is a set of admissible values; no entry is listed more than once.
_option_values = {
    # keys that can be set in the description of an actor
    'actor': [
        'name',
        'mode',
        'privilege_level',
        'data_properties',
        'data_ept_properties',
        'observer',
        'instruction_blocklist',
        'fault_blocklist',
    ],
    "actor_mode": [
        'host',
        'guest',
    ],
    "actor_privilege_level": [
        'kernel',
        'user',
    ],
    "actor_data_properties": [
        'present',
        'writable',
        'user',
        'write-through',
        'cache-disable',
        'accessed',
        'dirty',
        'executable',
        'reserved_bit',
        'randomized',
    ],
    "actor_data_ept_properties": [
        "present",
        "writable",
        "executable",
        "accessed",
        "dirty",
        'reserved_bit',
        'randomized',
    ],
    # instruction categories listed for the Unicorn-based model
    'unicorn_instruction_categories': [
        # Base x86 - user instructions
        "BASE-BINARY",
        "BASE-BITBYTE",
        "BASE-CMOV",
        "BASE-COND_BR",
        "BASE-CONVERT",
        "BASE-DATAXFER",
        "BASE-FLAGOP",
        "BASE-LOGICAL",
        "BASE-MISC",
        "BASE-NOP",
        "BASE-POP",
        "BASE-PUSH",
        "BASE-SEMAPHORE",
        "BASE-SETCC",
        "BASE-STRINGOP",
        "BASE-WIDENOP",

        # Base x86 - system instructions
        "BASE-INTERRUPT",
        # "BASE-ROTATE",      # Unknown bug in Unicorn - emulated incorrectly
        # "BASE-SHIFT",       # Unknown bug in Unicorn - emulated incorrectly
        # "BASE-UNCOND_BR",   # Not supported: Complex control flow
        # "BASE-CALL",        # Not supported: Complex control flow
        # "BASE-RET",         # Not supported: Complex control flow
        # "BASE-SEGOP",       # Not supported: System instructions
        # "BASE-IO",          # Not supported: System instructions
        # "BASE-IOSTRINGOP",  # Not supported: System instructions
        # "BASE-SYSCALL",     # Not supported: System instructions
        # "BASE-SYSRET",      # Not supported: System instructions
        "BASE-SYSTEM",
        "LONGMODE-CONVERT",
        "LONGMODE-DATAXFER",
        "LONGMODE-SEMAPHORE",
        "LONGMODE-SYSCALL",
        "LONGMODE-SYSRET",

        # SIMD extensions
        "SSE-SSE",
        "SSE-DATAXFER",
        "SSE-MISC",
        "SSE-LOGICAL_FP",
        # "SSE-CONVERT",  # require MMX
        # "SSE-PREFETCH",  # prefetch does not trigger a mem access in unicorn
        "SSE2-SSE",
        "SSE2-DATAXFER",
        "SSE2-MISC",
        "SSE2-LOGICAL_FP",
        "SSE2-LOGICAL",
        # "SSE2-CONVERT",  # require MMX
        # "SSE2-MMX",   # require MMX
        "SSE3-SSE",
        "SSE3-DATAXFER",
        # "SSE4-SSE",  # not tested yet
        "SSE4-LOGICAL",
        "SSE4a-BITBYTE",
        "SSE4a-DATAXFER",

        # Misc
        "CLFLUSHOPT-CLFLUSHOPT",
        "CLFSH-MISC",
        # "MPX-MPX",  # no longer supported
        "SMX-SYSTEM",
        "VTX-VTX",
        "XSAVE-XSAVE",
    ],
    # instruction categories listed for the DR-based model
    "dr_instruction_categories": [
        # Base x86 - user instructions
        "BASE-BINARY",
        "BASE-BITBYTE",
        "BASE-CMOV",
        "BASE-COND_BR",
        "BASE-CONVERT",
        "BASE-DATAXFER",
        "BASE-FLAGOP",
        "BASE-LOGICAL",
        "BASE-MISC",
        "BASE-NOP",
        "BASE-POP",
        "BASE-PUSH",
        "BASE-SEMAPHORE",
        "BASE-SETCC",
        "BASE-STRINGOP",
        "BASE-WIDENOP",

        # Base x86 - system instructions
        "BASE-INTERRUPT",
        "BASE-ROTATE",
        "BASE-SHIFT",
        # "BASE-UNCOND_BR",   # Not supported: Complex control flow
        # "BASE-CALL",        # Not supported: Complex control flow
        # "BASE-RET",         # Not supported: Complex control flow
        # "BASE-SEGOP",       # Not supported: System instructions
        # "BASE-IO",          # Not supported: System instructions
        # "BASE-IOSTRINGOP",  # Not supported: System instructions
        # "BASE-SYSCALL",     # Not supported: System instructions
        # "BASE-SYSRET",      # Not supported: System instructions
        "BASE-SYSTEM",
        "LONGMODE-CONVERT",
        "LONGMODE-DATAXFER",
        "LONGMODE-SEMAPHORE",
        "LONGMODE-SYSCALL",
        "LONGMODE-SYSRET",

        # Extensions and the remaining long-mode categories
        # (the BASE-* and LONGMODE-* categories already listed above are not repeated here)
        "3DNOW_PREFETCH-PREFETCH",
        "ADOX_ADCX-ADOX_ADCX",
        "LONGMODE-POP",
        "LONGMODE-PUSH",
        "MMX-MMX",
        "MMX-LOGICAL",
        "MMX-DATAXFER",
        "SSE2-MMX",
        "SSE3-MMX",
        "SSSE3-MMX",
        "SSE-CONVERT",
        "SSE-DATAXFER",
        "SSE-MISC",
        "SSE-PREFETCH",
        "SSE-SSE",
        "SSE2-CONVERT",
        "SSE2-DATAXFER",
        "SSE2-LOGICAL",
        "SSE2-MISC",
        "SSE2-SSE",
        "SSE3-DATAXFER",
        "SSE3-SSE",
        "SSSE3-SSE",
        "SSE4-LOGICAL",
        "SSE4-SSE",
        "AVX-AVX",
        "AVX-BROADCAST",
        "AVX-DATAXFER",
        "AVX-LOGICAL",
        "AVX-STTNI",
        "AVX2-AVX2",
        "AVX2-BROADCAST",
        "AVX2-DATAXFER",
        "AVX2-LOGICAL",
        "AES-AES",
        "AVXAES-AES",
        "BMI1-BMI1",
        "BMI2-BMI2",
        "MOVBE-DATAXFER",
        "LZCNT-LZCNT",
        "PCLMULQDQ-PCLMULQDQ",
    ],
}

# by default, we always handle page faults
# (the entries are fault mnemonics, such as "PF")
_handled_faults: List[str] = ["PF"]

# Boolean x86-specific options; the string literal under each option is its description
x86_executor_enable_prefetcher: bool = False
""" x86_executor_enable_prefetcher: enable all prefetchers"""
x86_executor_enable_ssbp_patch: bool = True
""" x86_executor_enable_ssbp_patch: enable a patch against Speculative Store Bypass"""
x86_enable_hpa_gpa_collisions: bool = False
""" x86_enable_hpa_gpa_collisions: enable collisions between HPA and GPA;
useful for testing Foreshadow-like leaks"""
x86_disable_div64: bool = True
""" x86_disable_div64: do not generate 64-bit division instructions """
x86_generator_align_locks: bool = True
""" x86_generator_align_locks: align all generated locks to 8 bytes """

# x86 default for the list of tested instruction categories
instruction_categories: List[str] = ["BASE-BINARY", "BASE-BITBYTE", "BASE-COND_BR"]
""" instruction_categories: a default list of tested instruction categories """

# Instructions that are known to be problematic (the reason is given next to each entry).
# The whole list is appended to the default instruction_blocklist.
_buggy_instructions: List[str] = [
    "sti",  # enables interrupts
    "cli",  # disables interrupts; blocked just in case
    "xlat",  # requires support of segment registers
    "xlatb",  # requires support of segment registers
    "cmpxchg8b",  # known bug: doesn't execute the mem. access hook
    "lock cmpxchg8b",  # https://github.com/unicorn-engine/unicorn/issues/990
    "cmpxchg16b",  # known bug: doesn't execute the mem. access hook
    "lock cmpxchg16b",  # https://github.com/unicorn-engine/unicorn/issues/990
    "cpuid",  # causes false positives: the model and the CPU will likely have different values
    "cmpps",  # causes crash
    "cmpss",  # causes crash
    'cmppd',  # causes crash
    'cmpsd',  # causes crash
    'movq2dq',
    'movdq2q',
    'rcpps',  # incorrect emulation
    'rcpss',  # incorrect emulation
    #
    'pcmpestriq',  # conflicting operand size modifiers
    'pcmpestrmq',  # conflicting operand size modifiers
    'vpcmpestriq',  # conflicting operand size modifiers
    'vpcmpestrmq',  # conflicting operand size modifiers
    #
    'maskmovdqu',  # non-temp
    'maskmovq',  # non-temp
    'vmaskmovdqu',  # non-temp
    'vmaskmovq',  # non-temp
]

# x86 default for the list of blocked instructions
instruction_blocklist: List[str] = [
    # Hard to fix:
    # - Requires complex instrumentation
    "enterw", "enter", "leavew", "leave",
    # - requires support of all possible interrupts
    "int",
    # - system management instruction
    "encls", "vmxon", "stgi", "skinit", "ldmxcsr", "stmxcsr",

    # - not supported
    "lfence", "mfence", "sfence", "clflush", "clflushopt",

    # - under construction
    # -- trigger FPVI (we have neither a contract nor an instrumentation for it yet)
    "divps", "divss", 'divpd', 'divsd',
    "mulss", "mulps", 'mulpd', 'mulsd',
    "rsqrtps", "rsqrtss", "sqrtps", "sqrtss", 'sqrtpd', 'sqrtsd',
    'addps', 'addss', 'addpd', 'addsd',
    'subps', 'subss', 'subpd', 'subsd',
    'addsubpd', 'addsubps', 'haddpd', 'haddps', 'hsubpd', 'hsubps',
]  # yapf: disable
# the known-buggy instructions are blocked by default as well
instruction_blocklist.extend(_buggy_instructions)

# x86 executor internally uses R8...R15, RSP, RBP and, thus, they are excluded
# (together with their 32-, 16- and 8-bit sub-registers)
# segment registers are also excluded as we don't support their handling so far
# same for CR* and DR*
register_blocklist: List[str] = [
    # free - rax, rbx, rcx, rdx, rdi, rsi
    'r8', 'r9', 'r10', 'r11', 'r12', 'r13', 'r14', 'r15', 'rsp', 'rbp',
    'r8d', 'r9d', 'r10d', 'r11d', 'r12d', 'r13d', 'r14d', 'r15d', 'esp', 'ebp',
    'r8w', 'r9w', 'r10w', 'r11w', 'r12w', 'r13w', 'r14w', 'r15w', 'sp', 'bp',
    'r8b', 'r9b', 'r10b', 'r11b', 'r12b', 'r13b', 'r14b', 'r15b', 'spl', 'bpl',
    'es', 'cs', 'ss', 'ds', 'fs', 'gs',
    'cr0', 'cr2', 'cr3', 'cr4', 'cr8',
    'dr0', 'dr1', 'dr2', 'dr3', 'dr4', 'dr5', 'dr6', 'dr7',
    "xcr0", "gdtr", "ldtr", "idtr", "tr", "fsbase", "gsbase", "msrs", "x87control", "tsc", "tscaux",
    "mxcsr",

    # XMM8-15 are somehow broken in Unicorn
    "xmm8", "xmm9", "xmm10", "xmm11", "xmm12", "xmm13", "xmm14", "xmm15",
    "ymm8", "ymm9", "ymm10", "ymm11", "ymm12", "ymm13", "ymm14", "ymm15",
]  # yapf: disable


# Fault names as used in the generator configuration -> mnemonic of the x86 exception;
# several generator faults may map to the same exception (e.g., both div-* faults map to DE)
_generator_fault_to_fault_name = {
    'div-by-zero': "DE",
    'div-overflow': "DE",
    'opcode-undefined': "UD",
    'breakpoint': "BP",
    'debug-register': "DB",
    'non-canonical-access': "GP",
    'user-to-kernel-access': "PF",
    'page-fault': "PF"
}

# Default description of an actor: a host actor named "main" that runs in kernel mode
# and is not an observer.
# NOTE(review): 'data_ept_properties' below contains the key 'user', which is not listed in
# _option_values['actor_data_ept_properties'] - confirm whether this is intended
_actor_default = {
    'name': "main",
    'mode': "host",
    'privilege_level': "kernel",
    'observer': False,
    # properties of the actor's data pages
    'data_properties': {
        'present': True,
        'writable': True,
        'user': False,
        'write-through': False,
        'cache-disable': False,
        'accessed': True,
        'dirty': True,
        'executable': False,
        'reserved_bit': False,
        'randomized': False,
    },
    # EPT counterpart of the properties above
    'data_ept_properties': {
        'present': True,
        'writable': True,
        'executable': False,
        'accessed': True,
        'dirty': True,
        'user': False,
        'reserved_bit': False,
        'randomized': False,
    },
    # NOTE(review): these sets are mutable objects stored in a module-level default -
    # presumably the consumer copies them per actor; verify
    'instruction_blocklist': set(),
    'fault_blocklist': set(),
}


================================================
FILE: rvzr/arch/x86/executor.py
================================================
"""
File: Implementation of executor for x86 architecture

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from typing import Dict, Final

from rvzr.executor import Executor, km_write
from rvzr.config import CONF, ConfigException
from rvzr.target_desc import TargetDesc

# Fault mnemonic -> numeric ID of the fault.
# The ID is used as a bit position in the bitmap of handled faults
# (see X86Executor._identify_handled_faults).
# NOTE(review): the IDs appear to be the x86 exception vector numbers - confirm
FAULT_IDS: Final[Dict[str, int]] = {
    'DE': 0,
    'DB': 1,
    'NMI': 2,
    'BP': 3,
    'OF': 4,
    'BR': 5,
    'UD': 6,
    'NM': 7,
    'DF': 8,
    'OLD_MF': 9,
    'TS': 10,
    'NP': 11,
    'SS': 12,
    'GP': 13,
    'PF': 14,
    'SPURIOUS': 15,
    'MF': 16,
    'AC': 17,
    'MC': 18,
    'XF': 19,
    'IRET': 32
}


class X86Executor(Executor):
    """
    Vendor-independent x86 executor.

    On top of the generic Executor, it passes the x86-specific configuration options
    and the bitmap of handled faults to the executor kernel module.
    """

    def __init__(self, enable_mismatch_check_mode: bool = False):
        # The bitmap is computed before the base constructor is called.
        # NOTE(review): presumably the base constructor invokes
        # _set_vendor_specific_features(), which reads the bitmap - confirm
        self._handled_faults_bitmap: int = self._identify_handled_faults()
        super().__init__(enable_mismatch_check_mode)

    def _set_vendor_specific_features(self) -> None:
        """ Write the x86-specific settings into the files under /sys/rvzr_executor/ """
        # boolean configuration options and the files that receive them as "1"/"0"
        boolean_switches = (
            ('x86_executor_enable_ssbp_patch', "/sys/rvzr_executor/enable_ssbp_patch"),
            ('x86_executor_enable_prefetcher', "/sys/rvzr_executor/enable_prefetcher"),
            ('x86_enable_hpa_gpa_collisions', "/sys/rvzr_executor/enable_hpa_gpa_collisions"),
        )
        for option_name, sysfs_path in boolean_switches:
            flag = "1" if getattr(CONF, option_name) else "0"
            km_write(flag, sysfs_path)

        # the bitmap is written as a decimal string
        km_write(str(self._handled_faults_bitmap), "/sys/rvzr_executor/handled_faults")

    def _identify_handled_faults(self) -> int:
        """
        Encode the configured list of handled faults as a bitmap.

        :return: integer with bit FAULT_IDS[name] set for every configured fault name;
                 names that are missing in FAULT_IDS are skipped
        """
        bitmap = 0
        for fault_name in CONF._handled_faults:  # type: ignore  # pylint: disable=protected-access
            bit_position = FAULT_IDS.get(fault_name)
            if bit_position is not None:
                bitmap |= 1 << bit_position
        return bitmap


class X86IntelExecutor(X86Executor):
    """ Executor for Intel CPUs; refuses to be created on a CPU of another vendor """

    def __init__(self, enable_mismatch_check_mode: bool = False):
        super().__init__(enable_mismatch_check_mode)

        # the vendor is checked only after the base executor has been initialized
        self._vendor = TargetDesc.get_vendor()
        if self._vendor == "Intel":
            return
        raise ConfigException(
            "Attempting to run Intel executor on a non-Intel CPUs!\n"
            "Change the `executor` configuration option to the appropriate vendor value.")


class X86AMDExecutor(X86Executor):
    """ Executor for AMD CPUs; refuses to be created on a CPU of another vendor """

    def __init__(self, enable_mismatch_check_mode: bool = False):
        super().__init__(enable_mismatch_check_mode)

        # the vendor is checked only after the base executor has been initialized
        self._vendor = TargetDesc.get_vendor()
        if self._vendor == "AMD":
            return
        raise ConfigException(
            "Attempting to run AMD executor on a non-AMD CPUs!\n"
            "Change the `executor` configuration option to the appropriate vendor value.")


================================================
FILE: rvzr/arch/x86/fuzzer.py
================================================
"""
File: x86 implementation of the test case generator

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from __future__ import annotations

from typing import List, Generator, TYPE_CHECKING
from contextlib import contextmanager
import tempfile
import os

from rvzr.fuzzer import Fuzzer, ArchitecturalFuzzer, ArchDiffFuzzer, FuzzingMode
from rvzr.traces import HTrace
from rvzr.executor import Executor
from rvzr.tc_components.test_case_data import InputData
from rvzr.tc_components.test_case_code import TestCaseProgram
from rvzr.logs import warning
from rvzr.stats import FuzzingStats
from rvzr.config import CONF
from .config import _buggy_instructions
from .executor import X86IntelExecutor

if TYPE_CHECKING:
    from rvzr.isa_spec import InstructionSet
    from rvzr.asm_parser import AsmParser
    from rvzr.elf_parser import ELFParser
    from rvzr.code_generator import CodeGenerator

# Module-level statistics object; the filters of X86Fuzzer increment
# its `spec_filter` and `observ_filter` counters
STAT = FuzzingStats()


# ==================================================================================================
# X86-specific Implementation of the Fuzzer
# ==================================================================================================
class X86Fuzzer(Fuzzer):
    """
    Implementation of the standard fuzzing mode for the x86 architecture.

    Extends the generic Fuzzer class with:
    1. Checking of the instruction set for compatibility with the required faults
    2. Filtering of non-useful test cases with a Speculation Filter and an Observation Filter
    """

    executor: X86IntelExecutor

    # ----------------------------------------------------------------------------------------------
    # Public Interface
    def start(self, num_test_cases: int, num_inputs: int, timeout: int, nonstop: bool,
              save_violations: bool, type_: FuzzingMode) -> bool:
        """
        Check the instruction set against the configuration (may print warnings)
        and then start fuzzing via the generic implementation.

        All arguments are passed to Fuzzer.start unchanged.

        :return: the value returned by Fuzzer.start
        """
        _check_instruction_list(self._isa_spec)
        return super().start(num_test_cases, num_inputs, timeout, nonstop, save_violations, type_)

    # ----------------------------------------------------------------------------------------------
    # Private Methods
    def _filter(self, test_case: TestCaseProgram, inputs: List[InputData]) -> bool:
        """
        This function implements a multi-stage algorithm that gradually filters out
        uninteresting test cases

        :param test_case: the target test case
        :param inputs: list of inputs to be tested
        :return: True if the test case should be filtered out; False otherwise
        """
        # Exit if all filters are disabled
        if not CONF.enable_speculation_filter and not CONF.enable_observation_filter:
            return False

        # Number of repetitions for each input
        reps = CONF.executor_filtering_repetitions

        # The filters run in the executor's quick-and-dirty mode to speed up the execution;
        # the mode is switched off again when the block is left
        with _quick_and_dirty_mode(self.executor):
            # Collect hardware traces for the test case
            try:
                self.executor.load_test_case(test_case)
                org_htraces = self.executor.trace_test_case(inputs, reps)
            except IOError:
                return True  # the test case cannot be executed; filter it out

            if self._speculation_filter(org_htraces):
                return True

            if self._observation_filter(test_case, inputs, reps, org_htraces):
                return True

            return False

    @staticmethod
    def _speculation_filter(htraces: List[HTrace]) -> bool:
        """
        Execute on the test case on the HW and monitor PFCs
        if there are no mispredictions, this test case is unlikely
        to produce a violation, so just move on to the next one

        The test case is kept as soon as one trace has `pfc[0] == 0` (an error indicator),
        `pfc[0] > pfc[1]`, or `pfc[2] > 0`, where `pfc` is the result of `get_max_pfc()`.

        :param htraces: list of HTrace objects collected while executing the test case
        :return: True if the test case should be filtered out; False otherwise
        """
        if not CONF.enable_speculation_filter:
            return False

        for htrace in htraces:
            pfc_values = htrace.get_max_pfc()
            if pfc_values[0] == 0:  # zero indicates an error; filtering is not possible
                return False
            if pfc_values[0] > pfc_values[1] or pfc_values[2] > 0:
                return False
        STAT.spec_filter += 1
        return True

    def _observation_filter(self, test_case: TestCaseProgram, inputs: List[InputData], reps: int,
                            org_htraces: List[HTrace]) -> bool:
        """
        Check if any of the htraces contain a speculative cache eviction
        for this create a fenced version of the test case and collect traces for it

        :param test_case: the target test case
        :param inputs: list of inputs to be tested
        :param reps: number of repetitions for each input
        :param org_htraces: list of HTrace objects collected while executing the test case
        :return: True if the test case should be filtered out; False otherwise
        """
        if not CONF.enable_observation_filter:
            return False

        # Reserve a unique file name for the fenced test case. The file is created with
        # delete=False because it is accessed by name after the handle is closed,
        # hence it has to be removed explicitly.
        with tempfile.NamedTemporaryFile(delete=False) as fenced:
            fenced_name = fenced.name
        try:
            fenced_test_case = _create_fenced_test_case(test_case.asm_path(), fenced_name,
                                                        self.asm_parser, self.code_gen,
                                                        self.elf_parser)
            try:
                self.executor.load_test_case(fenced_test_case)
                fenced_htraces = self.executor.trace_test_case(inputs, reps)
            except IOError:
                return True  # skip the test case if there is an error
        finally:
            # remove the temporary file on every path, including the error paths
            os.remove(fenced_name)

        # if fencing does not change any of the traces, the test case is filtered out
        # (the comparison stops at the first mismatch)
        traces_match = all(
            self.analyser.htraces_are_equivalent(fenced_htraces[i], org_htraces[i])
            for i in range(len(inputs)))
        if traces_match:
            STAT.observ_filter += 1
            return True

        return False

    def _adjust_config(self, existing_test_case: str) -> None:
        """ Adjust the configuration generically, then block instructions with unhandled faults """
        super()._adjust_config(existing_test_case)
        _update_instruction_list()


# ==================================================================================================
# Non-standard Fuzzers
# ==================================================================================================
class X86ArchitecturalFuzzer(ArchitecturalFuzzer):
    """
    ArchitecturalFuzzer for x86.

    Behaves like the generic ArchitecturalFuzzer, except that the instruction set is checked
    before fuzzing starts and the instruction blocklist is updated when the configuration
    is adjusted.
    """

    def start(self, num_test_cases: int, num_inputs: int, timeout: int, nonstop: bool,
              save_violations: bool, type_: FuzzingMode) -> bool:
        """ Check the instruction set (may print warnings) and delegate to the generic start """
        _check_instruction_list(self._isa_spec)
        result = super().start(num_test_cases, num_inputs, timeout, nonstop, save_violations,
                               type_)
        return result

    def _adjust_config(self, existing_test_case: str) -> None:
        """ Adjust the configuration generically, then block instructions with unhandled faults """
        super()._adjust_config(existing_test_case)
        _update_instruction_list()


class X86ArchDiffFuzzer(ArchDiffFuzzer):
    """
    Fuzzer that compares the execution of a test case with and without fences.
    If the results differ, it reports a violation.

    Used to detect architectural bugs caused by speculative execution.

    The x86 specifics are the instruction-set checks and the way
    the fenced version of a test case is created.
    """

    executor: X86IntelExecutor

    @staticmethod
    def _create_fenced_test_case(original_asm: str, fenced_asm: str, asm_parser: AsmParser,
                                 generator: CodeGenerator,
                                 elf_parser: ELFParser) -> TestCaseProgram:
        """ Create the fenced test case with the module-level x86 helper of the same name """
        fenced_test_case = _create_fenced_test_case(original_asm, fenced_asm, asm_parser,
                                                    generator, elf_parser)
        return fenced_test_case

    def start(self, num_test_cases: int, num_inputs: int, timeout: int, nonstop: bool,
              save_violations: bool, type_: FuzzingMode) -> bool:
        """ Check the instruction set (may print warnings) and delegate to the generic start """
        _check_instruction_list(self._isa_spec)
        result = super().start(num_test_cases, num_inputs, timeout, nonstop, save_violations,
                               type_)
        return result

    def _adjust_config(self, existing_test_case: str) -> None:
        """ Adjust the configuration generically, then block instructions with unhandled faults """
        super()._adjust_config(existing_test_case)
        _update_instruction_list()


# ==================================================================================================
# Helper functions
# ==================================================================================================
def _update_instruction_list() -> None:
    """
    Block the instructions whose faults are not enabled in the configuration.

    For every fault below that is missing in CONF.faults_allowlist, the instructions
    triggering it are appended to CONF.instruction_blocklist.

    Kept as a module-level function so that all x86 fuzzers in this file can share it.
    """
    # fault name -> instructions that trigger the fault
    fault_triggers = (
        ('opcode-undefined', ["ud", "ud2"]),
        ('breakpoint', ["int3"]),
        ('debug-register', ["int1"]),
    )
    for fault, instructions in fault_triggers:
        if fault in CONF.faults_allowlist:
            continue
        CONF.instruction_blocklist.extend(instructions)


def _check_instruction_list(instruction_set: InstructionSet) -> None:
    """
    Warn about mismatches between the allowed faults and the instruction set.

    A warning is printed for every allowed fault whose triggering instructions are absent
    from `instruction_set`, and for every known-problematic instruction that is present
    while test case generation is enabled.
    """
    available = {spec.name for spec in instruction_set.instructions}
    allowed_faults = CONF.faults_allowlist
    division_missing = 'div' not in available and 'idiv' not in available

    # (fault, "the instructions that trigger it are missing", warning text)
    fault_checks = (
        ('div-by-zero', division_missing,
         "div-by-zero enabled, but DIV/IDIV instructions are missing"),
        ('div-overflow', division_missing,
         "div-overflow enabled, but DIV/IDIV instructions are missing"),
        ('breakpoint', 'int3' not in available,
         "breakpoint enabled, but INT3 instruction is missing"),
        ('debug-register', 'int1' not in available,
         "debug-register enabled, but INT1 instruction is missing"),
    )
    for fault, is_missing, message in fault_checks:
        if fault in allowed_faults and is_missing:
            warning("fuzzer", message)

    # Print a warning if the instruction set contains instructions that are known to be problematic
    for inst_name in _buggy_instructions:
        if inst_name not in available:
            continue
        if not CONF.is_generation_enabled():
            continue
        warning(
            "fuzzer", f"Instruction {inst_name} is known to cause false positives\n"
            "Consider adding it to instruction_blocklist")


@contextmanager
def _quick_and_dirty_mode(executor: Executor) -> Generator[None, None, None]:
    """
    Run the body of a `with` statement with the executor's quick and dirty mode switched on.

    The mode is switched off again when the body finishes, including when it raises.
    """
    toggle = executor.set_quick_and_dirty
    try:
        toggle(True)
        yield
    finally:
        toggle(False)


def _create_fenced_test_case(original_asm: str, fenced_asm: str, asm_parser: AsmParser,
                             generator: CodeGenerator, elf_parser: ELFParser) -> TestCaseProgram:
    """
    Add fences to all instructions in the test case.

    Copies `original_asm` into `fenced_asm` line by line, writing an `lfence` after every
    line that is treated as a fenceable instruction, and parses the resulting file.

    :param original_asm: path to the assembly file of the original test case
    :param fenced_asm: path where the fenced copy is written (overwritten if it exists)
    :param asm_parser: parser used to load the fenced file
    :param generator: code generator passed through to the parser
    :param elf_parser: ELF parser passed through to the parser
    :return: the test case parsed from `fenced_asm`
    """
    directive_keywords = ("section", "syntax", "function", "macro")

    with open(original_asm, 'r') as f, open(fenced_asm, 'w') as fenced_file:
        lines = f.readlines()
        n_lines = len(lines)

        for i, raw_line in enumerate(lines):
            fenced_file.write(raw_line)
            line = raw_line.strip().lower()

            # no need to add fences after empty lines and comments
            if not line or line[0] == "#":
                continue

            # adding a fence after a jump instruction breaks assumptions of our asm parser;
            # this is an issue in the parser, and this check is a workaround
            if line[0] == "j" or "loop" in line:
                continue

            # don't add fences after assembler directives
            if any(keyword in line for keyword in directive_keywords):
                continue

            # stop adding fences after the test case exit;
            # the lines that follow it are not copied into the fenced file
            if "test_case_exit" in line:
                break

            # adding a fence before the landing pad will mess with the parsing algorithm,
            # and it won't have any meaningful effect anyways. So we skip it.
            # The bound check keeps the look-ahead inside the file when this is the last line
            if i + 1 < n_lines and "landing" in lines[i + 1]:
                continue

            # add fences after all other instructions
            fenced_file.write('lfence\n')

    return asm_parser.parse_file(fenced_asm, generator, elf_parser)


================================================
FILE: rvzr/arch/x86/generator.py
================================================
"""
File: x86 implementation of the test case generator

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from __future__ import annotations

import math
import re
import random
from copy import deepcopy
from dataclasses import dataclass
from typing import List, Dict, Set, TYPE_CHECKING, Union, Final, Tuple, Callable, Literal
from typing_extensions import assert_never

from rvzr.code_generator import CodeGenerator, Pass, Printer
from rvzr.config import CONF
from rvzr.sandbox import SandboxLayout, DataArea, PAGE_SIZE
from rvzr.instruction_spec import OT, InstructionSpec
from rvzr.tc_components.actor import ActorPL, ActorID
from rvzr.tc_components.instruction import Instruction, Operand, RegisterOp, FlagsOp, \
    MemoryOp, ImmediateOp, AgenOp, copy_op_with_flow_modification, \
    copy_inst_with_modification
from rvzr.tc_components.test_case_code import TestCaseProgram, BasicBlock, InstructionNode

from .target_desc import X86TargetDesc

if TYPE_CHECKING:
    from rvzr.elf_parser import ELFParser
    from rvzr.asm_parser import AsmParser
    from rvzr.isa_spec import InstructionSet
    from rvzr.target_desc import TargetDesc


# ==================================================================================================
# Private: Fault Type Identification
# ==================================================================================================
@dataclass
class _FaultFilter:
    """
    Local service class that records which fault types are allowed in test cases.

    Every attribute is True when the corresponding fault name is present in
    `CONF.faults_allowlist` at construction time.
    """

    def __init__(self) -> None:
        allowed = CONF.faults_allowlist
        self.div_by_zero: bool = 'div-by-zero' in allowed
        self.div_overflow: bool = 'div-overflow' in allowed
        self.non_canonical_access: bool = 'non-canonical-access' in allowed
        self.u2k_access: bool = 'user-to-kernel-access' in allowed


# ==================================================================================================
# Private: Assembly Printing
# ==================================================================================================
class _X86Printer(Printer):
    """ Printer that renders test case instructions as x86 assembly in Intel syntax. """
    target_desc: X86TargetDesc

    def __init__(self, target_desc: X86TargetDesc) -> None:
        super().__init__(target_desc)
        self.prologue_template = [".intel_syntax noprefix\n"]
        self.epilogue_template = [".section .data.main\n", ".test_case_exit:nop\n"]

    def _instruction_to_str(self, inst: Instruction) -> str:
        """ Render one instruction (or macro) as a line of assembly with an optional tag. """
        if inst.name == "macro":
            return self._macro_to_str(inst)

        operands = ", ".join(self._operand_to_str(op) for op in inst.operands)

        # the trailing comment tags instrumentation and non-removable instructions
        comment = ""
        if inst.is_instrumentation:
            comment = "# instrumentation"
        elif inst.is_noremove:
            comment = "# noremove"
        return f"{inst.name} {operands} {comment}"

    def _operand_to_str(self, op: Operand) -> str:
        """ Render an operand; memory and address operands get a size prefix and brackets. """
        if not isinstance(op, (MemoryOp, AgenOp)):
            return op.value

        prefix = self.target_desc.memory_addr_prefixes[op.width]
        return f"{prefix} [{op.value}]"

    def _macro_to_str(self, inst: Instruction) -> str:
        """ Render a macro as a label followed by a fixed placeholder NOP. """
        macro_placeholder = "nop qword ptr [rax + 0xff]"
        argument = inst.operands[1].value
        # macros without arguments are printed without the argument suffix
        suffix = "" if argument.lower() == ".noarg" else argument
        return f".macro{inst.operands[0].value}{suffix}: {macro_placeholder}"


# ==================================================================================================
# Private: Collection of Instrumentation Passes
# ==================================================================================================
class _X86NonCanonicalAddressPass(Pass):
    """
    A pass that picks a random memory access instruction and rewrites it so that
    it accesses a non-canonical address.
    """
    _target_desc: X86TargetDesc

    def __init__(self, target_desc: X86TargetDesc) -> None:
        super().__init__()
        self._target_desc = target_desc

    def run_on_test_case(self, test_case: TestCaseProgram) -> None:
        """ Instrument at most one memory access in the whole test case. """
        for bb in test_case.iter_basic_blocks():
            # generated (non-instrumentation, non-template) memory accesses;
            # DIV/IDIV are excluded because the instrumentation is difficult to combine
            candidates = [
                node for node in bb.iter_nodes()
                if not (node.instruction.is_instrumentation or node.instruction.is_from_template)
                and node.instruction.name not in ["div", "idiv"]
                and node.instruction.has_mem_operand(True)
            ]

            # instrument random memory access instructions
            upper_bound = len(candidates)
            for node in candidates:
                if random.randint(0, upper_bound) != 0:
                    continue
                self._instrument(node, bb)

                # Make sure #GP happens only once. Otherwise Unicorn keeps raising an exception
                # when rolling back to the end of the code
                return

    def _instrument(self, node: InstructionNode, parent: BasicBlock) -> None:
        """
        Make the memory access of the given instruction non-canonical.

        The address is computed into a scratch register, XOR-ed with a random mask placed
        in the upper 16 bits, and the memory operand is replaced with that register.
        Instructions without explicit memory operands, or with implicit ones, are skipped.
        """
        # pylint: disable = too-many-locals
        # NOTE: That's a fairly complex instrumentation, so the number of locals is justified
        instr = node.instruction

        # Register source operands; the mask register must not clash with them
        src_registers = [op for op in instr.get_src_operands() if isinstance(op, RegisterOp)]

        # Check if the instrumentation is possible
        explicit_mem = instr.get_mem_operands(include_explicit=True)
        implicit_mem = instr.get_mem_operands(include_explicit=False, include_implicit=True)
        if not explicit_mem or implicit_mem:
            return  # this instruction is hard to instrument; skip

        # Find registers suitable for the instrumentation
        assert len(explicit_mem) == 1, f"Unexpected instruction format {instr.name}"
        mem_operand: Operand = explicit_mem[0]
        mask_reg = self._find_mask_register(src_registers)
        offset_reg = self._find_offset_register(instr)

        # Random bits shifted into positions 48..63
        mask = hex((random.getrandbits(16) << 48))

        # Instrumentation sequence, inserted right before the instruction:
        #  lea offset_reg, [mem_operand]
        #  mov mask_reg, mask
        #  xor offset_reg, mask_reg
        compute_address = Instruction("lea", is_instrumentation=True)
        compute_address.add_op(RegisterOp(offset_reg, 64, False, True))
        compute_address.add_op(MemoryOp(mem_operand.value, 64, True, False))
        parent.insert_before(node, compute_address)

        load_mask = Instruction("mov", is_instrumentation=True)
        load_mask.add_op(RegisterOp(mask_reg, 64, True, True))
        load_mask.add_op(ImmediateOp(mask, 64))
        parent.insert_before(node, load_mask)

        apply_mask = Instruction("xor", is_instrumentation=True)
        apply_mask.add_op(RegisterOp(offset_reg, 64, True, True))
        apply_mask.add_op(RegisterOp(mask_reg, 64, True, False))
        parent.insert_before(node, apply_mask)

        # Point the memory operand at the register that holds the masked address
        for idx, op in enumerate(instr.operands):
            if op == mem_operand:
                assert isinstance(op, MemoryOp)
                instr.operands[idx] = MemoryOp(offset_reg, op.width, op.src, op.dest)

    def _find_mask_register(self, src_operands: List[RegisterOp]) -> str:
        """ Pick RAX for the mask, or RBX when RAX is used by one of the source operands. """
        # Do not overwrite offset register with mask
        preferred, fallback = "rax", "rbx"
        normalized = self._target_desc.reg_normalized
        mask_reg = preferred
        for operand in src_operands:
            for reg in re.split(r'\+|-|\*| ', operand.value):
                if normalized[mask_reg] == normalized[reg]:
                    mask_reg = fallback
        return mask_reg

    def _find_offset_register(self, inst: Instruction) -> str:
        """ Pick RCX for the address, or RDX when RCX is a register operand of `inst`. """
        # Do not reuse destination register
        preferred, fallback = "rcx", "rdx"
        normalized = self._target_desc.reg_normalized
        offset_reg = preferred
        for op in inst.get_all_operands():
            if isinstance(op, RegisterOp) and normalized[offset_reg] == normalized[op.value]:
                offset_reg = fallback
        return offset_reg


class _X86U2KAccessPass(Pass):
    """
    User-to-Kernel Access Instrumentation Pass.

    This pass instruments user-privilege actors to perform memory accesses targeting
    the kernel actor's (actor 0) FAULTY data area. This creates cross-privilege-level
    memory access patterns useful for detecting CPU vulnerabilities like Meltdown.

    The pass randomly selects memory access instructions in user actors and modifies
    their memory operands to access kernel memory by calculating and applying a fixed
    offset based on the sandbox memory layout.

    IMPORTANT: This pass must run after _X86SandboxPass because it modifies the
    sandboxing instrumentation to ensure memory accesses target a single page.
    """

    def run_on_test_case(self, test_case: TestCaseProgram) -> None:
        """
        Identify and instrument memory accesses in user-privilege actors.

        :param test_case: The test case to process
        """
        # Use enumeration order as actor ID
        # FIXME: This is potentially fragile as it assumes that the sections in the binary
        # will be ordered the same way as the actors were defined in the test case, which
        # may not always hold true. However, we cannot get the actual section ID here because
        # the assembly is not yet generated, so there is nothing to assemble. It's a chicken-and-egg
        # problem. Thus, for now, we have to rely on this assumption.
        for sec_id, sec in enumerate(test_case):
            owner = sec.owner
            # Only instrument user-privilege actors (kernel accesses don't trigger Meltdown)
            if owner.privilege_level != ActorPL.USER:
                continue

            for func in sec:
                for bb in func:
                    # The candidate list is rebuilt for every basic block so that each
                    # instruction gets exactly one chance of being instrumented;
                    # instrumenting the same instruction twice would apply the offset twice
                    to_instrument: List[InstructionNode] = []
                    for node in bb.iter_nodes():
                        instr = node.instruction
                        # Skip instrumentation code and template code
                        if instr.is_instrumentation or instr.is_from_template:
                            continue
                        # Skip div/idiv as instrumentation interferes with their operand constraints
                        if instr.name in ["div", "idiv"]:
                            continue
                        if instr.has_mem_operand(False):
                            to_instrument.append(node)

                    for node in to_instrument:
                        # Randomly select instructions based on avg_mem_accesses config
                        probability = 1 / CONF.avg_mem_accesses
                        if random.random() > probability:
                            continue

                        self._instrument(node, bb, sec_id)

    def _instrument(self, node: InstructionNode, _: BasicBlock, owner_id: ActorID) -> None:
        """
        Modify a memory access instruction to target kernel memory instead of user memory.
        :param node: The instruction node to instrument
        :param _: The parent basic block (unused)
        :param owner_id: The actor ID of the instruction's owner (used for offset calculation)
        """
        instr = node.instruction

        # Select which memory operand to modify (random if instruction has multiple)
        mem_operands: List[MemoryOp] = instr.get_mem_operands(True)
        if not mem_operands:
            return  # nothing to redirect; leave the instruction untouched
        if len(mem_operands) == 1:
            mem_operand = mem_operands[0]
        else:
            mem_operand = random.choice(mem_operands)

        # Calculate the memory offset from user's MAIN area to kernel's FAULTY area.
        # We use a dummy SandboxLayout with base (0,0) to compute the relative offset
        # between the two memory regions based on their positions in the sandbox layout.
        layout = SandboxLayout((0, 0), owner_id)
        user_main_start = layout.get_data_addr(DataArea.MAIN, owner_id)
        kernel_faulty_start = layout.get_data_addr(DataArea.FAULTY, 0)
        offset = user_main_start - kernel_faulty_start

        # Redirect the memory access to kernel memory by subtracting the offset
        mem_operand.value += " - " + str(offset)

        # Adjust sandboxing masks added by X86SandboxPass to target a single page.
        # X86SandboxPass adds AND instructions to mask memory addresses to stay within
        # the actor's data sandbox. We need to reduce these masks to PAGE_SIZE to ensure
        # the cross-privilege access targets only the kernel's FAULTY page.
        # The walk covers the contiguous run of instrumentation instructions that
        # immediately precedes the instrumented instruction.
        previous_node = node.previous
        while previous_node and previous_node.instruction.is_instrumentation:
            for op in previous_node.instruction.operands:
                if not isinstance(op, ImmediateOp):
                    continue
                mask_value = int(op.value, base=0)
                if mask_value > PAGE_SIZE:
                    mask_value %= PAGE_SIZE
                op.value = bin(mask_value)
            previous_node = previous_node.previous


# Names of the instruction groups that _X86SandboxPass collects and sandboxes separately
_DispatcherKey = Literal["memory", "division", "bit_test", "repeated", "corrupted_cf", "enclu"]
# For each group: the instruction nodes collected for it, and the callable that
# sandboxes a single node given the node and its parent basic block
_SandboxDispatcher = Dict[_DispatcherKey, Tuple[List[InstructionNode],
                                                Callable[[InstructionNode, BasicBlock], None]]]


class _X86SandboxPass(Pass):
    """
    A pass that instruments the test case to prevent certain types of faults,
    including:
    - division by zero
    - division overflow
    - out-of-sandbox memory accesses
    - CF corruption
    - invalid ENCLU operands
    """

    mask_3bits = "0b111"
    bit_test_names = ["bt", "btc", "btr", "bts", "lock bt", "lock btc", "lock btr", "lock bts"]

    def __init__(self, target_desc: TargetDesc, faults: _FaultFilter) -> None:
        """
        Store the target description and fault filter, and precompute the address mask.

        :param target_desc: description of the target architecture
        :param faults: filter that tells which fault types are allowed in test cases
        """
        super().__init__()
        self.target_desc = target_desc
        self.faults = faults

        # The mask has one set bit per address bit of the MAIN + FAULTY data areas.
        # math.log2 is used instead of math.log(x, 2) because the latter is a quotient of
        # two floating-point logarithms, and truncating an inexact result with int()
        # could produce a mask that is one bit too short
        size_of_directly_accessible_memory = SandboxLayout.data_area_size(DataArea.MAIN) \
            + SandboxLayout.data_area_size(DataArea.FAULTY)
        mask_width = int(math.log2(size_of_directly_accessible_memory))
        self.sandbox_address_mask = "0b" + "1" * mask_width

    def run_on_test_case(self, test_case: TestCaseProgram) -> None:
        """
        Sandbox the instructions of the test case, one basic block at a time.

        Instrumentation and template instructions are left alone. Every other instruction
        is added to the "memory" group if it has a memory operand and, independently,
        to at most one of the remaining groups. The groups are then processed in
        the order in which they are declared in the dispatcher.
        """
        dispatcher: _SandboxDispatcher = {
            "memory": ([], self._sandbox_memory_access),
            "division": ([], self._sandbox_division),
            "bit_test": ([], self._sandbox_bit_test),
            "repeated": ([], self._sandbox_repeated_instruction),
            "corrupted_cf": ([], self._sandbox_corrupted_cf),
            "enclu": ([], self._sandbox_enclu),
        }
        # direct access to the per-group node lists stored in the dispatcher
        pending = {key: nodes for key, (nodes, _) in dispatcher.items()}

        for bb in test_case.iter_basic_blocks():
            # every basic block starts with empty groups
            for nodes in pending.values():
                nodes.clear()

            # collect all instructions that require sandboxing
            for node in bb.iter_nodes():
                inst = node.instruction
                if inst.is_instrumentation or inst.is_from_template:
                    continue

                if inst.has_mem_operand(True):
                    pending["memory"].append(node)

                name = inst.name
                if name in ["div", "rex div", "idiv", "rex idiv"]:
                    pending["division"].append(node)
                elif name in self.bit_test_names:
                    pending["bit_test"].append(node)
                elif "rep" in name:
                    pending["repeated"].append(node)
                elif inst.category in ["BASE-ROTATE", "BASE-SHIFT"]:
                    pending["corrupted_cf"].append(node)
                elif name == "enclu":
                    pending["enclu"].append(node)

            # sandbox them
            for nodes, sandbox_func in dispatcher.values():
                for node in nodes:
                    sandbox_func(node, bb)

    def _sandbox_memory_access(self, node: InstructionNode, parent: BasicBlock) -> None:
        """
        Confine the memory accesses of an instruction to the area that starts at R14.

        An explicit memory operand has its address register masked and is rewritten to
        `r14 + <register>`. Implicit memory operands have their address registers masked,
        rebased onto R14 before the instruction, and restored after it.
        """
        instr = node.instruction
        flags = ("w", "w", "undef", "w", "w", "", "", "", "w")

        explicit_operands = instr.get_mem_operands(True)
        implicit_operands = instr.get_mem_operands(
            include_explicit=False, include_implicit=True)

        # Clear the low bits of the mask for wide explicit operands
        mask = self.sandbox_address_mask
        for min_width, cleared_bits in ((256, 5), (128, 4)):
            if any(op.width >= min_width for op in explicit_operands):
                mask = mask[:-cleared_bits] + "0" * cleared_bits
                break

        # FIXME: broken type
        if CONF.x86_generator_align_locks:  # type: ignore  # pylint: disable = no-member
            if "lock" in instr.name or instr.name == "xchg":
                mask = mask[:-3] + "0" * 3

        # Case 1: a single explicit memory operand
        if explicit_operands and not implicit_operands:
            assert len(explicit_operands) == 1, \
                f"Instructions with multiple memory accesses are not yet supported: {instr.name}"
            mem_operand = explicit_operands[0]
            address_reg = mem_operand.value
            imm_width = min(mem_operand.width, 32)

            apply_mask = Instruction("and", is_instrumentation=True)
            apply_mask.add_op(RegisterOp(address_reg, 64, True, True))
            apply_mask.add_op(ImmediateOp(mask, imm_width))
            apply_mask.add_op(FlagsOp(flags), True)
            parent.insert_before(node, apply_mask)

            instr.get_mem_operands(True)[0].value = "r14 + " + address_reg
            return

        # Case 2: implicit memory operands
        assert implicit_operands, "Attempt to sandbox an instruction without memory operands"

        # deduplicate operands, keeping the first operand seen for every address register
        uniq_operands: Dict[str, MemoryOp] = {}
        for operand in implicit_operands:
            uniq_operands.setdefault(operand.value, operand)

        # instrument each operand to sandbox the memory accesses
        for address_reg, mem_operand in uniq_operands.items():
            imm_width = min(mem_operand.width, 32)
            assert address_reg in self.target_desc.registers_by_size[64], \
                f"Unexpected address register {address_reg} used in {instr}"
            # NOTE(review): the register operands below are tagged with the width of the
            # memory operand, while the explicit-operand case uses 64 - confirm it is intended
            reg_width = mem_operand.width

            apply_mask = Instruction("and", is_instrumentation=True)
            apply_mask.add_op(RegisterOp(address_reg, reg_width, True, True))
            apply_mask.add_op(ImmediateOp(mask, imm_width))
            apply_mask.add_op(FlagsOp(flags), True)
            parent.insert_before(node, apply_mask)

            add_base = Instruction("add", is_instrumentation=True)
            add_base.add_op(RegisterOp(address_reg, reg_width, True, True))
            add_base.add_op(RegisterOp("r14", 64, True, False))
            add_base.add_op(FlagsOp(flags), True)
            parent.insert_before(node, add_base)

            # restore the original register value
            remove_base = Instruction("sub", is_instrumentation=True)
            remove_base.add_op(RegisterOp(address_reg, reg_width, True, True))
            remove_base.add_op(RegisterOp("r14", 64, True, False))
            remove_base.add_op(FlagsOp(flags), True)
            parent.insert_after(node, remove_base)

    def _sandbox_division(self, node: InstructionNode, parent: BasicBlock) -> None:
        """
        In the experiments where division errors are not permitted, we prevent them
        through code instrumentation.
        Specifically, we may need to prevent two types of faults:
        - division by zero
        - division overflow (i.e., quotient is larger than the destination register)

        A fault is permitted only if it is enabled in the fault filter and is not listed
        in the `fault_blocklist` of the actor that owns the parent basic block.

        To prevent div by zero we OR the divisor with a non-zero value:
            divisor = divisor | 1

        The mechanism for preventing div overflows depends on the division type:
        * for unsigned division, we first mask the upper half of the dividend with the divisor,
        which makes the quotient at most one bit larger than the destination, and then shift
        the result by one, thus compensating for the last one overflow bit.
            D = (D & divisor) >> 1
        * for signed division, we set the lower four bits of the divisor to 0b1000, which
        ensures that all positive divisor values are larger or equal to 8, and all negative
        values are smaller or equal to -8.
            divisor[0:3] = 0b1000
        We further constrain the division by clearing the sign bit of the dividend.
        Under these two constraints, an overflow is possible only when the dividend
        is larger or equal to (4 << div_size, e.g., for 32-bit division 4 * (2 ** 32)).
        Since the dividend is a combination of two registers (D << div_size + A),
        an overflow happens when D is larger or equal to 4. We ensure that it does not
        happen by masking the upper bits of D:
            D = D & 0b11

        There are also two corner cases:
            1) The divisor is D. This case is impossible to resolve, as far as I can tell,
            because our instrumentation would have to modify both the divisor and the dividend
            at the same time. We just give up in this case and delete the instruction.
            2) 8-bit division, where the dividend is the AX register alone.
            Here the instrumentation becomes too complicated, so we simply set AX to 1.

        In addition, 64-bit divisions are deleted altogether when `CONF.x86_disable_div64`
        is set.

        This instrumentation has a side effect of reducing the entropy of the division operands:
        For unsigned division:
            * entropy of the divisor is reduced by 1 bit
            * entropy of D is reduced by (divisor_value_size + 1) bits
        For signed division:
            * entropy of the divisor is reduced by 4 bits
            * entropy of D is reduced by (division_size - 2) bits (i.e., the resulting
              entropy of D is 2 bits, with the sign bit cleared)

        :param node: the node holding the DIV/IDIV instruction
        :param parent: the basic block that contains the node; instrumentation is inserted
                       into it, and the node may be deleted from it
        """
        # pylint: disable = too-many-locals
        # FIXME: this function has to be refactored to break it down into simpler parts

        inst = node.instruction

        # Determine what type of fault is allowed
        owner_name = parent.get_owner().name
        actor_blocklist = CONF.get_actors_conf()[owner_name]["fault_blocklist"]
        enable_div_by_zero = self.faults.div_by_zero & ("div-by-zero" not in actor_blocklist)
        enable_div_overflow = self.faults.div_overflow & ("div-overflow" not in actor_blocklist)

        # Copy div source operand and label it as a destination; we may need to modify it
        operand = inst.operands[0]
        assert isinstance(operand, (RegisterOp, MemoryOp)), \
               f"Unexpected operand type {operand}"
        divisor = copy_op_with_flow_modification(operand, dest=True)
        size = divisor.width

        # This option prevents triggering of Zero Division Injection in the tests
        # FIXME: Broken type hint
        if size == 64 and CONF.x86_disable_div64:  # type: ignore  # pylint: disable = no-member
            parent.delete(node)
            return

        # Prevent div by zero
        if not enable_div_by_zero:
            if "idiv" not in inst.name or enable_div_overflow:
                # for unsigned division and signed divisions with overflow permitted,
                # it is sufficient to OR the divisor with 1 to prevent div by zero
                instrumentation = Instruction("or", is_instrumentation=True) \
                    .add_op(divisor) \
                    .add_op(ImmediateOp("1", 8)) \
                    .add_op(FlagsOp(("w", "w", "undef", "w", "w", "", "", "", "w")), True)
                parent.insert_before(node, instrumentation)
            else:
                # for signed divisions with overflows forbidden,
                # we need to modify the divisor to make it both non-zero
                # and large enough to avoid overflows.
                # We have two cases here, positive and negative divisor values:

                # For positive divisors, we OR the divisor with 0b1000 to make sure
                # that the divisor is at least 8
                # (the value 8 comes from the instrumentation below, where
                # we make the dividend at most `(4 << div_size) - 1`)
                instrumentation = Instruction("or", is_instrumentation=True) \
                    .add_op(divisor) \
                    .add_op(ImmediateOp("0b1000", 8)) \
                    .add_op(FlagsOp(("w", "w", "undef", "w", "w", "", "", "", "w")), True)
                parent.insert_before(node, instrumentation)

                # For negative divisors, we clear the lower 3 bits of the divisor
                # (bit 3 was set by the OR above), thus making the value at most -8.
                # To this end, we AND the lower 8 bits of the divisor with
                # the bit mask 0b11111000
                divider_8_bit: Union[RegisterOp, MemoryOp]
                if isinstance(divisor, MemoryOp):
                    divider_8_bit = MemoryOp(divisor.value, 8, divisor.src, divisor.dest)
                elif isinstance(divisor, RegisterOp):
                    reg_normalized = self.target_desc.reg_normalized[divisor.value]
                    reg_8_bit = self.target_desc.reg_denormalized[reg_normalized][8]
                    divider_8_bit = RegisterOp(reg_8_bit, 8, divisor.src, divisor.dest)
                else:
                    assert_never(divisor)

                instrumentation = Instruction("and", is_instrumentation=True) \
                    .add_op(divider_8_bit) \
                    .add_op(ImmediateOp("0b11111000", 8)) \
                    .add_op(FlagsOp(("w", "w", "undef", "w", "w", "", "", "", "w")), True)
                parent.insert_before(node, instrumentation)

        # Nothing more to do when overflows are permitted
        if enable_div_overflow:
            return
        # Prevent div overflows:

        # Check for the cases that are impossible to instrument:
        # - division by D register
        # - division by a memory value with the RDX offset
        # - division where AX is both the dividend and the offset in memory
        if divisor.value in ["rdx", "edx", "dx", "dh", "dl"] \
           or "rdx" in divisor.value \
           or ("rax" in divisor.value and size == 8):
            parent.delete(node)
            return

        # Special case: dividend in AX
        # instrumentation: ax = 1
        if size == 8:
            instrumentation = Instruction("mov", is_instrumentation=True).\
                add_op(RegisterOp("ax", 16, False, True)).\
                add_op(ImmediateOp("1", 16))
            parent.insert_before(node, instrumentation)
            return

        # Normal case: the upper half of the dividend is in the D register of the division size
        d_register = {64: "rdx", 32: "edx", 16: "dx"}[size]

        # signed div
        if "idiv" in inst.name:
            # it's extremely hard to prevent overflows with large signed divisions
            # that's why we simplify the case by assigning zero to the upper bits of the dividend
            # instrumentation, thus making the dividend at most `(4 << div_size) - 1`
            # D = D & 3
            instrumentation = Instruction("and", is_instrumentation=True) \
                .add_op(RegisterOp(d_register, size, True, True)) \
                .add_op(ImmediateOp("0b11", 8)) \
                .add_op(FlagsOp(("w", "w", "undef", "w", "w", "", "", "", "w")), True)
            parent.insert_before(node, instrumentation)

        # unsigned div
        else:
            # instrumentation:
            # D = (D & divisor) >> 1  # ensure that D is always smaller than the divisor
            instrumentation = Instruction("and", is_instrumentation=True) \
                .add_op(RegisterOp(d_register, size, True, True)) \
                .add_op(divisor) \
                .add_op(FlagsOp(("w", "w", "undef", "w", "w", "", "", "", "w")), True)
            parent.insert_before(node, instrumentation)

            instrumentation = Instruction("shr", is_instrumentation=True) \
                .add_op(RegisterOp(d_register, size, True, True)) \
                .add_op(ImmediateOp("1", 8)) \
                .add_op(FlagsOp(("w", "w", "undef", "w", "w", "", "", "", "undef")), True)
            parent.insert_before(node, instrumentation)

    def _sandbox_bit_test(self, node: InstructionNode, parent: BasicBlock) -> None:
        """
        Constrain the bit offset of a memory-based BT* instruction.

        The address accessed by a BT* instruction is based on both of its operands.
        `sandbox_memory_access` takes care of the first operand; this function
        handles the second one (the bit offset), so that it stays within a byte.
        """
        bt_inst = node.instruction

        base = bt_inst.operands[0]
        if isinstance(base, RegisterOp):
            # register-only form: no memory is accessed, nothing to sandbox
            return

        bit_offset = bt_inst.operands[1]
        if isinstance(bit_offset, ImmediateOp):
            # immediate offset: overwrite it in place with a random value in 0..7
            bit_offset.value = str(random.randint(0, 7))
            return

        # the only remaining option is an offset stored in a register
        assert isinstance(bit_offset, RegisterOp)

        if base.value == bit_offset.value:
            # offset and address are the same operand value;
            # masking the offset would also change the address, so give up on the instruction
            parent.delete(node)
            return

        # mask the offset register in front of the instruction
        # (presumably `mask_3bits` keeps the three low bits - see its definition)
        writable_offset = copy_op_with_flow_modification(bit_offset, dest=True)
        mask_inst = Instruction("and", is_instrumentation=True) \
            .add_op(writable_offset) \
            .add_op(ImmediateOp(self.mask_3bits, 8)) \
            .add_op(FlagsOp(("w", "w", "undef", "w", "w", "", "", "", "w")), True)
        parent.insert_before(node, mask_inst)

    def _sandbox_repeated_instruction(self, node: InstructionNode, parent: BasicBlock) -> None:
        """
        Bound RCX in front of `node` by inserting two instrumentation instructions:
            AND rcx, 0xff
            ADD rcx, 1
        After them RCX is in the range 1..256.
        (RCX is presumably the repeat counter of the instrumented instruction.)
        """
        bound_rcx = Instruction("and", is_instrumentation=True) \
            .add_op(RegisterOp("rcx", 64, True, True)) \
            .add_op(ImmediateOp("0xff", 8)) \
            .add_op(FlagsOp(("w", "w", "undef", "w", "w", "", "", "", "w")), True)
        bump_rcx = Instruction("add", is_instrumentation=True) \
            .add_op(RegisterOp("rcx", 64, True, True)) \
            .add_op(ImmediateOp("1", 1)) \
            .add_op(FlagsOp(("w", "w", "w", "w", "w", "", "", "", "w")), True)

        # both go before the node, in program order: first the mask, then the increment
        for extra in (bound_rcx, bump_rcx):
            parent.insert_before(node, extra)

    def _sandbox_corrupted_cf(self, node: InstructionNode, parent: BasicBlock) -> None:
        """ Insert an `stc` instruction (writes CF) right after `node` """
        # FIXME: This should be a separate pass
        cf_only = FlagsOp(("w", "", "", "", "", "", "", "", ""))
        stc_inst = Instruction("stc", is_instrumentation=True).add_op(cf_only, True)
        parent.insert_after(node, stc_inst)

    def _sandbox_enclu(self, node: InstructionNode, parent: BasicBlock) -> None:
        """
        Load EAX with a randomly selected leaf number from a fixed list
        by inserting `mov eax, <leaf>` before `node`.
        """
        # FIXME: This should be a separate pass
        leaves = (
            "0",  # ereport
            "1",  # egetkey
            "4",  # eexit
            "5",  # eaccept
            "6",  # emodpe
            "7",  # eacceptcopy
        )
        leaf = ImmediateOp(random.choice(leaves), 1)
        load_leaf = Instruction("mov", is_instrumentation=True) \
            .add_op(RegisterOp("eax", 32, True, True)) \
            .add_op(leaf)
        parent.insert_before(node, load_leaf)

    @staticmethod
    def requires_sandbox(inst: InstructionSpec) -> bool:
        """ Check if the instruction requires instrumentation to prevent faults """
        if inst.has_mem_operand:
            return True
        if inst.name in ["div", "rex div"]:
            return True
        if inst.name in ["bt", "btc", "btr", "bts", "lock bt", "lock btc", "lock btr", "lock bts"]:
            return True
        if inst.category in ["BASE-SHIFT", "BASE-ROTATE"]:
            return True
        return False


class _X86PatchUndefinedFlagsPass(Pass):
    """
    Some instructions have undefined effect on FLAGS (e.g., SHL may or may not overwrite OF).
    This causes a mismatch between Model execution and Executor, if the undefined behavior
    is implemented differently. It leads to false positives.
    To prevent them, we analyse the test cases in search for the cases where an instruction
    with undefined flags is followed by an instruction that uses this flag. We then
    insert another random instruction in-between, such that this
    instruction overwrites the undefined flag.

    I.e., we replace
        SHL eax, eax  // undefined OF
        JNO .label    // uses OF
    with
        SHL eax, eax
        ADD ebx, ecx  // random instruction that overwrites OF
        JNO .label
    """
    # Instruction specs that may be used as patches: they write at least one flag,
    # read none, do not change the control flow, and do not require sandboxing
    patch_candidates: List[InstructionSpec]

    def __init__(self, instruction_set: InstructionSet, generator: CodeGenerator) -> None:
        """
        :param instruction_set: instruction set from which the patch candidates are selected
        :param generator: code generator used to instantiate the patch instructions
        """
        super().__init__()
        self.instruction_set = instruction_set
        self.generator = generator

        self.patch_candidates = []
        for instruction_spec in instruction_set.instructions:
            # we don't want to change the control flow
            if instruction_spec.is_control_flow:
                continue

            # check if the instruction is safe to use on its own
            if _X86SandboxPass.requires_sandbox(instruction_spec):
                continue

            # check if it overwrites flags and if creates new dependencies
            has_read = False
            has_write = False
            for op in instruction_spec.operands + instruction_spec.implicit_operands:
                if op.type == OT.FLAGS:
                    for f in op.values:
                        if f in ['r', 'r/w', 'r/cw']:
                            has_read = True
                        elif f in ['w']:
                            has_write = True
            if not has_read and has_write:
                self.patch_candidates.append(instruction_spec)

    def run_on_test_case(self, test_case: TestCaseProgram) -> None:
        """ Patch undefined flags in every basic block of the test case """
        for bb in test_case.iter_basic_blocks():
            self._patch_flags_in_bb(bb)

    def _patch_flags_in_bb(self, bb: BasicBlock) -> None:
        """
        Walk the basic block backwards, track which flags are read by the following
        instructions, and insert patch instructions after every instruction that leaves
        one of those flags undefined. Flags that are still required when the beginning of
        the block is reached are patched at the block entry.

        :param bb: basic block to patch (modified in place)
        :raises ValueError: if the block has no place for the entry patch, or if no
            suitable patch instruction exists (raised by `_find_flags_patch`)
        """
        # pylint: disable = too-many-branches
        # FIXME: This function was written in a hurry and needs to be refactored

        # get a list of all instruction nodes in the BB
        # (a snapshot: the patches inserted below are not revisited)
        all_instructions: List[InstructionNode] = list(bb.iter_nodes())

        # Initialize a list used to track the flags that have to be set
        flags_to_set: Set[str] = set()

        # Collect the flags read by the terminators (conditional jumps)
        # Note: we assume that terminators do not modify flags
        # and hence no patching is needed at this point
        for term in bb.terminators:
            flags = term.get_flags_operand()
            if flags:
                for f in flags.get_flags_by_type('read'):
                    flags_to_set.add(f)

        # Walk the instruction list in the reverse order
        # During the walk, track flags have undefined values and overwrite them by adding
        # extra instructions in-between
        while all_instructions:
            node = all_instructions.pop()
            inst = node.instruction
            flags = inst.get_flags_operand()

            # skip template instructions and instructions that do not read/write flags
            if inst.is_from_template or not flags:
                continue

            # fix undefined flags by adding another instruction in-between
            undef_flags = [i for i in flags.get_flags_by_type('undef') if i in flags_to_set]
            if undef_flags:
                patches = self._find_flags_patch(undef_flags, flags_to_set)
                # `patches` is an ordered sequence: a later patch may overwrite a flag that
                # an earlier patch leaves undefined. Every patch is inserted directly after
                # `node`, so we insert them in the reverse order to make the resulting code
                # execute them in the order returned by `_find_flags_patch`
                # (assumes that `insert_after` places the instruction immediately after `node`)
                for patch in reversed(patches):
                    bb.insert_after(node, patch)
                    # remove the flags overwritten by the patch
                    for f in patch.get_flags_operand().get_flags_by_type('write'):  # type: ignore
                        flags_to_set.discard(f)

            # remove the flags overwritten by the instruction
            for f in flags.get_flags_by_type('write'):
                flags_to_set.discard(f)

            # add new flag dependencies
            for f in flags.get_flags_by_type('read'):
                flags_to_set.add(f)

        # make sure that we do not have undefined flags when we enter the BB
        if flags_to_set:
            # find a place to insert the patches
            entry_node = bb.get_first(exclude_macros=True)
            if not entry_node:
                raise ValueError("X86PatchUndefinedFlagsPass: No place to insert a patch")

            # here the insertion order already matches the execution order,
            # because every patch is placed right before the (fixed) entry node
            patches = self._find_flags_patch(list(flags_to_set), flags_to_set)
            for patch in patches:
                bb.insert_before(entry_node, patch)

    def _find_flags_patch(self, undef_flags: List[str],
                          flags_to_set: Set[str]) -> List[Instruction]:
        """
        Find an instruction sequence that would overwrite a list of flags
        :param undef_flags: list of undefined flags that have to be overwritten
            by the patch instructions
        :param flags_to_set: list of flags that will be read by one of the following instructions,
            and thus should not be set to the undef state by the patch. This should be always
            a superset of or the same as undef_flags.
        :return: list of instructions that overwrite the undefined flags; the instructions
            are meant to be executed in the returned order
        :raises ValueError: if the patch candidates cannot cover all the undefined flags
        """
        org_undef = deepcopy(undef_flags)
        patches: List[Instruction] = []
        for instruction_spec in self.patch_candidates:
            patch = self.generator.generate_instruction(instruction_spec, True)
            patch_flags = patch.get_flags_operand()
            assert patch_flags

            # flags that are currently fine, but would become undefined because of the patch
            new_undef_flags = [
                i for i in patch_flags.get_flags_by_type('undef')
                if i not in undef_flags and i in flags_to_set
            ]
            # flags that would remain undefined after the patch
            not_patched_flags = [
                i for i in undef_flags if i not in patch_flags.get_flags_by_type('write')
            ]

            # accept the patch only if it makes progress and does not break other flags
            if not new_undef_flags and not_patched_flags != undef_flags:
                patches.append(patch)
                undef_flags = not_patched_flags
                if not undef_flags:
                    break

        if undef_flags:
            raise ValueError("Could not find an instruction to patch flags.\n"
                             f"  Initial flags to be patched: {org_undef}\n"
                             f"  Flags for which a patch was not found: {undef_flags}")

        return patches


class _X86PatchUndefinedResultPass(Pass):
    """
    Some instructions have undefined results when the source operand is zero.
    This pass patches such instructions (currently, BSF and BSR) to avoid
    the undefined behavior.
    """

    def run_on_test_case(self, test_case: TestCaseProgram) -> None:
        """ Patch all bit scan instructions that were not added by instrumentation/template """
        for bb in test_case.iter_basic_blocks():
            # collect the nodes first, because patching modifies the basic block
            scans = [
                n for n in bb.iter_nodes()
                if not n.instruction.is_instrumentation
                and not n.instruction.is_from_template
                and n.instruction.name in ["bsf", "bsr"]
            ]
            for scan_node in scans:
                self._patch_bit_scan(scan_node, bb)

    @staticmethod
    def _patch_bit_scan(node: InstructionNode, parent: BasicBlock) -> None:
        """
        Bit Scan instructions give an undefined result when the source operand is zero.
        To avoid it, OR the source operand with a non-zero mask before the instruction.

        :param node: node of the bit scan instruction
        :param parent: basic block that contains the node
        """
        # the source is the second operand
        scanned = node.instruction.operands[1]
        assert isinstance(scanned, (RegisterOp, MemoryOp)), \
               f"Unexpected operand type {scanned}"

        # the OR writes into the operand, hence we need a copy marked as a destination
        target = copy_op_with_flow_modification(scanned, dest=True)

        if target.width in [64, 32]:
            # wide operands use a fixed constant passed as a 32-bit immediate
            mask, mask_size = "0b1000000000000000000000000000000", 32
        else:
            # narrow operands: set the most significant bit of the operand
            mask, mask_size = bin(1 << (target.width - 1)), target.width

        set_bit = Instruction("or", is_instrumentation=True) \
            .add_op(target) \
            .add_op(ImmediateOp(mask, mask_size)) \
            .add_op(FlagsOp(("w", "w", "undef", "w", "w", "", "", "", "w")), True)
        parent.insert_before(node, set_bit)


class _X86PatchOpcodesPass(Pass):
    """
    Replaces assembly instructions with their opcodes.
    This is necessary to test instructions with multiple opcodes and
    the instructions that are not supported/not permitted by the standard
    assembler.
    """
    # instruction name -> list of raw encodings (as `.byte` arguments) to choose from
    _OPCODES: Final[Dict[str, List[str]]] = {
        "ud2": [
            "0x0f, 0x0b",  # UD2 instruction
            # invalid in 64-bit mode;
            # all the following opcodes are padded
            # with NOP to prevent misinterpretation by objdump
            "0x06, 0x90",  # 32-bit encoding of PUSH
            "0x07, 0x90",  # 32-bit encoding of POP
            "0x0e, 0x90",  # alternative 32-bit encoding of PUSH
            "0x16, 0x90",  # alternative 32-bit encoding of PUSH
            "0x17, 0x90",  # alternative 32-bit encoding of POP
            "0x1e, 0x90",  # alternative 32-bit encoding of PUSH
            "0x1f, 0x90",  # alternative 32-bit encoding of POP
            "0x27, 0x90",  # DAA
            "0x2f, 0x90",  # DAS
            "0x37, 0x90",  # AAA
            "0x3f, 0x90",  # AAS
            "0x60, 0x90",  # PUSHA
            "0x61, 0x90",  # POPA
            "0x62, 0x90",  # BOUND
            "0x82, 0x90",  # 32-bit aliases for logical instructions
            "0x9a, 0x90",  # 32-bit encoding of CALLF
            "0xc4, 0x90",  # LES
            "0xd4, 0x90",  # AAM
            "0xd5, 0x90",  # AAD
            "0xd6, 0x90",  # reserved
            "0xea, 0x90",  # 32-bit encoding of JMPF
        ],
        "int1": ["0xf1"]
    }

    def run_on_test_case(self, test_case: TestCaseProgram) -> None:
        """ Replace every instruction listed in `_OPCODES` with a raw `.byte` directive """
        for bb in test_case.iter_basic_blocks():
            # take a snapshot of the nodes to patch, because patching modifies the block;
            # instrumentation and template instructions are left untouched
            targets = [
                n for n in bb.iter_nodes()
                if not (n.instruction.is_instrumentation or n.instruction.is_from_template)
                and n.instruction.name in self._OPCODES
            ]
            for target in targets:
                self._instrument(target, bb)

    def _instrument(self, node: InstructionNode, parent: BasicBlock) -> None:
        """
        Swap the instruction in `node` for a copy whose name is a `.byte` directive
        with a randomly selected encoding.
        """
        original = node.instruction
        encoding = random.choice(self._OPCODES[original.name])
        raw_inst = copy_inst_with_modification(original, name=".byte " + encoding)

        # the replacement takes the place of the original node
        parent.insert_before(node, raw_inst)
        parent.delete(node)


# ==================================================================================================
# Public Interface
# ==================================================================================================
class X86Generator(CodeGenerator):
    """ x86-specific implementation of the test case program generator """

    _faults: _FaultFilter

    def __init__(self, seed: int, instruction_set: InstructionSet, target_desc: TargetDesc,
                 asm_parser: AsmParser, elf_parser: ELFParser) -> None:
        """ Initialize the generic generator and set up the x86 passes and printer """
        super().__init__(seed, instruction_set, target_desc, asm_parser, elf_parser)
        assert isinstance(self._target_desc, X86TargetDesc)

        faults = _FaultFilter()
        self._faults = faults

        # instrumentation passes; the list order is the order in which they are registered
        passes: List[Pass] = [
            _X86PatchUndefinedFlagsPass(self._instruction_set, self),
            _X86SandboxPass(self._target_desc, faults),
            _X86PatchUndefinedResultPass(),
        ]

        # optional passes, enabled by the fault filter
        if faults.non_canonical_access:
            passes.append(_X86NonCanonicalAddressPass(self._target_desc))
        if faults.u2k_access:
            passes.append(_X86U2KAccessPass())  # must be after X86SandboxPass

        # opcode patching is always the last pass
        passes.append(_X86PatchOpcodesPass())

        self._passes = passes
        self._printer = _X86Printer(self._target_desc)


================================================
FILE: rvzr/arch/x86/get_spec.py
================================================
"""
File: A script that downloads the x86 instruction set from the Side Channel Fuzzer repository
      and parses it into a JSON file that can be used by the generator.

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
import sys
import json
import subprocess
from typing import List, Optional, Literal
from xml.etree import ElementTree as ET

# ==================================================================================================
# x86-specific constants
# ==================================================================================================
# Register name (lowercase) -> register width in bits.
# The parser uses this table in two ways (see `XMLSpecParser._parse_reg_operand`):
# - as a list of supported registers: operands whose first register is missing here
#   make the parser skip the instruction
# - as a fallback for the operand width when the XML does not specify it
# NOTE(review): "tmm0" has width 0 here - presumably a placeholder; confirm before relying on it
REG_SIZE = {
    "rax": 64,
    "rbx": 64,
    "rcx": 64,
    "rdx": 64,
    "r11": 64,
    "rip": 64,
    "rsp": 64,
    "rbp": 64,
    "eax": 32,
    "ebx": 32,
    "ecx": 32,
    "edx": 32,
    "ax": 16,
    "dx": 16,
    "bp": 16,
    "sp": 16,
    "al": 8,
    "ah": 8,
    "cl": 8,
    "spl": 8,
    "tmm0": 0,
    "mxcsr": 32,
    'es': 16,
    'ss': 16,
    'ds': 16,
    'fs': 16,
    'gs': 16,
    'cr0': 64,
    'cr3': 64,
    'cr4': 64,
    'cr8': 64,
    'xcr0': 64,
    'dr0': 64,
    'dr1': 64,
    'dr2': 64,
    'dr3': 64,
    'dr6': 64,
    'dr7': 64,
    'gdtr': 80,
    'ldtr': 96,
    'idtr': 80,
    'tr': 16,
    'msrs': 64,
    'x87control': 16,
    'x87pop': 16,
    'x87status': 16,
    'tsc': 64,
    "tscaux": 64,
    "fsbase": 64,
    "gsbase": 64,
}
# Vector registers: mm0-mm7 (64 bit), xmm0-xmm15 (128 bit), ymm0-ymm15 (256 bit)
REG_SIZE.update({f"mm{i}": 64 for i in range(8)})
REG_SIZE.update({f"xmm{i}": 128 for i in range(16)})
REG_SIZE.update({f"ymm{i}": 256 for i in range(16)})
# zmm registers are intentionally left out (the line below is disabled)
# REG_SIZE.update({f"zmm{i}": 512 for i in range(32)})

# A list of instructions that have RIP as an operand but should
# not be considered as control-flow instructions by the generator
# (names are compared against the lowercased instruction name)
NON_CONTROL_FLOW_INST = ["int", "int1", "int3", "into"]

# ==================================================================================================
# Lists of x86 extensions
# ==================================================================================================

# Extensions whose instructions can be tested without any repercussions.
# This list is for our default model backend (Unicorn).
# Each extension is listed exactly once.
SAFE_EXTENSIONS = [
    "BASE",
    "SSE",
    "SSE2",
    "SSE3",
    "SSE4",
    "SSE4a",
    "CLFLUSHOPT",
    "CLFSH",
    "RDTSCP",
    "LONGMODE",
]

# Extensions whose instructions can be tested without any repercussions
# on the new (experimental) backend, DynamoRIO.
# Selected by the "ALL_SUPPORTED_DR" keyword (see `Downloader`).
SAFE_EXTENSIONS_DR = [
    "3DNOW_PREFETCH",
    "3DNOW",
    "ADOX_ADCX",
    "AES",
    "AVX_VNNI",
    "AVX",
    "AVX2",
    "AVX2GATHER",
    "AVX512EVEX",
    "AVX512VEX",
    "AVXAES",
    "BASE",
    "BMI1",
    "BMI2",
    "CLFLUSHOPT",
    "CLFSH",
    "FMA",
    "FMA4",
    "GFNI",
    "LONGMODE",
    "LZCNT",
    "MCOMMIT",
    "MMX",
    "MOVBE",
    "MOVDIR",
    "PCLMULQDQ",
    "PCONFIG",
    "PKU",
    "PREFETCHWT1",
    "PTWRITE",
    "RDPID",
    "RDPRU",
    "RDRAND",
    "RDSEED",
    "RDWRFSGS",
    "SERIALIZE",
    "SHA",
    "SMAP",
    "SSE",
    "SSE2",
    "SSE3",
    "SSE4",
    "SSE4a",
    "SSSE3",
    "TBM",
    "UINTR",
    "VAES",
    "VPCLMULQDQ",
    "XOP",
]

# All extensions selectable with the "ALL_AND_UNSAFE" keyword (see `Downloader`):
# the safe extensions (SAFE_EXTENSIONS) plus the extensions listed below, whose
# instructions can potentially crash the system if the fuzzer is misconfigured
ALL_EXTENSIONS = SAFE_EXTENSIONS + [
    "VTX",
    "SVM",
    "SMX",
    "WBNOINVD",
    "XSAVE",
    "XSAVEOPT",
    "XSAVES",
    "SGX",
    "ENQCMD",
    "INVPCID",
    "KEYLOCKER",
    "MONITOR",
    "PAUSE",
    "RDRAND",
    "RDSEED",
    "RDWRFSGS",
    "HRESET",
    "SMAP",
    "AMD_INVLPGB",
    "SNP",
]

# ==================================================================================================
# Internal Classes that represent the parsed XML data
# ==================================================================================================
# Operand kinds produced by the parser; stored in `_XMLOperandSpec.type_`
OP_TYPE = Literal["REG", "MEM", "AGEN", "IMM", "LABEL", "FLAGS"]


class _XMLOperandSpec:
    """
    A class that represents an operand parsed from the XML file.

    The fields are filled in by the parser after construction. Fields that have a
    class-level default and were never assigned on the instance are not stored
    in the instance, and hence do not appear in the JSON produced by `to_json`.
    """
    values: List[str]
    type_: OP_TYPE
    xtype: str
    width: int
    is_signed: bool = True
    comment: str
    src: bool = False
    dest: bool = False
    magic: bool = False

    def to_json(self) -> str:
        """
        Converts the operand to a JSON string.

        Side effect: `self.values` is replaced with its lowercased version.
        The JSON object contains the instance attributes in the order of their assignment.
        """
        self.values = [value.lower() for value in self.values]
        return json.dumps(self, default=vars)


class _XMLInstructionSpec:
    """ A class that represents an instruction parsed from the XML file """
    name: str
    category: str = ""
    is_control_flow: bool = False
    operands: List[_XMLOperandSpec]
    implicit_operands: List[_XMLOperandSpec]

    def __init__(self) -> None:
        # per-instance lists; `name` has to be assigned by the parser afterwards
        self.operands = []
        self.implicit_operands = []

    def __str__(self) -> str:
        n_explicit, n_implicit = len(self.operands), len(self.implicit_operands)
        return f"{self.name} {self.is_control_flow} {self.category} {n_explicit} {n_implicit}"

    def to_json(self) -> str:
        """
        Converts the instruction to a JSON string.

        The string is assembled manually to get a fixed layout: the instruction attributes
        on the first line, followed by one operand per line.
        """
        operand_sep = ',\n    '
        header = f'"name": "{self.name.lower()}", "category": "{self.category}", ' \
                 f'"is_control_flow": {str(self.is_control_flow).lower()},\n'

        # explicit operands first, then the implicit ones
        explicit = operand_sep.join([o.to_json() for o in self.operands])
        if self.implicit_operands:
            implicit = operand_sep.join([o.to_json() for o in self.implicit_operands])
            implicit_section = '  "implicit_operands": [\n    ' + implicit + '\n  ]'
        else:
            implicit_section = '  "implicit_operands": []'

        pieces = [
            "{",
            header,
            '  "operands": [\n    ',
            explicit,
            '\n  ],\n',
            implicit_section,
            "\n}",
        ]
        return "".join(pieces)


# ==================================================================================================
# Classes that parse the XML file and convert it to JSON
# ==================================================================================================
class _ParseFailed(Exception):
    """
    An exception that is raised when parsing of an operand fails.
    It is caught in `XMLSpecParser._parse_node`, which then skips the whole instruction.
    """


class XMLSpecParser:
    """
    A class that parses the XML file and converts it to JSON.

    Expected usage (see `Downloader.run`): `parse_file`, then `add_missing`,
    then `save_as_json`.
    """
    # total number of <instruction> nodes in the parsed XML (including the skipped ones)
    n_instructions_in_xml: int = 0
    # root element of the parsed XML
    _tree: ET.Element
    # instruction specs collected by `parse_file` and `add_missing`
    _instructions: List[_XMLInstructionSpec]
    _current_spec: _XMLInstructionSpec

    def __init__(self, extensions: List[str]) -> None:
        """
        :param extensions: names of the ISA extensions whose instructions should be parsed
        """
        self.extensions = extensions
        self._instructions = []

    def __len__(self) -> int:
        """ Number of instruction specs collected so far """
        return len(self._instructions)

    def parse_file(self, filename: str) -> None:
        """
        Parses the XML file and saves a list of _XMLInstructionSpec objects.
        Exits the process with code 1 if the root element of the XML has no children.

        :param filename: path to the XML file with the instruction set
        """

        # Get a tree from the XML file
        parser = ET.ElementTree()
        tree = parser.parse(filename)
        # NOTE: the check is explicit because the truth value of an Element is deprecated;
        # historically, it was False for elements without children
        if tree is None or len(tree) == 0:
            print("No input. Exiting")
            sys.exit(1)
        self._tree = tree
        self.n_instructions_in_xml = len(list(self._tree.iter('instruction')))

        # Check if the requested extensions are available
        self._check_extension_list()

        # Parse all nodes in the tree
        for instruction_node in self._tree.iter('instruction'):
            instruction_spec = self._parse_node(instruction_node)  # pylint: disable=e1128
            if instruction_spec is not None:
                self._instructions.append(instruction_spec)

    def save_as_json(self, filename: str) -> None:
        """
        Saves the parsed instructions as a JSON file

        :param filename: path of the output file; overwritten if it exists
        """
        json_str = "[\n" + ",\n".join([i.to_json() for i in self._instructions]) + "\n]"
        # print(json_str)
        with open(filename, "w+") as f:
            f.write(json_str)

    def _parse_node(self, node: ET.Element) -> Optional[_XMLInstructionSpec]:
        """
        Convert one <instruction> node into an instruction spec.

        :param node: <instruction> element of the XML tree
        :return: the parsed spec, or None if the instruction is not supported, does not belong
            to the requested extensions, or one of its operands could not be parsed
        """
        # pylint: disable=too-many-branches  # Justified because it's a parser

        # Check if the node should be skipped
        if self._node_is_not_supported(node):
            return None
        if node.attrib['extension'] not in self.extensions:
            return None

        # Create a new instruction spec
        instruction = _XMLInstructionSpec()

        # Parse instruction attributes
        # (the assembler hints `{load}`, `{store}` and `{disp32}` are not a part of the name)
        instruction.category = f"{node.attrib['extension']}-{node.attrib['category']}"
        instruction.name = node.attrib['asm'].removeprefix("{load} ")\
            .removeprefix("{store} ").removeprefix("{disp32} ").lower()

        try:
            for op_node in node.iter('operand'):
                # Create a new operand spec based on the node type
                op_type = op_node.attrib['type']
                if op_type == 'reg':
                    parsed_op = self._parse_reg_operand(op_node)
                elif op_type == 'mem':
                    parsed_op = self._parse_mem_operand(op_node)
                elif op_type == 'agen':
                    op_node.text = node.attrib['agen']
                    parsed_op = self._parse_agen_operand(op_node)
                elif op_type == 'imm':
                    parsed_op = self._parse_imm_operand(op_node)
                elif op_type == 'relbr':
                    parsed_op = self._parse_label_operand(op_node)
                elif op_type == 'flags':
                    parsed_op = self._parse_flags_operand(op_node)
                else:
                    raise _ParseFailed("Unknown operand type " + op_type)

                # Add the operand to the instruction
                if op_node.attrib.get('suppressed', '0') == '1':
                    instruction.implicit_operands.append(parsed_op)
                else:
                    instruction.operands.append(parsed_op)

                # Set additional operand attributes
                if op_node.attrib.get('implicit', '0') == '1':
                    parsed_op.magic = True

                # Set additional instruction attributes based on the operand
                if parsed_op.type_ == "REG":
                    # `text` is None for an element without text, hence the fallback
                    text = (op_node.text or '').lower()
                    if text == "rip" and instruction.name not in NON_CONTROL_FLOW_INST:
                        instruction.is_control_flow = True
                elif parsed_op.type_ == "LABEL":
                    instruction.is_control_flow = True

        except _ParseFailed as e:
            # If parsing fails, skip the instruction
            print(f"WARN: Skipping instruction {instruction.name} due to `{e}`")
            return None

        return instruction

    def _node_is_not_supported(self, node: ET.Element) -> bool:
        """ Check if the node has one of the unsupported attributes (sae, roundc, zeroing) """
        return node.attrib.get('sae', '') == '1' or \
            node.attrib.get('roundc', '') == '1' or \
            node.attrib.get('zeroing', '') == '1'

    def _parse_reg_operand(self, op: ET.Element) -> _XMLOperandSpec:
        """
        Parse a register operand; the element text is a comma-separated list of registers.

        :raises _ParseFailed: if the first register in the list is not in REG_SIZE
        """
        assert op.text is not None

        spec = _XMLOperandSpec()
        spec.type_ = "REG"
        if op.attrib.get('xtype', '') != '':
            spec.xtype = op.attrib.get('xtype', '')

        spec.values = op.text.lower().split(',')
        if spec.values[0] not in REG_SIZE:
            raise _ParseFailed(f"Unsupported register operand {spec.values[0]}")

        spec.src = op.attrib.get('r', "0") == "1"
        spec.dest = op.attrib.get('w', "0") == "1"

        # use the register size if the XML does not specify the width
        spec.width = int(op.attrib.get('width', 0))
        if spec.width == 0:
            spec.width = REG_SIZE[spec.values[0]]

        return spec

    @staticmethod
    def _parse_mem_operand(op: ET.Element) -> _XMLOperandSpec:
        """
        Parse a memory operand.

        :raises _ParseFailed: if the operand uses VSIB addressing or has a memory suffix
        """
        assert op.attrib is not None

        # asserts are for unsupported instructions
        if op.attrib.get('VSIB', '0') != '0':
            raise _ParseFailed("Vector SIB memory addressing is not supported")
        # assert op.attrib.get('VSIB', '0') == '0'  # asm += '[' + op.attrib.get('VSIB') + '0]'
        if op.attrib.get('memory-suffix', '') != '':
            raise _ParseFailed(f"Unsupported memory suffix {op.attrib.get('memory-suffix', '')}")

        # the only possible value is the fixed base register, if there is one
        choices = []
        if op.attrib.get('base', ''):
            choices = [op.attrib.get('base', '')]

        spec = _XMLOperandSpec()
        spec.type_ = "MEM"
        spec.values = choices
        spec.src = op.attrib.get('r', "0") == "1"
        spec.dest = op.attrib.get('w', "0") == "1"
        spec.width = int(op.attrib.get('width', '0'))
        return spec

    @staticmethod
    def _parse_agen_operand(_: ET.Element) -> _XMLOperandSpec:
        """ Create a spec of an address-generation operand: a 64-bit source without values """
        spec = _XMLOperandSpec()
        spec.type_ = "AGEN"
        spec.values = []
        spec.src = True
        spec.dest = False
        spec.width = 64
        return spec

    @staticmethod
    def _parse_imm_operand(op: ET.Element) -> _XMLOperandSpec:
        """
        Parse an immediate operand. Implicit immediates have a single fixed value
        (the element text); the others have no predefined values.
        """
        assert op.attrib is not None

        spec = _XMLOperandSpec()
        spec.type_ = "IMM"
        if op.attrib.get('implicit', '0') == '1':
            assert op.text is not None
            spec.values = [op.text]
        else:
            spec.values = []
        spec.src = True
        spec.dest = False
        spec.width = int(op.attrib.get('width', '0'))
        # immediates are signed unless the XML explicitly says otherwise
        if op.attrib.get('s', '1') == '0':
            spec.is_signed = False
        return spec

    @staticmethod
    def _parse_label_operand(_: ET.Element) -> _XMLOperandSpec:
        """ Create a spec of a label operand (branch target): a source of zero width """
        spec = _XMLOperandSpec()
        spec.type_ = "LABEL"
        spec.values = []
        spec.src = True
        spec.dest = False
        spec.width = 0
        return spec

    @staticmethod
    def _parse_flags_operand(op: ET.Element) -> _XMLOperandSpec:
        """
        Parse a FLAGS operand. The values are the per-flag access types taken from
        the XML attributes, always in the order CF, PF, AF, ZF, SF, TF, IF, DF, OF;
        an empty string means that the attribute is absent.
        """
        spec = _XMLOperandSpec()
        spec.type_ = "FLAGS"
        spec.values = [
            op.attrib.get("flag_CF", ""),
            op.attrib.get("flag_PF", ""),
            op.attrib.get("flag_AF", ""),
            op.attrib.get("flag_ZF", ""),
            op.attrib.get("flag_SF", ""),
            op.attrib.get("flag_TF", ""),
            op.attrib.get("flag_IF", ""),
            op.attrib.get("flag_DF", ""),
            op.attrib.get("flag_OF", ""),
        ]
        spec.src = False
        spec.dest = False
        spec.width = 0
        return spec

    @staticmethod
    def _make_mem_only_spec(name: str, category: str, width: int) -> _XMLInstructionSpec:
        """ Create a spec of an instruction with a single read-only memory operand """
        inst = _XMLInstructionSpec()
        inst.name = name
        inst.category = category
        inst.is_control_flow = False
        # NOTE: the assignment order defines the order of the keys in the JSON output
        op = _XMLOperandSpec()
        op.type_ = "MEM"
        op.values = []
        op.src = True
        op.dest = False
        op.width = width
        inst.operands = [op]
        return inst

    def add_missing(self) -> None:  # pylint: disable=too-many-statements
        """
        Adds the instructions specs that are missing from the XML file we use:
        clflush, clflushopt (one spec per operand width) and int1.
        A spec is added only if its extension was requested or if no extensions were given.
        """
        extensions = self.extensions
        flush_widths = [8, 16, 32, 64]

        if not extensions or "CLFSH" in extensions:
            for width in flush_widths:
                self._instructions.append(
                    self._make_mem_only_spec("clflush", "CLFSH-MISC", width))

        if not extensions or "CLFLUSHOPT" in extensions:
            for width in flush_widths:
                self._instructions.append(
                    self._make_mem_only_spec("clflushopt", "CLFLUSHOPT-CLFLUSHOPT", width))

        if not extensions or "BASE" in extensions:
            inst = _XMLInstructionSpec()
            inst.name = "int1"
            inst.category = "BASE-INTERRUPT"
            inst.is_control_flow = False
            # implicit operands: RIP (written) and FLAGS (TF and IF written)
            op1 = _XMLOperandSpec()
            op1.type_, op1.src, op1.dest, op1.width = "REG", False, True, 64
            op1.values = ["rip"]
            op2 = _XMLOperandSpec()
            op2.type_, op2.src, op2.dest, op2.width = "FLAGS", False, False, 0
            op2.values = ["", "", "", "", "", "w", "w", "", ""]
            inst.implicit_operands = [op1, op2]
            self._instructions.append(inst)

    def _check_extension_list(self) -> None:
        """
        Print an error for every requested extension that does not appear in the XML.
        The check only reports the problem; it does not stop the parsing.
        """
        # get a list of all available extensions
        available_extensions = set()
        for instruction_node in self._tree.iter('instruction'):
            available_extensions.add(instruction_node.attrib['extension'])

        # check if the requested extensions are available
        for ext in self.extensions:
            if ext not in available_extensions:
                print(f"ERROR: Unknown extension {ext}")
                print("\nAvailable extensions:")
                print(list(available_extensions))


class Downloader:
    """
    A class that downloads the x86 instruction set and converts it to JSON.

    The list of requested extensions may contain one of the meta-names
    "ALL_SUPPORTED", "ALL_SUPPORTED_DR" or "ALL_AND_UNSAFE"; the first one found
    (in that priority order) is replaced with the corresponding list of extensions.
    """

    def __init__(self, extensions: List[str], out_file: str) -> None:
        """
        :param extensions: names of the ISA extensions to keep (optionally with a meta-name);
                           the list is copied and never modified
        :param out_file: path of the JSON file produced by `run`
        """
        # work on a private copy so that the caller's list is left untouched
        requested = list(extensions)

        # only the first matching meta-name is expanded; the order encodes the priority
        meta_extensions = (
            ("ALL_SUPPORTED", SAFE_EXTENSIONS),
            ("ALL_SUPPORTED_DR", SAFE_EXTENSIONS_DR),
            ("ALL_AND_UNSAFE", ALL_EXTENSIONS),
        )
        for meta_name, expansion in meta_extensions:
            if meta_name in requested:
                # merge, drop duplicates (keeping a deterministic order), remove the meta-name
                merged = dict.fromkeys(requested + list(expansion))
                requested = [ext for ext in merged if ext != meta_name]
                break

        self.extensions = requested
        self.out_file = out_file
        self._transformer = XMLSpecParser(self.extensions)

    def run(self) -> None:
        """
        Downloads the XML file and converts it to JSON

        The XML file is stored in the current working directory and removed again
        once the conversion has finished (successfully or not).
        :raises subprocess.CalledProcessError: if `curl` or `rm` exits with a non-zero status
        """
        xml_file = "x86_instructions.xml"
        url = ("https://github.com/microsoft/side-channel-fuzzer/releases/download/"
               "v1.3.0/x86_instructions.xml")

        print("> Downloading complete instruction spec...")
        # an argument list (no shell) avoids any shell interpretation of the command line
        subprocess.run(["curl", "-L", "-o", xml_file, url], check=True)

        print("\n> Filtering and transforming the instruction spec...")
        try:
            self._transformer.parse_file(xml_file)
            self._transformer.add_missing()
            self._transformer.save_as_json(self.out_file)
        finally:
            # the downloaded XML is only an intermediate artifact
            subprocess.run(["rm", xml_file], check=True)

        n_parsed = len(self._transformer)
        n_all = self._transformer.n_instructions_in_xml
        # report the actual output path rather than a hard-coded file name
        print(f"Produced {self.out_file} with {n_parsed} instructions (out of {n_all} possible)")


# NOTE: for reference, the complete list of all categories available in the XML file is:
# "3DNOW-3DNOW", "ADOX_ADCX-ADOX_ADCX", "AES-AES", "AVXAES-AES", "AMX_BF16-AMX_TILE",
# "AMX_INT8-AMX_TILE", "AMX_TILE-AMX_TILE", "AVX2-AVX2", "AVX2GATHER-AVX2GATHER",
# "AVX512EVEX-AVX512_4FMAPS", "AVX512EVEX-AVX512_4VNNIW", "AVX512EVEX-AVX512_BITALG",
# "AVX512EVEX-AVX512", "AVX512EVEX-AVX512_VBMI", "AVX512EVEX-AVX512_VP2INTERSECT", "AVX-AVX",
# "BASE-BINARY", "BASE-BITBYTE", "SSE4a-BITBYTE", "AVX512EVEX-BLEND", "BMI1-BMI1", "BMI2-BMI2",
# "AVX-BROADCAST", "AVX2-BROADCAST", "AVX512EVEX-BROADCAST", "BASE-CALL", "CET-CET",
# "CLDEMOTE-CLDEMOTE", "CLFLUSHOPT-CLFLUSHOPT", "CLWB-CLWB", "CLZERO-CLZERO", "BASE-CMOV",
# "AVX512EVEX-COMPRESS", "BASE-COND_BR", "RTM-COND_BR", "AVX512EVEX-CONFLICT", "AVX-CONVERT",
# "AVX512EVEX-CONVERT", "BASE-CONVERT", "F16C-CONVERT", "LONGMODE-CONVERT", "SSE-CONVERT",
# "SSE2-CONVERT", "AVX-DATAXFER", "AVX2-DATAXFER", "AVX512EVEX-DATAXFER", "BASE-DATAXFER",
# "LONGMODE-DATAXFER", "MMX-DATAXFER", "MOVBE-DATAXFER", "SSE-DATAXFER", "SSE2-DATAXFER",
# "SSE3-DATAXFER", "SSE4a-DATAXFER", "ENQCMD-ENQCMD", "AVX512EVEX-EXPAND", "X87-FCMOV",
# "BASE-FLAGOP", "FMA4-FMA4", "AVX512EVEX-FP16", "AVX512EVEX-GATHER", "AVX512EVEX-GFNI",
# "GFNI-GFNI", "HRESET-HRESET", "AVX512EVEX-IFMA", "BASE-INTERRUPT", "BASE-IO",
# "BASE-IOSTRINGOP", "KEYLOCKER-KEYLOCKER", "KEYLOCKER_WIDE-KEYLOCKER_WIDE",
# "AVX512VEX-KMASK", "TDX-LEGACY", "AVX-LOGICAL", "AVX2-LOGICAL", "AVX512EVEX-LOGICAL",
# "BASE-LOGICAL", "MMX-LOGICAL", "RTM-LOGICAL", "SSE2-LOGICAL", "SSE4-LOGICAL",
# "AVX-LOGICAL_FP", "AVX512EVEX-LOGICAL_FP", "SSE-LOGICAL_FP", "SSE2-LOGICAL_FP",
# "LZCNT-LZCNT", "BASE-MISC", "CLFSH-MISC", "INVPCID-MISC", "MCOMMIT-MISC", "MONITOR-MISC",
# "MONITORX-MISC", "PAUSE-MISC", "SSE-MISC", "SSE2-MISC", "3DNOW-MMX", "MMX-MMX",
# "SSE2-MMX", "SSSE3-MMX", "MOVDIR-MOVDIR", "MPX-MPX", "BASE-NOP", "PCLMULQDQ-PCLMULQDQ",
# "PCONFIG-PCONFIG", "PKU-PKU", "BASE-POP", "LONGMODE-POP", "3DNOW_PREFETCH-PREFETCH",
# "SSE-PREFETCH", "PREFETCHWT1-PREFETCHWT1", "PTWRITE-PTWRITE", "BASE-PUSH", "LONGMODE-PUSH",
# "RDPID-RDPID", "RDPRU-RDPRU", "RDRAND-RDRAND", "RDSEED-RDSEED", "RDWRFSGS-RDWRFSGS",
# "BASE-RET", "LONGMODE-RET", "BASE-ROTATE", "AVX512EVEX-SCATTER", "BASE-SEGOP", "BASE-SEMAPHORE",
# "LONGMODE-SEMAPHORE", "SERIALIZE-SERIALIZE", "BASE-SETCC", "SGX-SGX", "SHA-SHA",
# "BASE-SHIFT", "SMAP-SMAP", "SSE-SSE", "SSE2-SSE", "SSE3-SSE", "SSE4-SSE", "SSSE3-SSE",
# "BASE-STRINGOP", "LONGMODE-STRINGOP", "AVX-STTNI", "BASE-SYSCALL", "LONGMODE-SYSCALL",
# "BASE-SYSRET", "LONGMODE-SYSRET", "AMD_INVLPGB-SYSTEM", "BASE-SYSTEM", "LONGMODE-SYSTEM",
# "RDTSCP-SYSTEM", "SMX-SYSTEM", "SNP-SYSTEM", "SVM-SYSTEM", "WBNOINVD-SYSTEM", "TBM-TBM",
# "TSX_LDTRK-TSX_LDTRK", "UINTR-UINTR", "BASE-UNCOND_BR", "RTM-UNCOND_BR", "AVX512EVEX-VAES",
# "VAES-VAES", "AVX512EVEX-VBMI2", "AVX_VNNI-VEX", "AVX512EVEX-VFMA", "FMA-VFMA",
# "VIA_PADLOCK_AES-VIA_PADLOCK", "VIA_PADLOCK_RNG-VIA_PADLOCK", "VIA_PADLOCK_SHA-VIA_PADLOCK",
# "AVX512EVEX-VPCLMULQDQ", "VPCLMULQDQ-VPCLMULQDQ", "VMFUNC-VTX", "VTX-VTX", "WAITPKG-WAITPKG",
# "BASE-WIDENOP", "SSE3-X87_ALU", "X87-X87_ALU", "XOP-XOP", "XSAVE-XSAVE", "XSAVEC-XSAVE",
# "XSAVES-XSAVE", "XSAVEOPT-XSAVEOPT"


================================================
FILE: rvzr/arch/x86/target_desc.py
================================================
"""
File: x86-specific constants and lists

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from typing import List, Dict, Final, Tuple
import re
import unicorn.x86_const as ucc  # type: ignore

from rvzr.tc_components.instruction import Instruction
from rvzr.target_desc import TargetDesc, CPUDesc, UnicornTargetDesc, PTEBitNameMapper, \
    PTEBitOffset, PTEBitName


class X86TargetDesc(TargetDesc):
    """
    Target description for x86 architecture.

    The class attributes are static lookup tables (register names and widths, page table
    bit layouts, memory operand prefixes). The constructor additionally derives
    per-machine values: the filtered register lists, the CPU description, and the
    vendor-specific layout of the VM (second-level) page table entries.
    """

    # Width, in bits, of every register name known to this target description
    register_sizes = {
        "mm0": 64, "mm1": 64, "mm2": 64, "mm3": 64, "mm4": 64, "mm5": 64, "mm6": 64, "mm7": 64,
        "xmm0": 128, "xmm1": 128, "xmm2": 128, "xmm3": 128, "xmm4": 128, "xmm5": 128, "xmm6": 128,
        "xmm7": 128,
        "ymm0": 256, "ymm1": 256, "ymm2": 256, "ymm3": 256, "ymm4": 256, "ymm5": 256, "ymm6": 256,
        "ymm7": 256,

        "rax": 64, "rbx": 64, "rcx": 64, "rdx": 64, "rsi": 64, "rdi": 64, "rsp": 64, "rbp": 64,
        "r8": 64, "r9": 64, "r10": 64, "r11": 64, "r12": 64, "r13": 64, "r14": 64, "r15": 64,

        "eax": 32, "ebx": 32, "ecx": 32, "edx": 32, "esi": 32, "edi": 32, "r8d": 32, "r9d": 32,
        "r10d": 32, "r11d": 32, "r12d": 32, "r13d": 32, "r14d": 32, "r15d": 32,

        "ax": 16, "bx": 16, "cx": 16, "dx": 16, "si": 16, "di": 16, "r8w": 16, "r9w": 16,
        "r10w": 16, "r11w": 16, "r12w": 16, "r13w": 16, "r14w": 16, "r15w": 16,

        "al": 8, "bl": 8, "cl": 8, "dl": 8, "sil": 8, "dil": 8, "r8b": 8, "r9b": 8,
        "r10b": 8, "r11b": 8, "r12b": 8, "r13b": 8, "r14b": 8, "r15b": 8,
        "ah": 8, "bh": 8, "ch": 8, "dh": 8,
    }  # yapf: disable

    # Register names grouped by width in bits. Note that the high-byte registers (ah, bh, ch, dh)
    # are not listed here. An instance attribute of the same name, produced by
    # _filter_blocked_registers(), is assigned in __init__.
    registers_by_size = {
        8: ["al", "bl", "cl", "dl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b",
            "r14b", "r15b"],
        16: ["ax", "bx", "cx", "dx", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w",
             "r14w", "r15w"],
        32: ["eax", "ebx", "ecx", "edx", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d",
             "r13d", "r14d", "r15d"],
        64: ["rax", "rbx", "rcx", "rdx", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13",
             "r14", "r15", "rsp", "rbp", "mm0", "mm1", "mm2", "mm3", "mm4", "mm5", "mm6", "mm7"],
        128: ["xmm0", "xmm1", "xmm2", "xmm3", "xmm4", "xmm5", "xmm6", "xmm7"],
        256: ["ymm0", "ymm1", "ymm2", "ymm3", "ymm4", "ymm5", "ymm6", "ymm7"],
    }  # yapf: disable

    # Maps a register (or flag) name to a width-independent identifier: all aliases of one
    # general-purpose register (e.g., rax/eax/ax/al/ah) share the same identifier ("A")
    reg_normalized = {
        "rax": "A", "eax": "A", "ax": "A", "al": "A", "ah": "A",
        "rbx": "B", "ebx": "B", "bx": "B", "bl": "B", "bh": "B",
        "rcx": "C", "ecx": "C", "cx": "C", "cl": "C", "ch": "C",
        "rdx": "D", "edx": "D", "dx": "D", "dl": "D", "dh": "D",
        "rsi": "SI", "esi": "SI", "si": "SI", "sil": "SI",
        "rdi": "DI", "edi": "DI", "di": "DI", "dil": "DI",
        "r8": "8", "r8d": "8", "r8w": "8", "r8b": "8",
        "r9": "9", "r9d": "9", "r9w": "9", "r9b": "9",
        "r10": "10", "r10d": "10", "r10w": "10", "r10b": "10",
        "r11": "11", "r11d": "11", "r11w": "11", "r11b": "11",
        "r12": "12", "r12d": "12", "r12w": "12", "r12b": "12",
        "r13": "13", "r13d": "13", "r13w": "13", "r13b": "13",
        "r14": "14", "r14d": "14", "r14w": "14", "r14b": "14",
        "r15": "15", "r15d": "15", "r15w": "15", "r15b": "15",
        "FLAGS": "FLAGS",
        "rip": "RIP",
        "rsp": "RSP",
        "CF": "CF", "PF": "PF", "AF": "AF", "ZF": "ZF", "SF": "SF", "TF": "TF", "IF": "IF",
        "DF": "DF", "OF": "OF", "AC": "AC",
        "mm0": "MM0",
        "mm1": "MM1",
        "mm2": "MM2",
        "mm3": "MM3",
        "mm4": "MM4",
        "mm5": "MM5",
        "mm6": "MM6",
        "mm7": "MM7",
        "xmm0": "XMM0",
        "xmm1": "XMM1",
        "xmm2": "XMM2",
        "xmm3": "XMM3",
        "xmm4": "XMM4",
        "xmm5": "XMM5",
        "xmm6": "XMM6",
        "xmm7": "XMM7",
        "ymm0": "YMM0",
        "ymm1": "YMM1",
        "ymm2": "YMM2",
        "ymm3": "YMM3",
        "ymm4": "YMM4",
        "ymm5": "YMM5",
        "ymm6": "YMM6",
        "ymm7": "YMM7",
        "cr0": "CR0",
        "cr2": "CR2",
        "cr3": "CR3",
        "cr4": "CR4",
        "cr8": "CR8",
        "xcr0": "XCR0",
        "dr0": "DR0",
        "dr1": "DR1",
        "dr2": "DR2",
        "dr3": "DR3",
        "dr6": "DR6",
        "dr7": "DR7",
        "gdtr": "GDTR",
        "idtr": "IDTR",
        "ldtr": "LDTR",
        "tr": "TR",
        "gs": "GS",
        "fs": "FS",
        "es": "ES",
        "ds": "DS",
        "cs": "CS",
        "ss": "SS",
        "fsbase": "FSBASE",
        "gsbase": "GSBASE",
        "msrs": "MSRS",
        "x87control": "X87CONTROL",
        "tsc": "TSC",
        "tscaux": "TSCAUX",
    }  # yapf: disable

    # Reverse direction of `reg_normalized`: normalized identifier -> {width in bits: name}.
    # Only a subset of the normalized identifiers has an entry here, and "RIP"/"RSP" map to
    # the 64-bit register name for every listed width.
    reg_denormalized = {
        "A": {64: "rax", 32: "eax", 16: "ax", 8: "al"},
        "B": {64: "rbx", 32: "ebx", 16: "bx", 8: "bl"},
        "C": {64: "rcx", 32: "ecx", 16: "cx", 8: "cl"},
        "D": {64: "rdx", 32: "edx", 16: "dx", 8: "dl"},
        "SI": {64: "rsi", 32: "esi", 16: "si", 8: "sil"},
        "DI": {64: "rdi", 32: "edi", 16: "di", 8: "dil"},
        "8": {64: "r8", 32: "r8d", 16: "r8w", 8: "r8b"},
        "9": {64: "r9", 32: "r9d", 16: "r9w", 8: "r9b"},
        "10": {64: "r10", 32: "r10d", 16: "r10w", 8: "r10b"},
        "11": {64: "r11", 32: "r11d", 16: "r11w", 8: "r11b"},
        "12": {64: "r12", 32: "r12d", 16: "r12w", 8: "r12b"},
        "13": {64: "r13", 32: "r13d", 16: "r13w", 8: "r13b"},
        "14": {64: "r14", 32: "r14d", 16: "r14w", 8: "r14b"},
        "15": {64: "r15", 32: "r15d", 16: "r15w", 8: "r15b"},
        "RIP": {64: "rip", 32: "rip", 16: "rip", 8: "rip"},
        "RSP": {64: "rsp", 32: "rsp", 16: "rsp", 8: "rsp"},
        "MM0": {64: "mm0"},
        "MM1": {64: "mm1"},
        "MM2": {64: "mm2"},
        "MM3": {64: "mm3"},
        "MM4": {64: "mm4"},
        "MM5": {64: "mm5"},
        "MM6": {64: "mm6"},
        "MM7": {64: "mm7"},
        "XMM0": {128: "xmm0"},
        "XMM1": {128: "xmm1"},
        "XMM2": {128: "xmm2"},
        "XMM3": {128: "xmm3"},
        "XMM4": {128: "xmm4"},
        "XMM5": {128: "xmm5"},
        "XMM6": {128: "xmm6"},
        "XMM7": {128: "xmm7"},
        "YMM0": {256: "ymm0"},
        "YMM1": {256: "ymm1"},
        "YMM2": {256: "ymm2"},
        "YMM3": {256: "ymm3"},
        "YMM4": {256: "ymm4"},
        "YMM5": {256: "ymm5"},
        "YMM6": {256: "ymm6"},
        "YMM7": {256: "ymm7"}
    }  # yapf: disable

    # presumably the registers allowed as index in generated memory operands — TODO confirm
    mem_index_registers = ["rax", "rbx", "rcx", "rdx", "rsi", "rdi"]

    # Page property name -> (name of the PTE bit in `pte_bits`, flag).
    # NOTE(review): the flag is True only for "executable" -> "non_executable", which suggests
    # that it marks an inverted property/bit relation — confirm against the users of this table
    page_property_to_pte_bit_name = {
        "present": ("present", False),
        "writable": ("writable", False),
        "user": ("user", False),
        'write-through': ("write-through", False),
        "cache-disable": ("cache-disable", False),
        "accessed": ("accessed", False),
        "dirty": ("dirty", False),
        "executable": ("non_executable", True),
        "reserved_bit": ("reserved_bit", False),
    }

    # Layout of a (first-level) page table entry
    pte_bits: Dict[PTEBitName, Tuple[PTEBitOffset, bool]] = {
        # NAME: (position, default value)
        "present": (0, True),
        "writable": (1, True),
        "user": (2, False),
        "write-through": (3, False),
        "cache-disable": (4, False),
        "accessed": (5, True),
        "dirty": (6, True),
        "reserved_bit": (51, False),
        "non_executable": (63, True),
    }

    # Page property name -> (name of the bit in `_epte_bits_intel`, flag);
    # selected in __init__ when the CPU vendor is 'Intel'
    _page_property_to_epte_bit_name: PTEBitNameMapper = {
        "present": ("present", False),
        "writable": ("writable", False),
        "user": ("user", False),
        "accessed": ("accessed", False),
        "dirty": ("dirty", False),
        "executable": ("executable", False),
        "reserved_bit": ("reserved_bit", False),
    }

    # Layout of a VM page table entry used when the CPU vendor is 'Intel'
    _epte_bits_intel: Dict[PTEBitName, Tuple[PTEBitOffset, bool]] = {
        # NAME: (position, default value)
        "present": (0, True),
        "writable": (1, True),
        "executable": (2, False),
        "accessed": (8, True),
        "dirty": (9, True),
        "user": (10, False),
        "reserved_bit": (51, False),
    }

    # Page property name -> (name of the bit in `_npte_bits_amd`, flag);
    # selected in __init__ for every vendor other than 'Intel'
    _page_property_to_npte_bit_name: PTEBitNameMapper = {
        "present": ("present", False),
        "writable": ("writable", False),
        "user": ("user", False),
        "accessed": ("accessed", False),
        "dirty": ("dirty", False),
        "executable": ("non_executable", True),
        "reserved_bit": ("reserved_bit", False),
    }

    # Layout of a VM page table entry used for every vendor other than 'Intel'
    _npte_bits_amd: Dict[PTEBitName, Tuple[PTEBitOffset, bool]] = {
        # NAME: (position, default value)
        "present": (0, True),
        "writable": (1, True),
        "user": (2, True),
        "accessed": (5, True),
        "dirty": (6, True),
        "reserved_bit": (51, False),
        "non_executable": (63, True),
    }

    # Memory operand width in bits -> size specifier used in front of the memory operand
    memory_addr_prefixes: Final[Dict[int, str]] = {
        8: "byte ptr",
        16: "word ptr",
        32: "dword ptr",
        64: "qword ptr",
        80: "tbyte ptr",
        128: "xmmword ptr",
        256: "ymmword ptr",
        512: "zmmword ptr",
        4608: "ptr",
    }

    def __init__(self) -> None:
        """ Derive the machine- and configuration-dependent parts of the description. """
        super().__init__()

        # modify/set target parameters based on the CPU under test and the configuration
        self.registers_by_size = self._filter_blocked_registers()
        self.cpu_desc = self._build_cpu_desc()

        # Select VM page table bits and property mapping based on vendor
        if self.cpu_desc.vendor == 'Intel':
            self.vm_pte_bits = self._epte_bits_intel
            self.page_property_to_vm_pte_bit_name = self._page_property_to_epte_bit_name
        else:
            # every non-Intel vendor (not only AMD) ends up with the AMD layout
            self.vm_pte_bits = self._npte_bits_amd
            self.page_property_to_vm_pte_bit_name = self._page_property_to_npte_bit_name

        # connect Unicorn TD
        self.uc_target_desc = X86UnicornTargetDesc()

    @staticmethod
    def is_unconditional_branch(inst: Instruction) -> bool:
        """ Return True if the instruction belongs to the "BASE-UNCOND_BR" category. """
        return inst.category == "BASE-UNCOND_BR"

    @staticmethod
    def is_call(inst: Instruction) -> bool:
        """ Return True if the instruction belongs to the "BASE-CALL" category. """
        return inst.category == "BASE-CALL"

    def _build_cpu_desc(self) -> CPUDesc:
        """
        Build the description of the CPU that the program is running on.

        For vendors other than "Intel" and "AMD", a description with zeroed numeric fields
        is returned and /proc/cpuinfo is not read. Otherwise, the first "cpu family",
        "model", and "stepping" entries of /proc/cpuinfo are used.

        :return: CPUDesc built from the vendor and the parsed values
        :raises AssertionError: if one of the entries is missing from /proc/cpuinfo
        """
        vendor = self.get_vendor()
        if vendor not in ["Intel", "AMD"]:
            return CPUDesc(vendor, 0, 0, 0)

        with open("/proc/cpuinfo", "r") as f:
            cpuinfo = f.read()

            # NOTE(review): all three values are parsed with base 16; Linux appears to print
            # these fields in decimal — confirm that the hexadecimal interpretation is intended
            family_match = re.search(r"cpu family\s+:\s+(.*)", cpuinfo)
            assert family_match, "Failed to find family in /proc/cpuinfo"
            family = int(family_match.group(1), 16)

            # only whitespace is allowed between "model" and the colon,
            # hence the "model name" entry is not matched by this expression
            model_match = re.search(r"model\s+:\s+(.*)", cpuinfo)
            assert model_match, "Failed to find model name in /proc/cpuinfo"
            model = int(model_match.group(1), 16)

            stepping_match = re.search(r"stepping\s+:\s+(.*)", cpuinfo)
            assert stepping_match, "Failed to find stepping in /proc/cpuinfo"
            stepping = int(stepping_match.group(1), 16)

        # NOTE(review): model is passed before family — verify against the field order of CPUDesc
        return CPUDesc(vendor, model, family, stepping)


class X86UnicornTargetDesc(UnicornTargetDesc):  # pylint: disable=too-few-public-methods
    """
    x86 target description in the context of a Unicorn-based model.

    All attributes are static tables that translate between register names used by the
    fuzzer and the register constants of Unicorn (`unicorn.x86_const`).
    """

    # Unicorn constants of the general-purpose registers (plus EFLAGS and RSP)
    usable_registers: List[int] = [
        ucc.UC_X86_REG_RAX, ucc.UC_X86_REG_RBX, ucc.UC_X86_REG_RCX, ucc.UC_X86_REG_RDX,
        ucc.UC_X86_REG_RSI, ucc.UC_X86_REG_RDI, ucc.UC_X86_REG_EFLAGS, ucc.UC_X86_REG_RSP
    ]

    # Unicorn constants of the 128-bit SIMD registers XMM0-XMM7
    usable_simd128_registers: List[int] = [
        ucc.UC_X86_REG_XMM0, ucc.UC_X86_REG_XMM1, ucc.UC_X86_REG_XMM2, ucc.UC_X86_REG_XMM3,
        ucc.UC_X86_REG_XMM4, ucc.UC_X86_REG_XMM5, ucc.UC_X86_REG_XMM6, ucc.UC_X86_REG_XMM7
    ]

    # Register name (as written in assembly) -> Unicorn constant of exactly that register
    reg_str_to_constant = {
        "al": ucc.UC_X86_REG_AL,
        "bl": ucc.UC_X86_REG_BL,
        "cl": ucc.UC_X86_REG_CL,
        "dl": ucc.UC_X86_REG_DL,
        "dil": ucc.UC_X86_REG_DIL,
        "sil": ucc.UC_X86_REG_SIL,
        "spl": ucc.UC_X86_REG_SPL,
        "bpl": ucc.UC_X86_REG_BPL,
        "ah": ucc.UC_X86_REG_AH,
        "bh": ucc.UC_X86_REG_BH,
        "ch": ucc.UC_X86_REG_CH,
        "dh": ucc.UC_X86_REG_DH,
        "ax": ucc.UC_X86_REG_AX,
        "bx": ucc.UC_X86_REG_BX,
        "cx": ucc.UC_X86_REG_CX,
        "dx": ucc.UC_X86_REG_DX,
        "di": ucc.UC_X86_REG_DI,
        "si": ucc.UC_X86_REG_SI,
        "sp": ucc.UC_X86_REG_SP,
        "bp": ucc.UC_X86_REG_BP,
        "eax": ucc.UC_X86_REG_EAX,
        "ebx": ucc.UC_X86_REG_EBX,
        "ecx": ucc.UC_X86_REG_ECX,
        "edx": ucc.UC_X86_REG_EDX,
        "edi": ucc.UC_X86_REG_EDI,
        "esi": ucc.UC_X86_REG_ESI,
        "esp": ucc.UC_X86_REG_ESP,
        "ebp": ucc.UC_X86_REG_EBP,
        "rax": ucc.UC_X86_REG_RAX,
        "rbx": ucc.UC_X86_REG_RBX,
        "rcx": ucc.UC_X86_REG_RCX,
        "rdx": ucc.UC_X86_REG_RDX,
        "rdi": ucc.UC_X86_REG_RDI,
        "rsi": ucc.UC_X86_REG_RSI,
        "rsp": ucc.UC_X86_REG_RSP,
        "rbp": ucc.UC_X86_REG_RBP,
        "xmm0": ucc.UC_X86_REG_XMM0,
        "xmm1": ucc.UC_X86_REG_XMM1,
        "xmm2": ucc.UC_X86_REG_XMM2,
        "xmm3": ucc.UC_X86_REG_XMM3,
        "xmm4": ucc.UC_X86_REG_XMM4,
        "xmm5": ucc.UC_X86_REG_XMM5,
        "xmm6": ucc.UC_X86_REG_XMM6,
        "xmm7": ucc.UC_X86_REG_XMM7
    }

    # Normalized register identifier -> Unicorn constant of the full-width register.
    # Individual flags all map to EFLAGS; identifiers mapped to -1 have no Unicorn
    # constant assigned in this table.
    reg_norm_to_constant = {
        "A": ucc.UC_X86_REG_RAX,
        "B": ucc.UC_X86_REG_RBX,
        "C": ucc.UC_X86_REG_RCX,
        "D": ucc.UC_X86_REG_RDX,
        "DI": ucc.UC_X86_REG_RDI,
        "SI": ucc.UC_X86_REG_RSI,
        "SP": ucc.UC_X86_REG_RSP,
        "BP": ucc.UC_X86_REG_RBP,
        "8": ucc.UC_X86_REG_R8,
        "9": ucc.UC_X86_REG_R9,
        "10": ucc.UC_X86_REG_R10,
        "11": ucc.UC_X86_REG_R11,
        "12": ucc.UC_X86_REG_R12,
        "13": ucc.UC_X86_REG_R13,
        "14": ucc.UC_X86_REG_R14,
        "15": ucc.UC_X86_REG_R15,
        "FLAGS": ucc.UC_X86_REG_EFLAGS,
        "CF": ucc.UC_X86_REG_EFLAGS,
        "PF": ucc.UC_X86_REG_EFLAGS,
        "AF": ucc.UC_X86_REG_EFLAGS,
        "ZF": ucc.UC_X86_REG_EFLAGS,
        "SF": ucc.UC_X86_REG_EFLAGS,
        "TF": ucc.UC_X86_REG_EFLAGS,
        "IF": ucc.UC_X86_REG_EFLAGS,
        "DF": ucc.UC_X86_REG_EFLAGS,
        "OF": ucc.UC_X86_REG_EFLAGS,
        "AC": ucc.UC_X86_REG_EFLAGS,
        "XMM0": ucc.UC_X86_REG_XMM0,
        "XMM1": ucc.UC_X86_REG_XMM1,
        "XMM2": ucc.UC_X86_REG_XMM2,
        "XMM3": ucc.UC_X86_REG_XMM3,
        "XMM4": ucc.UC_X86_REG_XMM4,
        "XMM5": ucc.UC_X86_REG_XMM5,
        "XMM6": ucc.UC_X86_REG_XMM6,
        "XMM7": ucc.UC_X86_REG_XMM7,
        "XMM8": ucc.UC_X86_REG_XMM8,
        "XMM9": ucc.UC_X86_REG_XMM9,
        "XMM10": ucc.UC_X86_REG_XMM10,
        "XMM11": ucc.UC_X86_REG_XMM11,
        "XMM12": ucc.UC_X86_REG_XMM12,
        # XMM13 was missing from the sequence, so a lookup of "XMM13" raised KeyError
        "XMM13": ucc.UC_X86_REG_XMM13,
        "XMM14": ucc.UC_X86_REG_XMM14,
        "XMM15": ucc.UC_X86_REG_XMM15,
        # NOTE(review): "RSP" maps to -1 although "SP" above maps to UC_X86_REG_RSP — confirm
        "RIP": -1,
        "RSP": -1,
        "CR0": -1,
        "CR2": -1,
        "CR3": -1,
        "CR4": -1,
        "CR8": -1,
        "XCR0": -1,
        "DR0": -1,
        "DR1": -1,
        "DR2": -1,
        "DR3": -1,
        "DR6": -1,
        "DR7": -1,
        "GDTR": -1,
        "IDTR": -1,
        "LDTR": -1,
        "TR": -1,
        "FSBASE": -1,
        "GSBASE": -1,
        "MSRS": -1,
        "X87CONTROL": -1,
        "TSC": -1,
        "TSCAUX": -1,
    }

    # Mnemonics of the instructions treated as barriers
    barriers: List[str] = ['mfence', 'lfence']
    # Unicorn constants of the registers with a dedicated role
    flags_register: int = ucc.UC_X86_REG_EFLAGS
    pc_register: int = ucc.UC_X86_REG_RIP
    sp_register: int = ucc.UC_X86_REG_RSP
    actor_base_register: int = ucc.UC_X86_REG_R14


================================================
FILE: rvzr/asm_parser.py
================================================
"""
File: Parsing of assembly files into our internal representation (TestCaseCode).
      This file contains ISA-independent code; see <isa>/<isa>_asm_parser.py for ISA-specific code.

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from __future__ import annotations

from dataclasses import dataclass
from typing import TYPE_CHECKING, Dict, List, Final, Optional
from abc import ABC, abstractmethod
from collections import OrderedDict
import re
import os

from .tc_components.test_case_code import TestCaseProgram, Function, BasicBlock, TC_EXIT_LABEL
from .tc_components.instruction import Instruction, LabelOp, Operand, RegisterOp, MemoryOp, \
    ImmediateOp, AgenOp, CondOp, AnyOperand
from .instruction_spec import OT, InstructionSpec, OperandSpec
from .tc_components.actor import ActorPL, ActorMode
from .code_generator import assemble
from .config import CONF

if TYPE_CHECKING:
    from .target_desc import TargetDesc
    from .isa_spec import InstructionSet
    from .elf_parser import ELFParser
    from .code_generator import CodeGenerator

# Matches a run of spaces that is not directly preceded by an alphanumeric character
# (e.g., the spaces after a comma, or all but the first space in a sequence of spaces
# that follows a word); such runs are deleted when a line is cleaned in _ASMLine
RE_REDUNDANT_SPACES = re.compile(r"(?<![a-zA-Z0-9]) +")
# The test case exit label with a colon appended
TC_EXIT_LINE = TC_EXIT_LABEL + ":"


class AsmParserError(Exception):
    """ Error reported by the AsmParser module when an assembly file cannot be parsed """

    def __init__(self, line_num: int, message: str) -> None:
        # the reported line number is `line_num + 1`
        header = f"[AsmParser] Error parsing assembly (line {line_num + 1}):"
        super().__init__(f"{header}\n{message}")


def asm_parser_assert(condition: bool, line_number: int, explanation: str) -> None:
    """
    Check a parsing invariant.

    :param condition: the invariant; nothing happens when it holds
    :param line_number: line number forwarded to AsmParserError
    :param explanation: error description forwarded to AsmParserError
    :raises AsmParserError: if the condition does not hold
    """
    if condition:
        return
    raise AsmParserError(line_number, explanation)


@dataclass
class _ASMLine:
    """
    A line of an assembly file together with its bookkeeping data.

    Attributes set by the constructor:
    - str: the line exactly as passed in
    - clean_str: the line stripped, lower-cased, and without redundant spaces
    - line_num: the line number passed in
    - patched_line_num, clean_line_num: initialized to 0
    """

    # NOTE(review): no dataclass fields are declared, so the methods generated by @dataclass
    # (e.g., __eq__ and __repr__) do not take the attributes below into account

    def __init__(self, str_: str, line_num: int) -> None:
        normalized = str_.strip().lower()
        self.str = str_
        self.clean_str = RE_REDUNDANT_SPACES.sub("", normalized)
        self.line_num = line_num
        self.patched_line_num = 0
        self.clean_line_num = 0


# ==================================================================================================
# Private: Code Map Builder
# ==================================================================================================
# Label of a basic block (without the trailing colon)
_BBLabel = str
# Lines of each basic block of a function, in the order in which the blocks were started
_BasicBlockMap = OrderedDict[_BBLabel, List[_ASMLine]]
# Label of a function (without the trailing colon)
_FunctionName = str
# Basic blocks of each function of a section
_FunctionMap = OrderedDict[_FunctionName, _BasicBlockMap]
# Label of a section (the last component of the dot-separated section name)
_SectionLabel = str
# Functions of each section of the test case
_CodeMap = OrderedDict[_SectionLabel, _FunctionMap]


class _CodeMapBuilder:
    """
    Class responsible for building a dictionary of sections, functions, basic blocks,
    and relationships between them in an assembly file

    The builder walks over the lines once and keeps track of the section, function,
    and basic block that the current line belongs to (`section_label`, `function_label`,
    `bb_label`). Instructions are appended to the basic block that is current at that point.
    """

    section_label: Optional[str] = None
    function_label: Optional[str] = None
    bb_label: Optional[str] = None
    bb_is_autogenerated: bool = False
    code_map: _CodeMap

    # prefixes of the data directives that are treated as opaque instructions ("opcode" lines)
    _opcode_directives = (".bcd", ".byte", ".long", ".quad",
                          ".value", ".2byte", ".4byte", ".8byte")

    def create_code_map(self, lines: List[_ASMLine]) -> _CodeMap:
        """
        Parse lines and build a map of sections, functions, and basic blocks
        in the test case
        :param lines: representation of the assembly file as a list of ASMLine objects
        :return: a dictionary representing the code structure of the test case (_CodeMap)
        """
        # start from a clean state, so that labels of a previously parsed file
        # cannot leak into this one when the builder object is reused
        self.code_map: _CodeMap = OrderedDict()
        self.section_label = None
        self.function_label = None
        self.bb_label = None
        self.bb_is_autogenerated = False

        # Parse each line according to its type and accumulate the code structure as we go
        for line_obj in lines:
            line_num = line_obj.line_num
            line = line_obj.clean_str
            type_ = self._get_line_type(line_obj)

            if type_ == "ignore":
                continue

            if type_ == "section":
                self._start_section(line_obj)
                continue

            if type_ == "function":
                self._start_function(line_obj)
                continue
            if self.function_label is None and self.section_label is not None:
                self._create_default_main_function()  # allow for implicit functions

            if type_ == "basic_block":
                self._start_basic_block(line_obj)
                continue

            if type_ == "instruction":
                self._add_instruction(line_obj)
                continue

            if type_ == "opcode":
                # the directive itself is not kept; it is recorded as a line "opcode"
                self._add_instruction(_ASMLine("opcode", line_num))
                continue

            if type_ == "macro":
                str_ = self._macro_label_to_instr(line, line_num)
                self._add_instruction(_ASMLine(str_, line_num))

        return self.code_map

    def _get_line_type(self, line: _ASMLine) -> str:
        """
        Classify a line based on its cleaned text.
        :return: one of "instruction", "ignore", "section", "function", "macro", "opcode",
                 "basic_block"
        :raises NotImplementedError: if the line starts with a dot and matches no known type
        """
        # pylint: disable=too-many-return-statements
        # NOTE: This is a selector, so it is expected to have many returns

        line_str = line.clean_str
        if line_str[0] != ".":
            return "instruction"
        if line_str.startswith((".global", ".intel_syntax")):
            return "ignore"
        if line_str.startswith(".section"):
            return "section"
        if line_str.startswith(".function_"):
            return "function"
        if line_str.startswith(".macro"):
            return "macro"
        # data directives; the same set of prefixes that _AsmPatcher treats as instructions
        if line_str.startswith(self._opcode_directives):
            return "opcode"
        # any other dot-prefixed line has to be a label
        if line_str[-1] == ":":
            return "basic_block"
        raise NotImplementedError(f"Line {line.line_num}: Unknown line type: {line_str}")

    def _start_section(self, line: _ASMLine) -> None:
        """
        Handle a `.section <label>` line: make the section current and forget
        the current function and basic block. The `exit` section is skipped.
        """
        line_str = line.clean_str
        words = line.clean_str.split()
        assert len(words) == 2, \
            f"Line {line.line_num}: Invalid section label {line_str}; expected .section <label>"

        # exit section does not represent any actor; ignore it
        if words[1] == "exit":
            return

        # parse the section label
        sub_words = words[1].split(".")
        assert len(sub_words) == 3, \
            f"Line {line.line_num}: Invalid section label: {line_str}"

        # the third dot-separated component is the name of the actor
        label = sub_words[2]
        assert label in CONF.get_actors_conf(), \
            f"Line {line.line_num}: Actor {label} was not defined in the config file"

        # update the parser state to reflect that a new section has started
        if label not in self.code_map:
            self.code_map[label] = OrderedDict()
        self.section_label = label
        self.function_label = None
        self.bb_label = None

    def _start_function(self, line: _ASMLine) -> None:
        """
        Handle a function label: register the function in the current section
        and give it an empty, automatically generated entry basic block.
        """
        assert self.section_label is not None, \
            f"Line {line.line_num}: Function started before a .section was declared"

        # get label
        line_str = line.clean_str
        assert line_str[-1] == ":", f"Invalid function header: {line_str}"
        label = line_str[:-1]

        # update the parser state to reflect that a new function has started
        self.function_label = label
        self.code_map[self.section_label][label] = OrderedDict()

        default_start_bb = ".bb_" + label.removeprefix(".function_") + ".entry"
        self.bb_label = default_start_bb
        self.bb_is_autogenerated = True
        self.code_map[self.section_label][label][default_start_bb] = []

    def _create_default_main_function(self) -> None:
        """
        Create an implicit function (with an automatically generated entry basic block)
        for a section whose code starts without a function label.
        """
        assert self.section_label is not None, \
            "Function started before a .section was declared"

        default_label = f".function_{self.section_label}_0"
        self.function_label = default_label
        self.code_map[self.section_label][default_label] = OrderedDict()

        default_start_bb = f".bb_{self.section_label}_0.entry"
        self.bb_label = default_start_bb
        self.bb_is_autogenerated = True
        self.code_map[self.section_label][default_label][default_start_bb] = []

    def _start_basic_block(self, line: _ASMLine) -> None:
        """
        Handle a basic block label: register an empty basic block in the current function
        and make it current. An automatically generated entry block that is still empty
        and is the only block of the function is dropped first.
        """
        assert self.section_label is not None, \
            f"Line {line.line_num}: Basic block started before a .section was declared"
        assert self.function_label is not None, \
            f"Line {line.line_num}: Basic block started before a .function was declared"
        assert self.bb_label is not None, \
            f"Line {line.line_num}: Default basic block was not created"

        # get label
        line_str = line.clean_str
        assert line_str[-1] == ":", f"Invalid basic block header: {line_str}"
        label = line_str[:-1]

        # overwrite default BB added to every function, if it is still empty
        bb_map = self.code_map[self.section_label][self.function_label]
        if len(bb_map) == 1 and len(bb_map[self.bb_label]) == 0 \
           and self.bb_is_autogenerated:
            del self.code_map[self.section_label][self.function_label][self.bb_label]

        # update the parser state to reflect that a new basic block has started
        self.bb_label = label
        self.bb_is_autogenerated = False
        assert label not in self.code_map[self.section_label][self.function_label], \
            f"Line {line.line_num}: Duplicate basic block label: {label}"
        self.code_map[self.section_label][self.function_label][label] = []

    def _add_instruction(self, line: _ASMLine) -> None:
        """ Append the line to the current basic block. """
        assert self.section_label is not None, \
            f"Line {line.line_num}: Instruction found before a .section was declared"
        assert self.function_label is not None, \
            f"Line {line.line_num}: Instruction found before a .function was declared"
        assert self.bb_label is not None, \
            f"Line {line.line_num}: Instruction found before a basic block was declared"

        self.code_map[self.section_label][self.function_label][self.bb_label].append(line)

    def _macro_label_to_instr(self, line: str, line_num: int) -> str:
        """
        This function replaces label-like macros with a pseudo-instruction MACRO
        As such, we simplify further parsing of the test case

        :param line: cleaned macro line; a dot-separated label, a colon, and a NOP placeholder
        :param line_num: line number used for error reporting
        :return: string `macro .<name>, .<args>` (`.noarg` if the macro has no arguments)
        :raises AsmParserError: if the line does not have the expected shape
        """
        # get rid of the NOP placeholder
        words = line.split(":")
        asm_parser_assert(len(words) == 2, line_num, "Invalid macro declaration")
        asm_parser_assert(words[1][:3] == "nop", line_num, "Patching error")

        # get the macro name and its arguments
        # (the label starts with a dot, hence subwords[0] is empty and subwords[1] is "macro")
        subwords = words[0].split(".")
        asm_parser_assert(len(subwords) >= 3, line_num, f"Invalid macro: {line}")
        asm_parser_assert(len(subwords) <= 7, line_num, f"Invalid macro: {line}")
        macro_id = subwords[2]
        args = '.'.join(subwords[3:])
        if args:
            instr = f"macro .{macro_id}, .{args}"
        else:
            instr = f"macro .{macro_id}, .noarg"

        return instr


# ==================================================================================================
# Private: Patching of assembly files
# ==================================================================================================
class _AsmPatcher:
    _main_function_label: str = ""
    _macro_placeholder_str: Optional[str] = None

    def set_macro_placeholder(self, macro_placeholder_str: str) -> None:
        """
        Assign a string to be used as a placeholder for macro instructions.

        This method exists to allow re-use of the _AsmPatcher class between different ISAs.
        The placeholder may be assigned only once; a second call fails the assertion below.

        :param macro_placeholder_str: text appended to macro labels during patching
        :return: None
        """
        assert self._macro_placeholder_str is None, \
            "Macro placeholder string was already set"
        self._macro_placeholder_str = macro_placeholder_str

    def patch_asm(self, asm_file: str, patched_asm_file: str) -> None:
        """
        Ensure that the assembly file is in the correct format for parsing.

        A normalized copy of `asm_file` (every line stripped and lower-cased) is written to
        `patched_asm_file`, and the following patches are then applied to the copy, in order:
        - .test_case_exit is rewritten to contain a single NOP and, where needed, is preceded
          by a `.section .data.main` directive
        - .function_0 is inserted before the first instruction (or before the exit) if no
          function label precedes it
        - the macro placeholder is appended to macro labels that do not have one
        - .macro.measurement_start / .macro.measurement_end are added if they are missing

        :param asm_file: path to the original assembly file (it is only read)
        :param patched_asm_file: path where the patched copy is written
        :return: None
        """
        # reset the state left by a previous call; it is set again by _add_default_main
        self._main_function_label = ""
        self._pre_clean(asm_file, patched_asm_file)

        # apply the patches
        self._add_exit_section(patched_asm_file)
        self._add_default_main(patched_asm_file)
        self._add_macro_placeholders(patched_asm_file)
        self._add_default_measurements(patched_asm_file)

    def _is_instruction(self, line: str) -> bool:
        return line != '' and line[0] not in ["#", "/"] \
            and (line[0] != '.' or line[:4] == ".bcd"
                 or line[:5] in [".byte", ".long", ".quad"] or line[:6] == '.macro'
                 or line[6:] in [".value", ".2byte", ".4byte", ".8byte"])

    def _pre_clean(self, asm_file: str, patched_asm_file: str) -> None:
        with open(asm_file, "r") as f:
            with open(patched_asm_file, "w") as patched:
                for line in f:
                    line = line.strip().lower()
                    patched.write(line + "\n")

    def _add_exit_section(self, patched_asm_file: str) -> None:
        prev_line = ""
        with open(patched_asm_file, "r") as f:
            with open(patched_asm_file + ".tmp", "w") as patched:
                for line in f:
                    line = line[:-1]
                    if ".test_case_exit:" in line:
                        if ".data.main" not in prev_line or "measurement_end" in prev_line:
                            patched.write(".section .data.main\n")
                        patched.write(".test_case_exit:" + "nop" + "\n")
                        continue
                    patched.write(line + "\n")
                    prev_line = line
        os.rename(patched_asm_file + ".tmp", patched_asm_file)

    def _add_default_main(self, patched_asm_file: str) -> None:
        main_function_label = ""
        with open(patched_asm_file, "r") as f:
            with open(patched_asm_file + ".tmp", "w") as patched:
                for line in f:
                    line = line[:-1]

                    # if we already have a main function, just copy the rest of the file
                    if main_function_label:
                        patched.write(line + "\n")
                        continue

                    # reached the end of the file
                    if ".test_case_exit:" in line:
                        main_function_label = ".function_0"
                        patched.write(".function_0:\n")
                        patched.write(line + "\n")
                        continue

                    # found the main function
                    if line.startswith(".function_"):
                        main_function_label = line[:-1]
                        patched.write(line + "\n")
                        continue

                    # found an instruction before the main function
                    if self._is_instruction(line):
                        patched.write(".function_0:\n")
                        main_function_label = ".function_0"
                        patched.write(line + "\n")
                        continue

                    # copy non-instruction lines
                    patched.write(line + "\n")

        self._main_function_label = main_function_label
        os.rename(patched_asm_file + ".tmp", patched_asm_file)

    def _add_macro_placeholders(self, patched_asm_file: str) -> None:
        """ add NOP placeholders after macros """
        assert self._macro_placeholder_str is not None, \
            "set_macro_placeholder() was not called before patching"

        with open(patched_asm_file, "r") as f:
            with open(patched_asm_file + ".tmp", "w") as patched:
                for line in f:
                    line = line.lower()
                    if line.startswith(".macro"):
                        if "nop" not in line:
                            patched.write(line[:-1] + self._macro_placeholder_str + "\n")
                        else:
                            assert self._macro_placeholder_str in line, \
                                "Unexpected NOP placeholder: " + line
                            patched.write(line)
                    else:
                        patched.write(line)
        os.rename(patched_asm_file + ".tmp", patched_asm_file)

    def _add_default_measurements(self, patched_asm_file: str) -> None:
        assert self._macro_placeholder_str is not None, \
            "set_macro_placeholder() was not called before patching"

        # identify if the file already has the measurement macros;
        # this information is used by multiple patching steps
        has_measurement_start = False
        has_measurement_end = False
        with open(patched_asm_file, "r") as f:
            for line in f:
                line = line.lower()
                if line.startswith(".macro.measurement_start"):
                    has_measurement_start = True
                elif line.startswith(".macro.measurement_end"):
                    has_measurement_end = True

        # add .macro.measurement_start after .function_0
        if not has_measurement_start:
            with open(patched_asm_file, "r") as f:
                with open(patched_asm_file + ".tmp", "w") as patched:
                    for line in f:
                        line = line.lower()
                        patched.write(line)
                        if line.startswith(self._main_function_label):
                            patched.write(".macro.measurement_start:" + self._macro_placeholder_str
                                          + "\n")
            os.rename(patched_asm_file + ".tmp", patched_asm_file)

        # add .macro.measurement_end before .test_case_exit
        if not has_measurement_end:
            with open(patched_asm_file, "r") as f:
                with open(patched_asm_file + ".tmp", "w") as patched:
                    prev_line = ""
                    for line in f:
                        line = line.lower()
                        if line.startswith(".test_case_exit:"):
                            if prev_line.startswith(".section"):
                                patched.write(".function_end:\n")
                            patched.write(".macro.measurement_end:" + self._macro_placeholder_str
                                          + "\n")
                        patched.write(line)
                        prev_line = line
            os.rename(patched_asm_file + ".tmp", patched_asm_file)


# ==================================================================================================
# Public (intended for <isa>/asm_parser.py): Line parsing
# ==================================================================================================
class AsmLineParser(ABC):
    """
    Class responsible for parsing an assembly line into an Instruction object.

    This class is a common ISA-independent functionality with hooks to be implemented by
    ISA-specific subclasses.
    """
    _instruction_map: Final[Dict[str, List[InstructionSpec]]]
    _curr_ln: int
    _comment_char: str  # set by subclasses

    def __init__(self, isa_spec: InstructionSet, target_desc: TargetDesc) -> None:
        """
        :param isa_spec: instruction set used to build the name -> specs lookup table
        :param target_desc: target description, stored for later use
        """
        self._instruction_map = self._build_instruction_map(isa_spec)
        self._target_desc = target_desc
        # number of the line being parsed; -1 until parse_line() is called
        self._curr_ln = -1

    # ----------------------------------------------------------------------------------------------
    # Hooks for ISA-specific subclasses
    @abstractmethod
    def _tokenize(self, line: str) -> List[str]:
        """
        Split the line into tokens.

        :param line: the lower-cased assembly line with the comment removed
        :return: list of tokens; parse_line() passes it to _get_instruction_name() and
                 _get_instruction_operands()
        """

    @abstractmethod
    def _get_instruction_name(self, line: str, tokens: List[str]) -> str:
        """
        Get the instruction name from the line, based on the tokenized data.

        :param line: the assembly line
        :param tokens: output of _tokenize() for this line
        :return: the instruction name
        """

    @abstractmethod
    def _get_instruction_operands(self, line: str, name: str, tokens: List[str]) -> List[str]:
        """
        Get the instruction operands from the line, based on the tokenized data.

        :param line: the assembly line
        :param name: the instruction name returned by _get_instruction_name()
        :param tokens: output of _tokenize() for this line
        :return: list of operand strings, in the order they are matched against the spec
        """

    @abstractmethod
    def _get_initial_candidate_specs(self, line: str, name: str) -> List[InstructionSpec]:
        """
        Get a list of candidate specs for the given assembly line.

        :param line: the assembly line
        :param name: the instruction name
        :return: candidate specs; an empty list is reported by the caller as
                 an unknown instruction
        """

    @abstractmethod
    def _check_if_spec_matches(self, spec: InstructionSpec, operands_raw: List[str]) -> bool:
        """
        Check if the given spec matches the given list of operand strings.

        :param spec: the candidate spec
        :param operands_raw: operand strings extracted from the assembly line
        :return: True if the spec can describe an instruction with these operands
        """

    # ----------------------------------------------------------------------------------------------
    # Common ISA-independent Functionality
    @staticmethod
    def _build_instruction_map(isa_spec: InstructionSet) -> Dict[str, List[InstructionSpec]]:
        """
        Build a lookup table that maps an instruction name to all specs with that name.

        In addition to the (unfiltered) ISA specs, the table always contains two
        pseudo-instructions: "opcode" (direct opcodes) and "macro" (a macro with two label
        operands). They are registered once, after the ISA specs, so that they are present
        even if the ISA is empty and so that they replace ISA specs with the same names.

        :param isa_spec: the instruction set to index
        :return: dictionary from instruction name to the list of matching specs
        """
        instruction_map: Dict[str, List[InstructionSpec]] = {}
        for spec in isa_spec.instructions_unfiltered:
            instruction_map.setdefault(spec.name, []).append(spec)

        # add an entry for direct opcodes
        instruction_map["opcode"] = [InstructionSpec("opcode", "opcode")]

        # entry for macros
        macro_spec = InstructionSpec("macro", "macro")
        macro_spec.operands = [
            OperandSpec([], OT.LABEL, False, False),
            OperandSpec([], OT.LABEL, False, False)
        ]
        instruction_map["macro"] = [macro_spec]
        return instruction_map

    def parse_line(self, line: str, line_num: int) -> Instruction:
        """
        Parse a single assembly line into an Instruction object.

        This is the ISA-independent driver: tokenization, name/operand extraction and
        spec matching are delegated to the hooks implemented by ISA-specific subclasses.

        :param line: the assembly line to parse
        :param line_num: line number; assigned to the instruction and used in error reports
        :return: the Instruction described by the line
        """
        self._curr_ln = line_num
        lowered = line.lower()

        # The markers are searched for in the whole line, i.e., before the comment is removed
        is_instrumentation = "instrumentation" in lowered
        is_noremove = "noremove" in lowered

        # Keep only the part in front of the comment character (if there is one)
        code = lowered
        if self._comment_char in lowered:
            code = lowered.partition(self._comment_char)[0].strip()

        # Extract the instruction name and its operands
        tokens = self._tokenize(code)
        name = self._get_instruction_name(code, tokens)
        operands_raw = self._get_instruction_operands(code, name, tokens)

        # Select the spec and build the instruction from it
        spec = self._find_matching_spec(code, name, operands_raw)
        inst = self._create_instruction(spec, operands_raw, is_instrumentation, is_noremove)
        inst.assign_line_num(line_num)
        return inst

    def _find_matching_spec(self, line: str, name: str, operands_raw: List[str]) -> InstructionSpec:
        """ Find the InstructionSpec that matches the given assembly line """

        # Get candidate specs
        specs = self._get_initial_candidate_specs(line, name)
        if len(specs) == 0:
            raise AsmParserError(self._curr_ln, f"Unknown instruction {line}")

        # find a matching spec
        matching_specs: List[InstructionSpec] = []
        for spec_candidate in specs:
            if self._check_if_spec_matches(spec_candidate, operands_raw):
                matching_specs.append(spec_candidate)
        if len(matching_specs) == 0:
            raise AsmParserError(self._curr_ln, f"Could not find a matching spec for {line}")

        # we might find several matches if the instruction has a magic operand value
        if len(matching_specs) > 1:
            magic_value_specs = list(filter(lambda x: (x.has_magic_value), matching_specs))
            if magic_value_specs:
                matching_specs = magic_value_specs

        # at this point we should have only one spec, but even if we don't, all of them should
        # be equivalent. Just pick the first
        return matching_specs[0]

    def _create_instruction(self, spec: InstructionSpec, operands_raw: List[str],
                            is_instrumentation: bool, is_noremove: bool) -> Instruction:
        """
        Build an Instruction and its operands from a spec and the raw operand strings.

        :param spec: the spec selected for the assembly line
        :param operands_raw: explicit operand strings; the i-th string is interpreted
                             according to the i-th operand of the spec
        :param is_instrumentation: flag forwarded to the created instruction
        :param is_noremove: flag forwarded to the created instruction
        :return: the instruction with explicit and implicit operands attached
        """

        def address_of(raw_operand: str) -> str:
            """ Extract the address expression enclosed in square brackets """
            found = re.search(r'\[(.*)\]', raw_operand)
            asm_parser_assert(found is not None, self._curr_ln, "Invalid memory address")
            return found.group(1)  # type: ignore

        # start from an instruction without operands
        inst = Instruction.from_spec(
            spec, is_instrumentation=is_instrumentation, is_noremove=is_noremove)

        # explicit operands: the operand class is selected by the type declared in the spec
        op: AnyOperand
        for op_id, op_raw in enumerate(operands_raw):
            op_spec = spec.operands[op_id]
            kind = op_spec.type
            if kind == OT.REG:
                op = RegisterOp(op_raw, op_spec.width, op_spec.src, op_spec.dest)
            elif kind == OT.MEM:
                op = MemoryOp(address_of(op_raw), op_spec.width, op_spec.src, op_spec.dest)
            elif kind == OT.IMM:
                op = ImmediateOp(op_raw, op_spec.width)
            elif kind == OT.LABEL:
                assert spec.is_control_flow or spec.name == "macro"
                op = LabelOp(op_raw)
            elif kind == OT.COND:
                op = CondOp(op_raw)
            else:  # AGEN
                op = AgenOp(address_of(op_raw), op_spec.width)
            inst.operands.append(op)

        # implicit operands always have a fixed spec, hence it's safe to use
        # the from_fixed_spec constructor
        for implicit_spec in spec.implicit_operands:
            inst.implicit_operands.append(Operand.from_fixed_spec(implicit_spec))
        return inst


# ==================================================================================================
# Public: High-level ASM Parser
# ==================================================================================================
class AsmParser(ABC):
    """
    Class responsible for parsing (and optionally patching) assembly files
    and producing TestCaseCode objects from them
    """

    _target_desc: Final[TargetDesc]
    _isa_spec: Final[InstructionSet]
    _asm_patcher: _AsmPatcher
    _line_parser: AsmLineParser
    _lines: List[_ASMLine]

    def __init__(self, isa_spec: InstructionSet, target_desc: TargetDesc) -> None:
        """
        :param isa_spec: the instruction set specification, stored for later use
        :param target_desc: the target description; used when connecting control flow
        """
        self._isa_spec = isa_spec
        self._target_desc = target_desc
        # NOTE: _line_parser is declared on the class but is not assigned here
        self._asm_patcher = _AsmPatcher()

    # ----------------------------------------------------------------------------------------------
    # Public Interface
    def parse_file(self,
                   asm_file: str,
                   generator: CodeGenerator,
                   elf_parser: ELFParser,
                   is_template: bool = False) -> TestCaseProgram:
        """
        Read a test case from a file, patch it to make it parsable (if necessary),
        create a complete TestCaseCode object based on it, and populate it with ELF data.

        This function is used instead of ProgramGenerator.create_test_case() when Revizor works
        with a user-provided test case. Hence, this function's output is expected to be
        equivalent to the output of ProgramGenerator.create_test_case().

        The patched copy of the input is written next to it, as `<asm_file>.patched.asm`.

        :param asm_file: path to the input assembly file to parse
        :param generator: an instance of ProgramGenerator object to assist in creating the test case
        :param elf_parser: an instance of ELFParser object to assist in creating the test case
        :param is_template: if True, the test case is not assembled and no ELF data is added
        :return: a fully constructed TestCaseCode object
        """
        # Snapshot the original file as ASMLine objects (numbered from zero)
        with open(asm_file, 'r') as f:
            original_lines = [_ASMLine(text, idx) for idx, text in enumerate(f)]

        # Patch the file to make it parsable, and map the patched lines back to the original
        patched_asm_file = asm_file + ".patched.asm"
        self._patch_asm(asm_file, patched_asm_file)
        patched_lines = self._update_lines_after_patch(patched_asm_file, original_lines)

        # Build a map of the code structure from the lines that contain code
        code_lines = self._get_clean_lines(patched_lines)
        code_map = _CodeMapBuilder().create_code_map(code_lines)

        # Create an empty test case with actors set up according to the configuration
        test_case = TestCaseProgram(patched_asm_file)
        generator.generate_actors_with_sections(test_case, CONF.get_actors_conf())

        # Fill the test case with the object representations of the parsed assembly
        self._fill_test_case_structure(test_case, code_map)
        assert len(test_case) > 0, "Default section not found"
        self._connect_control_flow(test_case)

        # Handle empty and trivial assembly files
        # NOTE(review): the condition indexes test_case[0][0] right after requiring
        # len(test_case[0]) == 0 - confirm that this is the intended check
        is_trivial = \
            len(test_case) == 1 and len(test_case[0]) == 0 and len(test_case[0][0]) == 0
        if is_trivial:
            self._handle_empty_test_case(test_case)

        # Perform final correctness checks
        self._check_test_case_correctness(test_case)

        # There is no point in assembling a template
        if is_template:
            return test_case

        # Assemble the test case and populate with ELF data
        # (the object file name is derived by replacing the last 4 characters of asm_file;
        # presumably a ".asm" extension is expected - confirm with callers)
        test_case.assign_obj(asm_file[:-4] + ".o")
        assemble(test_case)
        elf_parser.populate_elf_data(test_case.get_obj(), test_case)
        return test_case

    # ----------------------------------------------------------------------------------------------
    # Private: Assembly Patching
    def _patch_asm(self, asm_file: str, patched_asm_file: str) -> None:
        """
        Write a patched copy of `asm_file` to `patched_asm_file`; delegates to the patcher.
        """
        return self._asm_patcher.patch_asm(asm_file, patched_asm_file)

    def _update_lines_after_patch(self, patched_asm_file: str,
                                  org_lines: List[_ASMLine]) -> List[_ASMLine]:
        """
        Create a list of ASMLine objects from the patched assembly file, such that
        the line number correspond to the original assembly file if the line was not patched

        The patched file is expected to contain the original lines in their original order,
        with extra lines inserted by the patcher. Each patched line is compared with the next
        unmatched original line:
        - a non-empty original line matches a patched line that starts with it
          (the patcher only appends text, e.g., macro placeholders, to the original lines)
        - an empty original line matches only an empty patched line
        Lines inserted by the patcher, including those that follow the last original line,
        keep the line number 0.

        :param patched_asm_file: path to the patched assembly file
        :param org_lines: ASMLine objects created from the original file
        :return: list of ASMLine objects for the patched file, in file order
        """
        patched_lines = []
        n_org_lines = len(org_lines)
        org_line_num = 0
        with open(patched_asm_file, 'r') as patched:
            for patched_line_num, p_line in enumerate(patched):
                p_line = p_line.strip().lower()
                p_line_obj = _ASMLine(p_line, 0)
                p_line_obj.patched_line_num = patched_line_num

                # once all original lines are matched, the rest are patched-in lines
                if org_line_num < n_org_lines:
                    o_line_obj = org_lines[org_line_num]
                    o_line = o_line_obj.str.strip().lower()

                    # a plain substring test would let an empty or a short original line
                    # (e.g., "nop") match a line inserted by the patcher
                    is_same_line = p_line.startswith(o_line) if o_line else not p_line
                    if is_same_line:
                        p_line_obj.line_num = o_line_obj.line_num
                        org_line_num += 1

                patched_lines.append(p_line_obj)
        return patched_lines

    # ----------------------------------------------------------------------------------------------
    # Private: Line Parsing
    def _get_clean_lines(self, org_lines: List[_ASMLine]) -> List[_ASMLine]:
        """
        Select the lines that contain test case code.

        The input is validated first. Empty lines and lines starting with '#' or '/' are
        dropped, as well as the test case exit line and everything that follows it.

        :param org_lines: all lines of the (patched) assembly file
        :return: the remaining lines, in their original order
        """
        self._validate_dirty_lines(org_lines)

        kept = []
        for line_obj in org_lines:
            text = line_obj.str

            # comments and empty lines carry no code
            if not text or text[0] in ("#", "/"):
                continue

            # nothing after the test case exit is part of the test case
            if text[:16] == TC_EXIT_LINE:
                break

            kept.append(line_obj)

        return kept

    def _validate_dirty_lines(self, lines: List[_ASMLine]) -> None:
        """
        Check that the list of lines is well-formed.

        :param lines: all lines of the (patched) assembly file
        :return: None
        :raises AsmParserError: if the test case exit is missing, or if it is followed by
                a non-empty line that does not start with '.', '#' or '/'
        """
        exit_seen = False
        for line_obj in lines:
            text = line_obj.clean_str
            if not text:
                continue

            if text[:16] == TC_EXIT_LINE:
                exit_seen = True
            elif exit_seen and text[0] not in (".", "#", "/"):
                # only directives, labels and comments may follow the exit
                raise AsmParserError(line_obj.line_num,
                                     f"Found instructions after .test_case_exit: {line_obj.str}")

        if not exit_seen:
            raise AsmParserError(0, ".test_case_exit not found")

    def _parse_line(self, line: str, line_num: int) -> Instruction:
        """ Parse one assembly line into an Instruction; delegates to the line parser """
        return self._line_parser.parse_line(line, line_num)

    # ----------------------------------------------------------------------------------------------
    # Private: Building Test Case Structure
    def _fill_test_case_structure(self, test_case: TestCaseProgram, code_map: _CodeMap) -> None:
        """
        Populate the test case with the objects described by the code map.

        For every section in the map, the function creates its functions and basic blocks,
        parses the instruction lines, and stores control-flow instructions as terminators
        of their basic block. All terminators must be at the end of the basic block.

        :param test_case: the test case to be filled
        :param code_map: the code map representing the structure of the parsed assembly
        :return: None
        """
        for section_name, function_map in code_map.items():
            section = test_case.find_section(name=section_name)

            for func_name, bb_map in function_map.items():
                func = Function(func_name, section)
                section.append(func)

                for bb_name, inst_lines in bb_map.items():
                    bb = BasicBlock(bb_name, func)
                    func.append(bb)

                    seen_terminator = False
                    for line in inst_lines:
                        inst = self._parse_line(line.clean_str, line.line_num)
                        if inst.is_control_flow:
                            seen_terminator = True
                            bb.terminators.append(inst)
                        else:
                            # a regular instruction must not follow a terminator
                            assert not seen_terminator, \
                                f"Line {line.line_num}: Terminator not at the end of BB"
                            bb.insert_after(bb.get_last(), inst)

    def _connect_control_flow(self, test_case: TestCaseProgram) -> None:
        """
        Connect the basic blocks in the test case by following their terminators

        Successors are added for:
        - fallthrough: every basic block except the very first one becomes a successor
          of the basic block that precedes it (also across function boundaries), unless
          the last terminator of the preceding block is an unconditional branch
        - taken branches: the basic blocks named by the label operands of the terminators;
          calls are skipped
        - function exit: the last basic block of each function gets the exit basic block
          of the function as a successor

        :param test_case: the test case to connect
        :return: None
        """
        # connect basic blocks
        bb_names = {bb.name.lower(): bb for func in test_case.iter_functions() for bb in func}
        bb_names[TC_EXIT_LABEL] = test_case.get_tc_exit_bb()
        previous_bb = None
        for func in test_case.iter_functions():
            for bb in func:
                # fallthrough
                # (identity check: only the first BB has no predecessor; a truthiness test
                # would also skip a predecessor that evaluates to False)
                if previous_bb is not None:
                    # there is a fallthrough only if the last terminator is not a direct jump
                    if not previous_bb.terminators or \
                       not self._target_desc.is_unconditional_branch(previous_bb.terminators[-1]):
                        previous_bb.successors.append(bb)
                previous_bb = bb

                # taken branches
                for terminator in bb.terminators:
                    # skip calls as they target functions, not basic blocks
                    if self._target_desc.is_call(terminator):
                        continue

                    for op in terminator.operands:
                        if isinstance(op, LabelOp):
                            asm_parser_assert(op.value in bb_names, -1, "Unknown label " + op.value)
                            successor = bb_names[op.value]
                            bb.successors.append(successor)

            # last BB always falls through to the exit
            func[-1].successors.append(func.get_exit_bb())

    def _handle_empty_test_case(self, test_case: TestCaseProgram) -> None:
        """
        Give an empty test case a minimal body.

        A function `.function_0` with a single basic block `.bb_0` containing one NOP is
        appended to the first section of the test case; the basic block is connected
        to the exit basic block of the function.

        :param test_case: the test case to be filled
        :return: None
        """
        main_func = Function(".function_0", test_case.find_section(name="main"))
        test_case[0].append(main_func)

        entry_bb = BasicBlock(".bb_0", main_func)
        main_func.append(entry_bb)

        nop = Instruction("nop", "BASE-NOP")
        entry_bb.insert_after(entry_bb.get_last(), nop)
        entry_bb.successors.append(main_func.get_exit_bb())

    # ----------------------------------------------------------------------------------------------
    # Private: Correctness Checks
    def _check_test_case_correctness(self, test_case: TestCaseProgram) -> None:
        """
        Check that the TestCaseCode object created from the assembly file is correct

        Runs the checks of actor-switch landing sites, of the number of fault handlers,
        and of the placement of data permission changes.

        :param test_case: the test case to check
        :return: None
        """
        self._check_landing_sites(test_case)
        self._check_fault_handler(test_case)
        self._check_set_data_permission(test_case)

    def _check_landing_sites(self, test_case: TestCaseProgram) -> None:
        """ check that all actor switch macros have landing sites """
        # pylint: disable=too-many-branches
        # NOTE: there are many checks to be performed on the set_* family of macros, so
        # having many branches is expected

        switch_labels = [".set_k2u_target", ".set_u2k_target", ".set_h2g_target", ".set_g2h_target"]
        switches = []
        for func in test_case.iter_functions():
            for bb in func:
                for inst in bb:
                    if inst.name == "macro" and inst.operands[0].value in switch_labels:
                        switches.append(inst)

        for switch in switches:
            target = switch.operands[1].value.split(".")[2]
            for func in test_case.iter_functions():
                stripped_name = func.name[1:]
                if stripped_name == target:
                    target_function = func
                    break
            else:
                raise AsmParserError(-1, f"Macro {switch} targets a non-existing function")

            first_bb = target_function.get_first_bb()
            assert first_bb is not None, f"Macro {switch} targets a function without basic blocks"
            first_node = first_bb.get_first()
            assert first_node is not None, f"Macro {switch} targets a basic block without a landing"
            if not first_node.instruction.operands or \
               "landing" not in first_node.instruction.operands[0].value:
                raise AsmParserError(-1, f"{switch} does not target a landing site macro")
            target_name = first_node.instruction.operands[0].value

            if switch.operands[0].value == ".set_k2u_target" and target_name != ".landing_k2u":
                raise AsmParserError(switch.line_num(), f"{switch} does not target landing_k2u")
            if switch.operands[0].value == ".set_u2k_target" and target_name != ".landing_u2k":
                raise AsmParserError(switch.line_num(), f"{switch} does not target landing_u2k")
            if switch.operands[0].value == ".set_h2g_target" and target_name != ".landing_h2g":
                raise AsmParserError(switch.line_num(), f"{switch} does not target landing_h2g")
            if switch.operands[0].value == ".set_g2h_target" and target_name != ".landing_g2h":
                raise AsmParserError(switch.line_num(), f"{switch} does not target landing_g2h")

    def _check_fault_handler(self, test_case: TestCaseProgram) -> None:
        """ check that there is at most one fault handler """
        n_fault_handlers = 0
        for func in test_case.iter_functions():
            for bb in func:
                for inst in bb:
                    if inst.name == "macro" and inst.operands[0].value == ".fault_handler":
                        n_fault_handlers += 1
                    if n_fault_handlers > 1:
                        raise AsmParserError(inst.line_num(), "Found more than one fault handler")

    def _check_set_data_permission(self, test_case: TestCaseProgram) -> None:
        """ check that PT modification happens only in kernel host mode """
        for sec in test_case:
            owner = sec.owner
            for func in sec:
                for bb in func:
                    for inst in bb:
                        if inst.name == "macro" \
                           and inst.operands[0].value == ".set_data_permissions":
                            asm_parser_assert(
                                owner.privilege_level == ActorPL.KERNEL
                                and owner.mode == ActorMode.HOST, inst.line_num(),
                                "PT modification is allowed only in kernel host mode")


================================================
FILE: rvzr/cli.py
================================================
"""
File: Function definitions for using Revizor as command-line tool
(Note: the actual CLI is accessed via revizor.py)

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""

import os
import sys
from typing import TYPE_CHECKING, Any
from argparse import ArgumentParser, ArgumentTypeError, ArgumentDefaultsHelpFormatter

import unicorn

from .factory import get_minimizer, get_fuzzer, get_downloader
from .config import CONF
from .logs import update_logging_after_config_change

if TYPE_CHECKING:
    from .fuzzer import FuzzingMode


def _arg2bool(arg: Any) -> bool:
    """
    Convert a command-line argument into a boolean.

    Booleans are returned as is; otherwise, the argument is compared case-insensitively
    with the accepted spellings of true and false.

    :param arg: a boolean or a string
    :return: the boolean value of the argument
    :raises ArgumentTypeError: if the argument is not one of the accepted spellings
    """
    if isinstance(arg, bool):
        return arg

    truthy = ('yes', 'true', 't', 'y', '1')
    falsy = ('no', 'false', 'f', 'n', '0')
    token = arg.lower()
    if token in truthy:
        return True
    if token in falsy:
        return False
    raise ArgumentTypeError('Boolean value expected.')


def _add_campaign_size_arguments(subparser: ArgumentParser, default_workdir: str) -> None:
    """
    Register the options shared by `fuzz` and `tfuzz` that come before the
    test-case/template option: `-n`, `-i` and `-w`.

    :param subparser: the subcommand parser to extend
    :param default_workdir: default value of `--working-directory` for this subcommand
    """
    subparser.add_argument(
        "-n",
        "--num-test-cases",
        type=int,
        default=1,
        help="Number of test cases.",
    )
    subparser.add_argument(
        "-i",
        "--num-inputs",
        type=int,
        default=100,
        help="Number of inputs per test case.",
    )
    subparser.add_argument(
        '-w',
        '--working-directory',
        type=str,
        default=default_workdir,
    )


def _add_campaign_control_arguments(subparser: ArgumentParser) -> None:
    """
    Register the options shared by `fuzz` and `tfuzz` that come after the
    test-case/template option: `--timeout`, `--nonstop` and `--save-violations`.

    :param subparser: the subcommand parser to extend
    """
    subparser.add_argument(
        '--timeout',
        type=int,
        default=0,
        help="Run fuzzing with a time limit [seconds]. No timeout when set to zero.")
    subparser.add_argument(
        '--nonstop', action='store_true', help="Don't stop after detecting an unexpected result")
    subparser.add_argument(
        '--save-violations',
        type=_arg2bool,
        default=True,
        help="If set, store all detected violations in working directory.",
    )


def _add_minimizer_pass_arguments(subparser: ArgumentParser) -> None:
    """
    Register one boolean `--enable-*-pass` option per minimization pass.

    :param subparser: the `minimize` subcommand parser
    """
    # (option, enabled by default, help text); the order defines the order in `--help`
    passes = (
        ('--enable-instruction-pass', True,
         "Enable the instruction minimization pass that iteratively removes "
         "instructions while preserving the violation."),
        ('--enable-simplification-pass', False,
         "Enable the instruction simplification pass that replaces complex "
         "instructions with simpler ones while preserving the violation."),
        ('--enable-nop-pass', False,
         "Enable the NOP replacement pass that replaces instructions with NOPs "
         "while preserving the violation."),
        ('--enable-constant-pass', False,
         "Enable the constant simplification pass that replaces constants with 0s "
         "while preserving the violation."),
        ('--enable-mask-pass', False,
         "Enable the mask simplification pass that reduces the size of instrumentation "
         "masks while preserving the violation."),
        ('--enable-label-pass', True,
         "Enable the label removal pass that removes unused labels from the assembly file."),
        ('--enable-fence-pass', False,
         "Enable the fence insertion pass that adds LFENCEs after instructions "
         "while preserving the violation."),
        ('--enable-input-seq-pass', False,
         "Enable the input sequence minimization pass that removes inputs from "
         "the original generated sequence while preserving the violation."),
        ('--enable-input-diff-pass', False,
         "Enable the violating input difference minimization pass that removes "
         "inputs that do not contribute to the violation."),
        ('--enable-comment-pass', False,
         "Enable the violation comment pass that adds comments to the assembly file "
         "with details about the violation."),
    )
    for option, enabled_by_default, help_text in passes:
        subparser.add_argument(option, type=_arg2bool, default=enabled_by_default, help=help_text)


def _parse_args() -> Any:  # pylint: disable=r0915
    """
    Build the command-line interface and parse the arguments of the current process.

    The interface consists of the subcommands `fuzz`, `tfuzz`, `analyse`, `reproduce`,
    `minimize`, `generate` and `download_spec`; a subcommand is mandatory and its name is
    stored in `subparser_name`. All subcommands except `download_spec` also accept the common
    options `--config`, `--include-dir` and `--instruction-set`.

    :return: the namespace produced by `ArgumentParser.parse_args`
    """
    parser = ArgumentParser(add_help=False)
    subparsers = parser.add_subparsers(dest='subparser_name')
    subparsers.required = True

    # ==============================================================================================
    # Common arguments
    common_parser = ArgumentParser(add_help=False)
    common_parser.add_argument(
        "-c",
        "--config",
        type=str,
        required=False,
        help="Path to the configuration file (YAML) that will be used during fuzzing.",
    )
    common_parser.add_argument(
        "-I",
        "--include-dir",
        type=str,
        default=".",
        required=False,
        help="Path to the directory containing configuration files that are included by the main "
        "configuration file (received via --config).",
    )
    common_parser.add_argument(
        "-s",
        "--instruction-set",
        type=str,
        required=True,
        help="Path to the instruction set specification (JSON) file.",
    )

    # ==============================================================================================
    # Fuzzing
    parser_fuzz = subparsers.add_parser(
        'fuzz',
        add_help=True,
        parents=[common_parser],
        formatter_class=ArgumentDefaultsHelpFormatter)
    _add_campaign_size_arguments(parser_fuzz, default_workdir='.')
    parser_fuzz.add_argument(
        '-t',
        '--testcase',
        type=str,
        default=None,
        help="Use an existing test case [DEPRECATED - see reproduce]")
    _add_campaign_control_arguments(parser_fuzz)

    # ==============================================================================================
    # Template-based fuzzing
    parser_tfuzz = subparsers.add_parser(
        'tfuzz',
        add_help=True,
        parents=[common_parser],
        formatter_class=ArgumentDefaultsHelpFormatter)
    _add_campaign_size_arguments(parser_tfuzz, default_workdir='')
    parser_tfuzz.add_argument(
        '-t',
        '--template',
        type=str,
        required=True,
        help="The template to use for generating test cases")
    _add_campaign_control_arguments(parser_tfuzz)

    # ==============================================================================================
    # Standalone interface to trace analysis
    parser_analyser = subparsers.add_parser(
        'analyse',
        add_help=True,
        parents=[common_parser],
        formatter_class=ArgumentDefaultsHelpFormatter)
    parser_analyser.add_argument(
        '--ctraces',
        type=str,
        required=True,
    )
    parser_analyser.add_argument(
        '--htraces',
        type=str,
        required=True,
    )

    # ==============================================================================================
    # Reproducing violation
    parser_reproduce = subparsers.add_parser(
        'reproduce',
        add_help=True,
        parents=[common_parser],
        formatter_class=ArgumentDefaultsHelpFormatter)
    parser_reproduce.add_argument(
        '-t',
        '--testcase',
        type=str,
        default=None,
        required=True,
        help="Path to the test case",
    )
    parser_reproduce.add_argument(
        '-i',
        '--inputs',
        type=str,
        nargs='*',
        default=None,
        help="Path to the directory with inputs")
    parser_reproduce.add_argument(
        "-n",
        "--num-inputs",
        type=int,
        default=100,
        help="Number of inputs per test case. [IGNORED if --inputs is set]",
    )

    # ==============================================================================================
    # Postprocessing interface
    parser_mini = subparsers.add_parser(
        'minimize',
        add_help=True,
        parents=[common_parser],
        help="Minimize a test case by executing a series of minimization passes. "
        "The set of passes is controlled via CLI arguments.",
        formatter_class=ArgumentDefaultsHelpFormatter)
    parser_mini.add_argument(
        '--testcase',
        '-t',
        type=str,
        required=True,
        help="Path to the test case program that needs to be minimized.",
    )
    parser_mini.add_argument(
        "-i",
        "--num-inputs",
        type=int,
        required=True,
        help="Number of inputs to the program that will be used during minimization.",
    )
    parser_mini.add_argument(
        '--testcase-outfile',
        '-o',
        type=str,
        required=True,
        help="Output path for the minimized test case program.",
    )
    parser_mini.add_argument(
        '--input-outdir',
        type=str,
        default=None,
        help="Output directory for storing minimized inputs.",
    )
    parser_mini.add_argument(
        '--num-attempts',
        type=int,
        default=1,
        help="Number of attempts to minimize the test case.",
    )
    _add_minimizer_pass_arguments(parser_mini)

    # ==============================================================================================
    # Standalone interface to test case generation
    parser_generator = subparsers.add_parser(
        'generate',
        add_help=True,
        parents=[common_parser],
        formatter_class=ArgumentDefaultsHelpFormatter)
    parser_generator.add_argument(
        "-r",
        "--seed",
        type=int,
        default=0,
        help="Add seed to generate test case.",
    )
    parser_generator.add_argument(
        "-n",
        "--num-test-cases",
        type=int,
        default=5,
        help="Number of test cases.",
    )
    parser_generator.add_argument(
        "-i",
        "--num-inputs",
        type=int,
        default=100,
        help="Number of inputs per test case.",
    )
    parser_generator.add_argument(
        '-w',
        '--working-directory',
        type=str,
        default='',
    )
    parser_generator.add_argument(
        '--permit-overwrite',
        action='store_true',
    )

    # ==============================================================================================
    # Loading of ISA specs
    # NOTE: this subcommand deliberately does not inherit the common arguments
    parser_get_isa = subparsers.add_parser('download_spec', add_help=True)
    parser_get_isa.add_argument("-a", "--architecture", type=str, required=True)
    parser_get_isa.add_argument(
        '--outfile',
        '-o',
        type=str,
        required=True,
    )
    parser_get_isa.add_argument("--extensions", nargs="*", default=[])
    return parser.parse_args()


def main() -> int:  # pylint: disable=r0911,r0912,r0915  # this function is necessarily complex
    """
    Parse command-line arguments and launch the fuzzer in the requested mode.

    The function first applies the configuration file (if given), then validates the
    file/directory arguments and the installed Unicorn version, and finally dispatches
    to the handler of the selected subcommand.

    :return: the exit code of the process: the code reported by the fuzzer for `fuzz`,
             `tfuzz` and `reproduce`; otherwise 0 on success and 1 if the validation of
             the arguments or of the environment fails
    """
    args = _parse_args()

    # Update configuration
    if getattr(args, 'config', None):
        CONF.load(args.config, args.include_dir)
    if getattr(args, 'testcase', None):
        CONF.disable_generation()
    update_logging_after_config_change()

    # Check if the file and directory arguments are valid
    # (getattr is used because not every subcommand defines every argument)
    if getattr(args, 'testcase', None) and not os.path.isfile(args.testcase):
        print("[ERROR]", f"The test case file `{args.testcase}` does not exist")
        return 1
    if getattr(args, 'working_directory', None) and not os.path.isdir(args.working_directory):
        print("[ERROR]", f"The working directory `{args.working_directory}` does not exist")
        return 1
    if (getattr(args, 'enable_input_seq_pass', None)
        or getattr(args, 'enable_input_diff_pass', None)) \
            and not args.input_outdir:
        print(
            "[ERROR]", "Passes --enable-input-seq-pass and --enable-input-diff-pass "
            "require flag --input-outdir to be set.")
        return 1

    # Enforce the Unicorn version: New versions of Unicorn have a bug that causes false positives
    # in the fuzzer. This is a temporary workaround until the bug is fixed.
    if unicorn.__version__ != '1.0.3' and CONF.instruction_set == 'x86-64':  # type: ignore
        print(
            "[ERROR]", "The fuzzer requires Unicorn version 1.0.3. Please install it using "
            "`pip install unicorn==1.0.3`.")
        return 1

    # Fuzzing
    if args.subparser_name in ('fuzz', 'tfuzz'):
        # `fuzz` optionally receives a ready test case; `tfuzz` always receives a template
        testcase = args.testcase if args.subparser_name == 'fuzz' else args.template
        fuzzer = get_fuzzer(args.instruction_set, args.working_directory, testcase, None)
        type_: FuzzingMode
        if args.subparser_name == 'tfuzz':
            type_ = 'template'
        elif testcase:
            type_ = 'asm'
        else:
            type_ = 'random'
        exit_code = fuzzer.start(
            args.num_test_cases,
            args.num_inputs,
            args.timeout,
            args.nonstop,
            args.save_violations,
            type_=type_)
        return exit_code

    # Reproducing a violation
    if args.subparser_name == 'reproduce':
        fuzzer = get_fuzzer(args.instruction_set, "", args.testcase, args.inputs)
        exit_code = fuzzer.start(1, args.num_inputs, 0, False, False, type_='asm')
        return exit_code

    # Stand-alone generation
    if args.subparser_name == "generate":
        fuzzer = get_fuzzer(args.instruction_set, args.working_directory, "", None)
        fuzzer.standalone_generate(args.seed, args.num_test_cases, args.num_inputs,
                                   args.permit_overwrite)
        return 0

    # Trace analysis
    if args.subparser_name == 'analyse':
        fuzzer = get_fuzzer(args.instruction_set, "", "", None)
        fuzzer.standalone_analyse(args.ctraces, args.htraces)
        return 0

    # Test case minimization
    # (the dependency of the input passes on --input-outdir was already validated above)
    if args.subparser_name == "minimize":
        fuzzer = get_fuzzer(args.instruction_set, "", args.testcase, None)
        minimizer = get_minimizer(fuzzer, args.instruction_set)
        minimizer.run(
            test_case_asm=args.testcase,
            n_inputs=args.num_inputs,
            test_case_outfile=args.testcase_outfile,
            input_outdir=args.input_outdir,
            n_attempts=args.num_attempts,
            enable_instruction_pass=args.enable_instruction_pass,
            enable_simplification_pass=args.enable_simplification_pass,
            enable_nop_pass=args.enable_nop_pass,
            enable_constant_pass=args.enable_constant_pass,
            enable_mask_pass=args.enable_mask_pass,
            enable_label_pass=args.enable_label_pass,
            enable_fence_pass=args.enable_fence_pass,
            enable_input_seq_pass=args.enable_input_seq_pass,
            enable_input_diff_pass=args.enable_input_diff_pass,
            enable_comment_pass=args.enable_comment_pass,
        )
        return 0

    # Download of the ISA specification
    if args.subparser_name == "download_spec":
        get_downloader(args.architecture, args.extensions, args.outfile).run()  # type: ignore
        return 0

    print("[ERROR]", "Invalid subcommand")
    return 1


# Refuse direct execution: report the error and terminate with a non-zero exit code
if __name__ == '__main__':
    print("[ERROR]", "This file is not meant to be run directly. Use `revizor.py` instead.")
    sys.exit(1)


================================================
FILE: rvzr/code_generator.py
================================================
"""
File: Test Case Generation

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from __future__ import annotations

import random
import re
from typing import TYPE_CHECKING, List, Tuple, Optional, Final, Callable, Dict, TextIO, Iterable
from subprocess import CalledProcessError, run
from copy import deepcopy
from abc import ABC, abstractmethod

from .tc_components.actor import Actor
from .tc_components.instruction import Instruction, RegisterOp, FlagsOp, MemoryOp, \
    ImmediateOp, AgenOp, LabelOp, CondOp, AnyOperand
from .tc_components.test_case_code import TestCaseProgram, Function, BasicBlock, CodeSection, \
    TC_EXIT_LABEL
from .instruction_spec import OT
from .logs import GeneratorLogger, error, inform
from .config import CONF, ActorsConf

if TYPE_CHECKING:
    from .tc_components.test_case_code import InstructionNode
    from .target_desc import TargetDesc
    from .asm_parser import AsmParser
    from .instruction_spec import InstructionSpec, OperandSpec
    from .isa_spec import InstructionSet
    from .elf_parser import ELFParser


# ==================================================================================================
# Interfaces and common functionality of ISA-specific service classes
# ==================================================================================================
class Pass(ABC):
    """
    Interface to an instrumentation pass that modifies a generated test case.

    Concrete passes subclass this interface and implement `run_on_test_case`.
    """

    @abstractmethod
    def run_on_test_case(self, test_case: TestCaseProgram) -> None:
        """
        Run the pass on all instructions in a given test case.

        :param test_case: The test case to be processed by the pass
        """


class Printer(ABC):
    """
    Base class of the ISA-specific assembly printers. A printer serializes a test case
    into an assembly file; the subclasses define how individual instructions, operands,
    and macros are rendered.
    """

    prologue_template: List[str]
    """ Lines written verbatim at the very beginning of the assembly file """

    epilogue_template: List[str]
    """ Lines written verbatim at the very end of the assembly file """

    def __init__(self, target_desc: TargetDesc) -> None:
        self.target_desc = target_desc

    def print(self, test_case: TestCaseProgram) -> None:
        """
        Write the assembly representation of a test case into the file returned by
        `test_case.asm_path()`. The file contains the prologue, all sections of
        the test case, and the epilogue, in this order.

        :param test_case: The test case to print
        """
        with open(test_case.asm_path(), "w") as asm:
            asm.writelines(self.prologue_template)
            for sec in test_case:
                self._print_section(sec, asm)
            asm.writelines(self.epilogue_template)

    def _print_section(self, sec: CodeSection, file_: TextIO) -> None:
        """ Emit the section directive followed by all functions of the section """
        file_.write(f".section .data.{sec.name}\n")
        for function in sec:
            self._print_function(function, file_)

    def _print_function(self, func: Function, file_: TextIO) -> None:
        """ Emit the function label, its basic blocks, and finally its exit basic block """
        file_.write(f"{func.name}:\n")
        for block in func:
            self._print_basic_block(block, file_)

        # the exit block is not part of the iteration above and is printed last
        self._print_basic_block(func.get_exit_bb(), file_)

    def _print_basic_block(self, bb: BasicBlock, file_: TextIO) -> None:
        """ Emit the lower-cased block label, then the body instructions and the terminators """
        file_.write(f"{bb.name.lower()}:\n")
        file_.writelines(self._instruction_to_str(body_inst) + "\n" for body_inst in bb)
        file_.writelines(self._instruction_to_str(term) + "\n" for term in bb.terminators)

    @abstractmethod
    def _instruction_to_str(self, inst: Instruction) -> str:
        """ Render an instruction object as a line of assembly """

    @abstractmethod
    def _operand_to_str(self, op: AnyOperand) -> str:
        """ Render an operand object as assembly text """

    @abstractmethod
    def _macro_to_str(self, inst: Instruction) -> str:
        """ Render a macro instruction object as assembly text """


# ==================================================================================================
# ISA-independent Code Generator
# ==================================================================================================
class CodeGenerator(ABC):
    """
    Generator of test case code; the part of the implementation shared by all ISAs.

    The ISA-specific subclasses are expected to provide the instrumentation passes
    (`_passes`) and the assembly printer (`_printer`).
    """

    _instruction_set: InstructionSet  # Specification of the tested instruction set
    _target_desc: TargetDesc  # Description of the tested architecture
    _asm_parser: AsmParser  # Parser for assembly files
    _elf_parser: ELFParser  # Parser for ELF files
    _passes: List[Pass]  # List of passes to run on the generated test case; set by subclasses
    _printer: Printer  # Printer for the generated test case; set by subclasses

    _state: int = 0  # Current seed value
    _cached_template: Optional[TestCaseProgram] = None  # Parsed template assembly file

    _function_generator: Final[_FunctionGenerator]
    _instruction_generator: Final[_InstructionGenerator]

    __log: Final[GeneratorLogger]

    def __init__(self, seed: int, instruction_set: InstructionSet, target_desc: TargetDesc,
                 asm_parser: AsmParser, elf_parser: ELFParser) -> None:
        self._instruction_set = instruction_set
        self._target_desc = target_desc
        self._asm_parser = asm_parser
        self._elf_parser = elf_parser
        self._set_seed(seed)

        self.__log = GeneratorLogger()
        self.__log.dbg_dump_instruction_pool(instruction_set.instructions)
        self._passes = []

        self._function_generator = _FunctionGenerator(self._target_desc, instruction_set)
        self._instruction_generator = _InstructionGenerator(self._target_desc)

    # ----------------------------------------------------------------------------------------------
    # Public Interface
    def create_test_case(self, asm_file: str, disable_assembler: bool = False) -> TestCaseProgram:
        """
        Create a random test case and print it into an assembly file. Unless the assembler
        is disabled, the file is also assembled into an object file and the generator
        state (seed) is advanced.

        :param asm_file: path to the output assembly file; 'generated.asm' is used if empty
        :param disable_assembler: if True, return right after printing the assembly file
        :return: the generated test case object
        """
        asm_file = asm_file or 'generated.asm'
        program = TestCaseProgram(asm_file, seed=self._state)

        # actors and their (still empty) sections
        actors_conf: ActorsConf = CONF.get_actors_conf()
        if len(actors_conf) != 1:
            error("Generation of test cases with multiple actors is not yet supported")
        self.generate_actors_with_sections(program, actors_conf)

        # the main function is built empty first, and then filled with random instructions
        main_section = program[0]
        assert main_section.owner.is_main
        entry_function = self._function_generator.generate_empty(".function_0", main_section)
        self._function_generator.fill_function(entry_function)

        # the function belongs to the first section of the test case
        program[0].append(entry_function)

        # instrumentation
        for instrumentation in self._passes:
            instrumentation.run_on_test_case(program)

        # symbols required in every test case
        self._add_required_symbols(program)

        self._printer.print(program)

        if not disable_assembler:
            program.assign_obj(asm_file[:-4] + ".o")
            assemble(program)
            self._elf_parser.populate_elf_data(program.get_obj(), program)
            self._update_state()
        return program

    def create_test_case_from_template(self, template_file: str) -> TestCaseProgram:
        """
        Create a test case from a template: the random-instruction macros of the template
        are replaced with generated instructions, the instrumentation passes are applied,
        and the result is printed into 'generated.asm' and assembled.

        The template file is parsed only on the first call; later calls start from a copy
        of the cached parsing result.

        :param template_file: The path to the template file
        :return: The generated test case object
        :raises FileNotFoundError: if the template file does not exist
        :raises CalledProcessError: if the assembler fails to assemble the test case
        """
        # obtain a fresh TestCaseProgram that mirrors the template
        if not self._cached_template:
            test_case = self._asm_parser.parse_file(
                template_file, self, self._elf_parser, is_template=True)
            test_case.generator_seed = self._state
            self._cached_template = deepcopy(test_case)
        else:
            test_case = deepcopy(self._cached_template)
            test_case.generator_seed = self._state

        # everything present at this point originates from the template; mark it so
        for function in test_case.iter_functions():
            for block in function:
                for template_inst in block:
                    template_inst.is_from_template = True

        # expansion; the seed is re-applied in case other modules touched the random state
        self._set_seed(self._state)
        self._expand_template(test_case, CONF.get_actors_conf())
        for instrumentation in self._passes:
            instrumentation.run_on_test_case(test_case)

        # print the assembly file and build the object file from it
        asm_file = 'generated.asm'
        test_case.reassign_asm_file(asm_file)
        self._printer.print(test_case)

        test_case.assign_obj(asm_file[:-4] + ".o")
        assemble(test_case)
        self._elf_parser.populate_elf_data(test_case.get_obj(), test_case)

        self._update_state()
        return test_case

    def generate_actors_with_sections(self, test_case: TestCaseProgram,
                                      actors_dict: ActorsConf) -> None:
        """
        Stand-alone interface that builds an actor from each entry of the configuration and
        adds it, together with its section, to the test case.

        NOTE: The sections are left *empty*; i.e., this method creates no functions,
        basic blocks, or instructions.

        :param test_case: The test case to which the actors will be added
        :param actors_dict: The configuration of the actors
        :return: None
        """
        for actor_name, actor_conf in actors_dict.items():
            new_actor = Actor.from_dict(actor_conf, self._target_desc)

            if actor_name != "main":
                # non-main actors must not exist yet
                test_case.add_actor_with_section(new_actor)
                continue

            # the main actor exists by default and thus has to be overwritten
            test_case.add_actor_with_section(new_actor, allow_overwrite=True)

    def generate_instruction(self,
                             spec: InstructionSpec,
                             is_instrumentation: Optional[bool] = None) -> Instruction:
        """
        Stand-alone interface to generate a random instruction based on the specification.

        :param spec: The specification of the instruction
        :param is_instrumentation: forwarded to the instruction generator when given;
               when None, the default of the instruction generator applies
        :return: The generated instruction
        """
        generator = self._instruction_generator
        if is_instrumentation is not None:
            return generator.generate(spec, is_instrumentation)
        # the argument is omitted on purpose so that the generator's own default is used
        return generator.generate(spec)

    # ----------------------------------------------------------------------------------------------
    # Private: Seed Management
    def _set_seed(self, seed: int) -> None:
        """
        Set the seed used to generate test programs and re-seed the `random` module with it.
        A zero seed is replaced with a randomly chosen value.

        :param seed: The seed value
        """
        if seed == 0:
            seed = random.randint(1, 1000000)
            inform("prog_gen", f"Setting program_generator_seed to random value: {seed}")
        self._state = seed
        random.seed(self._state)

    def _update_state(self) -> None:
        """ Move on to the next seed value and re-seed the `random` module with it """
        self._state += 1
        random.seed(self._state)

    # ----------------------------------------------------------------------------------------------
    # Private: Misc.
    def _add_required_symbols(self, test_case: TestCaseProgram) -> None:
        """
        Insert the `.measurement_start` macro at the beginning of the first basic block of
        the main function and the `.measurement_end` macro at the end of its exit block.
        """

        def marker(label: str) -> Instruction:
            return Instruction("macro", category="MACRO") \
                .add_op(LabelOp(label)) \
                .add_op(LabelOp(".noarg"))

        main_section = test_case[0]
        assert main_section.owner.is_main
        main_function = main_section[0]

        entry_bb = main_function[0]
        start_macro = marker(".measurement_start")
        entry_bb.insert_before(entry_bb.get_first(), start_macro)

        exit_bb = main_function.get_exit_bb()
        end_macro = marker(".measurement_end")
        exit_bb.insert_after(exit_bb.get_last(), end_macro)

    def _expand_template(self, test_case: TestCaseProgram, actors_config: ActorsConf) -> None:
        """
        Replace each `.random_instructions` macro of the test case with randomly generated
        instructions. The instruction count and the number of memory accesses are parsed
        from the second operand of the macro; instructions from the blocklist of the owning
        actor are never generated.
        """
        pending: List[Tuple[InstructionNode, str]] = []

        # pass 1: collect the macros (the blocks are not modified while being iterated)
        for block in test_case.iter_basic_blocks():
            for candidate in block.iter_nodes():
                macro = candidate.instruction
                if macro.name != "macro":
                    continue
                if macro.operands[0].value != ".random_instructions":
                    continue
                pending.append((candidate, block.get_owner().name))

        # pass 2: substitute the collected macros
        for macro_node, owner_name in pending:
            parent_bb = macro_node.parent
            fields = macro_node.instruction.operands[1].value.split(".")
            assert 3 <= len(fields) <= 5
            n_instr = int(fields[1])
            n_mem = int(fields[2])

            # instruction pools available to the owning actor
            blocklist = actors_config[owner_name]["instruction_blocklist"]
            allowed_non_memory = [
                spec for spec in self._instruction_set.non_memory_access_specs
                if spec.name not in blocklist
            ]
            allowed_stores = [
                spec for spec in self._instruction_set.store_instructions
                if spec.name not in blocklist
            ]
            allowed_loads = [
                spec for spec in self._instruction_set.load_instruction
                if spec.name not in blocklist
            ]

            # the macro goes away and the generated instructions take its place
            parent_bb.delete(macro_node)
            for _ in range(n_instr):
                generated = self._instruction_generator.generate_from_random_spec(
                    non_memory_access_instructions=allowed_non_memory,
                    store_instructions=allowed_stores,
                    load_instructions=allowed_loads,
                    memory_access_probability=n_mem / n_instr)
                if macro_node.previous:
                    parent_bb.insert_after(macro_node.previous, generated)
                else:
                    parent_bb.insert_before(parent_bb.get_first(), generated)


def assemble(test_case: TestCaseProgram) -> None:
    """
    Assemble the assembly file of a test case into its object file by invoking `as`,
    and mark the object container of the test case as assembled.

    Errors reported by the assembler are printed (annotated with the offending source lines
    when possible) and terminate the process; warnings are printed and do not stop execution.

    :param test_case: The test case to be assembled; it provides the path to the assembly
           file (`asm_path()`) and the object container (`get_obj()`)
    :raises SystemExit: with exit code 1 if the assembler cannot be started or fails
    """
    asm_file = test_case.asm_path()
    obj_container = test_case.get_obj()
    obj_file = obj_container.obj_path

    def pretty_error_msg(error_msg: str) -> str:
        """ Extend each assembler message with the source line it refers to """
        with open(asm_file, "r") as f:
            lines = f.read().split("\n")

        msg = "Error appeared while assembling the test case:\n"
        for line in error_msg.split("\n"):
            line = line.removeprefix(asm_file + ":")
            line_num_match = re.search(r"(\d+):", line)
            if not line_num_match:
                msg += line
                continue

            msg += f"\n  Line {line}"
            # the matched number is not guaranteed to be a valid line number of the file
            line_idx = int(line_num_match.group(1)) - 1
            if 0 <= line_idx < len(lines):
                msg += f"\n    (the line was parsed as {lines[line_idx]})"
        return msg

    try:
        # The arguments are passed as a list (i.e., without a shell) so that paths containing
        # spaces or shell metacharacters reach the assembler unmodified
        out = run(["as", asm_file, "-o", obj_file], check=True, capture_output=True)
    except CalledProcessError as e:
        error_msg = e.stderr.decode()
        if "Assembler messages:" in error_msg:
            print(pretty_error_msg(error_msg))
        else:
            print(error_msg)
        raise SystemExit(1) from e
    except OSError as e:
        # without a shell, a missing or non-executable assembler is reported as an OSError
        print(f"Failed to run the assembler `as`: {e}")
        raise SystemExit(1) from e

    # a successful run may still produce warnings
    output = out.stderr.decode()
    if "Assembler messages:" in output:
        print("WARNING: [generator]" + pretty_error_msg(output))

    obj_container.mark_as_assembled()

# ==================================================================================================
# Private Service Classes
# ==================================================================================================
class _FunctionGenerator:
    """ Service class that builds randomly-shaped functions and fills them with instructions """

    _instruction_generator: _InstructionGenerator
    _isa_spec: InstructionSet

    def __init__(self, target_desc: TargetDesc, isa_spec: InstructionSet) -> None:
        self._isa_spec = isa_spec
        self._instruction_generator = _InstructionGenerator(target_desc)

    def generate_empty(self, label: str, parent: CodeSection) -> Function:
        """
        Create a function whose basic blocks are connected into a random DAG but contain
        no instructions yet
        :param label: label (name) of the new function
        :param parent: code section that owns the function
        :return: the new function
        """
        func = Function(label, parent)

        # Bounds on the number of successors of a BB; never more than two, and exactly one
        # when the ISA has no conditional branches
        if self._isa_spec.has_conditional_branch:
            max_successors = min(CONF.max_successors_per_bb, 2)
            min_successors = min(CONF.min_successors_per_bb, 2)
            assert min_successors <= max_successors, "min_successors_per_bb > max_successors_per_bb"
        else:
            max_successors = min_successors = 1

        # Pick the number of basic blocks; no random number is drawn when the range is trivial
        lower, upper = CONF.min_bb_per_function, CONF.max_bb_per_function
        node_count = lower if lower == upper else random.randint(lower, upper)
        func_name = label.removeprefix(".function_")
        nodes = [BasicBlock(f".bb_{func_name}.{i}", func) for i in range(node_count)]

        # Wire the blocks together; edges only point forward, so the result is acyclic
        last_index = node_count - 1
        for i, current_bb in enumerate(nodes):
            if i == last_index:
                # the final block can only continue to the function exit
                current_bb.successors = [func.get_exit_bb()]
                break

            # random fan-out, clamped to the number of targets still available ahead
            successor_count = min(random.randint(min_successors, max_successors), node_count - i)

            # the first successor is always the following block, so no block is unreachable
            current_bb.successors.append(nodes[i + 1])

            # remaining successors are drawn without repetition from the later blocks and the exit
            candidates = nodes[i + 2:] + [func.get_exit_bb()]
            for _ in range(successor_count - 1):
                picked = random.choice(candidates)
                candidates.remove(picked)
                current_bb.successors.append(picked)

        # Function returns are not yet supported,
        # so the exit block terminates with an unconditional jump to the test case exit
        exit_jump = self._instruction_generator.generate(
            self._isa_spec.get_unconditional_jump_spec())
        assert isinstance(exit_jump.operands[0], LabelOp)
        exit_jump.operands[0].value = TC_EXIT_LABEL
        func.get_exit_bb().terminators = [exit_jump]

        # Attach the blocks to the function
        func.extend(nodes)
        return func

    def fill_function(self, func: Function) -> None:
        """
        Populate an (assumed empty) function: first the terminators, then random instructions
        :param func: the function to fill
        :return: None
        :raises AssertionError: if the function is not empty
        :raises NotImplementedError: if one of the basic blocks has more than two successors
        """
        self._add_terminators_in_function(func)
        self._add_instructions_in_function(func)

    def _add_terminators_in_function(self, func: Function) -> None:
        """
        Append branch instructions to each basic block according to its successors
        :param func: the function to process
        :return: None
        :raises AssertionError: if a basic block already has terminators
        :raises NotImplementedError: if a basic block has more than two successors
        """

        def append_jump(block: BasicBlock, destination: BasicBlock) -> None:
            # unconditional branch from `block` to `destination`
            jump = self._instruction_generator.generate(
                self._isa_spec.get_unconditional_jump_spec())
            target = jump.get_label_operand()
            assert target is not None
            target.value = destination.name
            block.terminators.append(jump)

        for bb in func:
            assert not bb.terminators, "Basic block already has terminators"
            n_successors = len(bb.successors)

            if n_successors > 2:
                raise NotImplementedError("Indirect jumps/calls are not yet supported")

            if n_successors == 0:
                # Return instruction
                continue

            if n_successors == 1:
                only_successor = bb.successors[0]
                # no branch is inserted towards the exit:
                # the last basic block always falls through implicitly
                if not only_successor.is_exit:
                    append_jump(bb, only_successor)
                continue

            # two successors: a conditional branch to the first one,
            # followed by an unconditional branch to the second one
            branch = self._instruction_generator.generate(
                random.choice(self._isa_spec.cond_branches))
            branch_target = branch.get_label_operand()
            assert branch_target
            branch_target.value = bb.successors[0].name
            bb.terminators.append(branch)
            append_jump(bb, bb.successors[1])

    def _add_instructions_in_function(self, func: Function) -> None:
        """
        Insert CONF.program_size random instructions into the function.
        Each instruction goes to a uniformly-selected basic block, hence all blocks
        end up with roughly the same number of instructions
        :param func: the function to fill
        :return: None
        :raises AssertionError: if one of the basic blocks is not empty
        """
        blocks: List[BasicBlock] = list(func)
        assert all(len(block) == 0 for block in blocks), "Basic blocks are not empty"
        isa = self._isa_spec
        for _ in range(CONF.program_size):
            chosen_bb = random.choice(blocks)
            new_inst = self._instruction_generator.generate_from_random_spec(
                isa.non_memory_access_specs,
                isa.store_instructions,
                isa.load_instruction,
                CONF.avg_mem_accesses / CONF.program_size,
            )
            chosen_bb.insert_after(chosen_bb.get_last(), new_inst)


class _InstructionGenerator:
    """
    Service class that creates random instruction objects from instruction specifications
    """

    _operand_generator: _OperandGenerator

    def __init__(self, target_desc: TargetDesc) -> None:
        self._operand_generator = _OperandGenerator(target_desc)

    def generate(self, spec: InstructionSpec, is_instrumentation: bool = False) -> Instruction:
        """
        Build an instruction for the given specification, with randomly generated operands
        :param spec: The specification of the instruction
        :param is_instrumentation: Whether to label the instruction as instrumentation
        :return: The generated instruction
        """
        inst = Instruction.from_spec(spec, is_instrumentation=is_instrumentation)
        make_operand = self._operand_generator.generate

        # explicit operands first, in the order given by the spec
        for explicit_spec in spec.operands:
            new_operand = make_operand(explicit_spec, inst)
            inst.operands.append(new_operand)

        # then the implicit ones
        for implicit_spec in spec.implicit_operands:
            new_operand = make_operand(implicit_spec, inst)
            inst.implicit_operands.append(new_operand)

        return inst

    def generate_from_random_spec(self,
                                  non_memory_access_instructions: List[InstructionSpec],
                                  store_instructions: List[InstructionSpec],
                                  load_instructions: List[InstructionSpec],
                                  memory_access_probability: float = 0.0) -> Instruction:
        """
        Generate an instruction from a randomly-selected specification
        :param non_memory_access_instructions: The list of available non-memory access instructions
        :param store_instructions: The list of available store instructions
        :param load_instructions: The list of available load instructions
        :param memory_access_probability: Probability of selecting a memory access
            (a store or a load) instead of a non-memory-access instruction
        :return: The generated instruction
        """
        # the first draw decides whether this will be a memory access;
        # it is what enforces the requested avg. number of mem. accesses
        if random.random() < memory_access_probability:
            # stores (when available) get a 50% share; the second draw happens only if
            # there is at least one store to choose from
            use_store = bool(store_instructions) and random.random() < 0.5
            pool = store_instructions if use_store else load_instructions
        else:
            pool = non_memory_access_instructions

        return self.generate(random.choice(pool))


class _OperandGenerator:
    """
    Service class that creates random operand objects from operand specifications
    """

    def __init__(self, target_desc: TargetDesc) -> None:
        self.target_desc = target_desc

    def generate(self, spec: OperandSpec, parent: Instruction) -> AnyOperand:
        """
        Create a random operand that follows the specification
        :param spec: specification of the operand
        :param parent: instruction for which the operand is generated
        :return: the generated operand
        :raises KeyError: if there is no generator for the operand type
        """
        dispatch: Dict[OT, Callable[[OperandSpec, Instruction], AnyOperand]] = {
            OT.REG: self._generate_reg_operand,
            OT.MEM: self._generate_mem_operand,
            OT.IMM: self._generate_imm_operand,
            OT.LABEL: self._generate_label_operand,
            OT.AGEN: self._generate_agen_operand,
            OT.FLAGS: self._generate_flags_operand,
            OT.COND: self._generate_cond_operand,
        }
        handler = dispatch[spec.type]
        return handler(spec, parent)

    def _generate_reg_operand(self, spec: OperandSpec, _: Instruction) -> RegisterOp:
        # the register is drawn from the values listed in the spec
        reg_name = random.choice(spec.values)
        return RegisterOp(reg_name, spec.width, spec.src, spec.dest)

    def _generate_mem_operand(self, spec: OperandSpec, _: Instruction) -> MemoryOp:
        # values listed in the spec take precedence over the target-wide index registers
        candidates = spec.values or self.target_desc.mem_index_registers
        return MemoryOp(random.choice(candidates), spec.width, spec.src, spec.dest)

    def _generate_imm_operand(self, spec: OperandSpec, inst: Instruction) -> ImmediateOp:
        if not spec.values:
            # no constraints in the spec: any value representable in the operand width
            if spec.is_signed:
                half_range = pow(2, spec.width - 1)
                lowest, highest = half_range * -1, half_range - 1
            else:
                lowest, highest = 0, pow(2, spec.width) - 1
            return ImmediateOp(str(random.randint(lowest, highest)), spec.width)

        first_value = spec.values[0]

        # bitmask immediates have a dedicated generator
        if first_value == "bitmask":
            return self._generate_bitmask_operand(spec, inst)

        # a predefined list of values
        if "[" not in first_value:
            options: Iterable[str] | Iterable[int]
            try:
                options = [int(v) for v in spec.values]
            except ValueError:
                # handle non-digit immediates (e.g., dsb SY in ARM64)
                options = list(spec.values)
            return ImmediateOp(str(random.choice(options)), spec.width)

        # a predefined range, written as "[<min>-<max>]"
        assert "[" in first_value, f"Invalid IMM spec for instruction: {inst}"
        bounds = first_value[1:-1].split("-")
        if bounds[0] == "":
            # a leading minus sign was consumed by the split; re-attach it to the lower bound
            bounds = bounds[1:]
            bounds[0] = "-" + bounds[0]
        assert len(bounds) == 2
        in_range = random.randint(int(bounds[0]), int(bounds[1]))
        return ImmediateOp(str(in_range), spec.width)

    def _generate_bitmask_operand(self, spec: OperandSpec, _: Instruction) -> ImmediateOp:
        assert CONF.instruction_set == "arm64"
        width = spec.width

        # size of the repeated element is a power of two: up to 64 bits for 64-bit operands,
        # up to 32 bits otherwise
        element_size = 2**random.randint(1, 6 if width == 64 else 5)
        # the element is a run of zeros followed by a run of ones; both runs are non-empty
        ones_count = random.randint(1, element_size - 1)
        rotation = random.randint(0, width - 1)

        element = "0" * (element_size - ones_count) + "1" * ones_count
        unrotated = int(element * (width // element_size), 2)

        # rotate right by `rotation` bits within the operand width
        wrapped_bits = (unrotated << (width - rotation)) & (2**width - 1)
        rotated = (unrotated >> rotation) | wrapped_bits

        hex_digits = 16 if width == 64 else 8
        return ImmediateOp(f"0x{rotated:0{hex_digits}x}", width)

    def _generate_label_operand(self, _: OperandSpec, __: Instruction) -> LabelOp:
        # placeholder; the actual label will be set in add_terminators_in_function
        return LabelOp("")

    def _generate_agen_operand(self, spec: OperandSpec, __: Instruction) -> AgenOp:
        # the address expression has one to three components: reg [+ reg [+ imm]]
        component_count = random.randint(1, 3)
        base_reg = random.choice(self.target_desc.mem_index_registers)
        if component_count == 1:
            return AgenOp(base_reg, spec.width)

        components = [base_reg, random.choice(self.target_desc.mem_index_registers)]
        if component_count != 2:
            components.append(str(random.randint(0, pow(2, 16) - 1)))
        return AgenOp(" + ".join(components), spec.width)

    def _generate_flags_operand(self, spec: OperandSpec, parent: Instruction) -> FlagsOp:
        # pylint: disable=too-many-branches
        # NOTE: there are many options for COND flags, so many branches are needed

        # without a COND operand, the flags are taken from the spec unchanged
        cond_op = parent.get_cond_operand()
        if not cond_op:
            return FlagsOp(spec.values)
        raise NotImplementedError("COND operand is not yet supported")
        # pylint: disable=unreachable
        # NOTE: the code below is temporary disabled

        flag_values = self.target_desc.branch_conditions[cond_op.value]
        if not spec.values:
            return FlagsOp(flag_values)

        # combine implicit flags with the condition
        merged_flags = []
        for flag_pair in zip(flag_values, spec.values):
            if "undef" in flag_pair:
                merged_flags.append("undef")
            elif "r/w" in flag_pair:
                merged_flags.append("r/w")
            elif "w" in flag_pair:
                if "r" in flag_pair:
                    merged_flags.append("r/w")
                else:
                    merged_flags.append("w")
            elif "cw" in flag_pair:
                if "r" in flag_pair:
                    merged_flags.append("r/cw")
                else:
                    merged_flags.append("cw")
            elif "r" in flag_pair:
                merged_flags.append("r")
            else:
                merged_flags.append("")
        return FlagsOp(merged_flags)

    def _generate_cond_operand(self, _: OperandSpec, __: Instruction) -> CondOp:
        # any of the branch conditions known to the target
        condition_names = list(self.target_desc.branch_conditions)
        return CondOp(random.choice(condition_names))


================================================
FILE: rvzr/config.py
================================================
"""
File: Fuzzing Configuration Options

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
import os
from copy import deepcopy
from collections import OrderedDict
from typing import List, Dict, TextIO, Any, TypedDict, Set, Literal
from types import ModuleType

import yaml

from .arch.x86 import config as x86_config
from .arch.arm64 import config as arm64_config

# ==================================================================================================
# Custom Types
# ==================================================================================================
# Closed set of property names that may appear as keys of a page configuration
PagePropertyName = Literal['present', 'writable', 'user', 'write-through', 'cache-disable',
                           'accessed', 'dirty', 'executable', 'reserved_bit', 'randomized']
# Page configuration: maps a page property name to a boolean
PageConf = Dict[PagePropertyName, bool]


class ActorConf(TypedDict):
    """
    Type definition for the configuration of a single actor.
    The set of keys is the same as the one listed in the ActorConfKey literal.
    """
    name: str
    mode: str
    privilege_level: str
    observer: bool
    # page configurations (see PageConf); NOTE(review): presumably the properties of
    # the actor's data pages in the regular and in the extended page tables - confirm
    data_properties: PageConf
    data_ept_properties: PageConf
    # NOTE(review): presumably per-actor counterparts of the global blocklists - confirm
    instruction_blocklist: Set[str]
    fault_blocklist: Set[str]


# Closed set of the keys of ActorConf
ActorConfKey = Literal["name", "mode", "privilege_level", "observer", "data_properties",
                       "data_ept_properties", "instruction_blocklist", "fault_blocklist"]

# Actor configurations, indexed by a string (presumably the actor name - confirm)
ActorsConf = Dict[str, ActorConf]

# Names of the instruction set architectures known to the configuration
Architecture = Literal["x86-64", "arm64"]


# ==================================================================================================
# Helper classes
# ==================================================================================================
class IncludeLoader(yaml.SafeLoader):
    """
    YAML loader that adds support for `!include` statements in configuration files
    """
    # absolute paths of the files with a live loader; used to detect circular includes.
    # NOTE: this is a class-level list, i.e., it is shared by all loader instances
    visited: List[str] = []
    # suffix given to the next renamed `file` key (see construct_yaml_map)
    file_id_counter: int = 0

    def __init__(self, stream: TextIO, include_dir: str = "") -> None:
        # included files are searched next to the loaded file first, then in include_dir
        stream_dir = os.path.dirname(stream.name)
        self._search_paths = [stream_dir, include_dir] if include_dir else [stream_dir]
        self.visited.append(os.path.abspath(stream.name))
        super().__init__(stream)

    def __del__(self) -> None:
        # drop the most recent entry of the shared list once the loader goes away
        if self.visited:
            self.visited.pop()

    def include(self, node: yaml.Node) -> Any:
        """
        Constructor for the `!include` tag: load the referenced YAML file and return its content
        :param node: scalar node holding the (relative) path of the included file
        :return: the data loaded from the included file
        :raises ConfigException: if the file is not found in any of the search paths,
            or if the file is already being loaded (circular include)
        """
        relative_filename: str = self.construct_scalar(node)  # type: ignore

        # the first search path that contains the file wins
        candidates = (os.path.join(root, relative_filename) for root in self._search_paths)
        filename = next((path for path in candidates if os.path.exists(path)), None)
        if filename is None:
            raise ConfigException(f"Included file {relative_filename} does not exist")

        # check for cycles
        if os.path.abspath(filename) in self.visited:
            raise ConfigException(f"Circular include detected in {filename}")

        with open(filename, 'r') as included:
            return yaml.load(included, IncludeLoader)

    def construct_yaml_map(self, node: yaml.MappingNode) -> Dict[Any, Any]:
        """
        Mapping constructor that gives every `file` key a unique name (`file_<unique_id>`),
        so that several include statements in one mapping do not overwrite each other
        :param node: the mapping node to construct
        :return: the constructed mapping
        """
        for key_node, _ in node.value:
            if key_node.value != 'file':
                continue
            key_node.value = f'file_{self.file_id_counter}'
            self.file_id_counter += 1
        return self.construct_mapping(node)


# Register the custom constructors: `!include` tags are resolved by IncludeLoader.include,
# and all YAML mappings are built by IncludeLoader.construct_yaml_map
IncludeLoader.add_constructor('!include', IncludeLoader.include)
IncludeLoader.add_constructor(u'tag:yaml.org,2002:map', IncludeLoader.construct_yaml_map)


class ConfigException(SystemExit):
    """
    Error in the configuration. As a subclass of SystemExit, it carries the formatted
    message as its exit code, so an uncaught instance terminates the program with it.
    """

    def __init__(self, message: str) -> None:
        formatted = f"\nCONFIG ERROR: {message}\n"
        super().__init__(formatted)


def _get_architecture() -> Architecture:
    """
    Detect the architecture of the host CPU from the contents of /proc/cpuinfo.

    The function provides the default of a class attribute of Conf, i.e., it runs when
    this module is imported; therefore it must not fail on systems without /proc/cpuinfo.

    :return: 'x86-64' if an AMD or Intel vendor string is found, 'arm64' if a
        'CPU implementer' field is found; 'x86-64' if neither is present or
        if /proc/cpuinfo cannot be read
    """
    try:
        with open('/proc/cpuinfo', 'r') as f:
            for line in f:
                if 'AuthenticAMD' in line or 'GenuineIntel' in line:
                    return 'x86-64'
                if 'CPU implementer' in line:
                    return 'arm64'
    except OSError:
        # the file is missing or unreadable; fall through to the default
        pass
    return 'x86-64'


def _get_cpu_vendor() -> str:
    """
    Detect the vendor of the host CPU from the contents of /proc/cpuinfo.

    The function provides the default of a class attribute of Conf, i.e., it runs when
    this module is imported; therefore it must not fail on systems without /proc/cpuinfo.

    :return: 'x86-64-amd' or 'x86-64-intel' if the respective vendor string is found,
        'arm64' if a 'CPU implementer' field is found; 'x86-64-intel' if none of them
        is present or if /proc/cpuinfo cannot be read
    """
    try:
        with open('/proc/cpuinfo', 'r') as f:
            for line in f:
                if 'AuthenticAMD' in line:
                    return 'x86-64-amd'
                if 'GenuineIntel' in line:
                    return 'x86-64-intel'
                if 'CPU implementer' in line:
                    return 'arm64'
    except OSError:
        # the file is missing or unreadable; fall through to the default
        pass
    return 'x86-64-intel'


# ==================================================================================================
# Main configuration class
# ==================================================================================================
class Conf:
    """
    Data class to store global configuration options. It implements the Borg pattern to ensure that
    all instances share the same state. The configuration options are loaded from a YAML file and
    can be accessed as class attributes.
    """

    # ==============================================================================================
    # Fuzzer
    fuzzer: str = "basic"
    """ fuzzer: type of the fuzzing algorithm """
    enable_priming: bool = True
    """ enable_priming: whether to check violations with priming """
    enable_speculation_filter: bool = False
    """ enable_speculation_filter: if True, discard test cases that don't trigger speculation"""
    enable_observation_filter: bool = False
    """ enable_observation_filter: if True,discard test cases that don't leave speculative traces"""
    enable_fast_path_model: bool = True
    """ enable_fast_path_boosting: if enabled, the same contract trace will be used
    for all inputs in the same taint-based input class """

    # ==============================================================================================
    # Program Generator
    generator: str = "random"
    """ generator: type of the program generator """
    instruction_set: Architecture = _get_architecture()
    """ instruction_set: ISA under test """
    instruction_categories: List[str] = []
    """ instruction_categories: list of instruction categories to use for generating programs """
    instruction_allowlist: List[str] = []
    """ instruction_allowlist: list of instructions to use for generating programs;
    combined with instruction_categories; has priority over instruction_blocklist.
    The resulting list is:
     (instructions from instruction_categories - instruction_blocklist) + instruction_allowlist """
    instruction_blocklist: List[str] = []
    """ instruction_blocklist: list of instruction that will NOT be used for generating programs;
    filters out instructions from instruction_categories, but not from instruction_allowlist.
    The resulting list is:
     (instructions from instruction_categories - instruction_blocklist) + instruction_allowlist """
    instruction_blocklist_append: List[str] = []
    """ instruction_blocklist_append: same as instruction_blocklist, but the list is added
    to the existing blocklist instead of replacing it """
    program_generator_seed: int = 0
    """ program_generator_seed: seed of the program generator; if set to zero, a random seed
    will be used """
    program_size: int = 24
    """ program_size: size of generated programs """
    avg_mem_accesses: int = 12
    """ avg_mem_accesses: average number of memory accesses in generated programs """
    min_bb_per_function: int = 1
    """ min_bb_per_function: minimal number of basic blocks per function in generated programs """
    max_bb_per_function: int = 2
    """ max_bb_per_function: maximum number of basic blocks per function in generated programs """
    min_successors_per_bb: int = 2
    """ min_bb_per_function: min. number of successors for each basic block in generated programs
    Note 1: this config option is a *hint*; it could be ignored if the instruction set does not
    have the necessary instructions to satisfy it, or if a certain number of successor is required
    for correctness"""
    max_successors_per_bb: int = 2
    """ min_bb_per_function: min. number of successors for each basic block in generated programs
    Note: this config option is a *hint*; it could be ignored if the instruction set does not
    have the necessary instructions to satisfy it, or if a certain number of successor is required
    for correctness """
    register_allowlist: List[str] = []
    """ register_allowlist: list of registers that CAN be used for generating programs;
     has higher priority than register_blocklist.
     The resulting list is: (all registers - register_blocklist) + register_allowlist """
    register_blocklist: List[str] = []
    """ register_blocklist: list of registers that will NOT be used for generating programs;
     has lower priority than register_allowlist.
     The resulting list is: (all registers - register_blocklist) + register_allowlist """
    faults_allowlist: List[str] = []
    """ faults_allowlist: by default, generator will produce programs that never
    trigger exceptions. This option modifies this behavior by permitting the generator to produce
    'unsafe' instruction sequences that could potentially trigger an exception. Model and executor
     will also be configured to handle these exceptions gracefully """

    # ==============================================================================================
    # Input Data Generator
    data_generator: str = 'random'
    """ data_generator: type of the input generator """
    data_generator_seed: int = 10
    """ data_generator_seed: input generation seed; will use a random seed if set to zero """
    data_generator_entropy_bits: int = 31
    """ data_generator_entropy_bits: entropy of the random values created by the input generator """
    inputs_per_class: int = 2
    """ inputs_per_class: number of inputs per input class """
    input_gen_probability_of_special_value: float = 0.05
    """ input_gen_probability_of_special_value: probability of generating a special value
    (zero or maximum value) when setting a register value in the input generator. This is used
    to test fast paths in the microarchitecture """

    # ==============================================================================================
    # Contract Model
    model_backend: str = 'unicorn'
    """ model_backend: The backend used to collect contract traces on generated test cases """
    contract_execution_clause: List[str] = ["seq"]
    """ contract_execution_clause: """
    contract_observation_clause: str = 'ct'
    """ contract_observation_clause: """
    model_min_nesting: int = 1
    """ model_max_nesting: """
    model_max_nesting: int = 30
    """ model_max_nesting: """
    model_max_spec_window: int = 250
    """ model_max_spec_window: """

    # ==============================================================================================
    # Executor
    executor: str = _get_cpu_vendor()
    """ executor: executor type """
    executor_mode: str = 'P+P'
    """ executor_mode: hardware trace collection mode """
    executor_warmups: int = 5
    """ executor_warmups: number of warmup rounds executed before starting to collect
    hardware traces """
    executor_sample_sizes: List[int] = [10, 50, 100, 500]
    """ executor_sample_sizes: a list of sample sizes to be used during the measurements;
    the executor will first collect the hardware traces with the first sample size in the list,
    and if a violation is detected, it will try to reproduce it with all the following
    sample sizes """
    executor_filtering_repetitions: int = 10
    """ executor_filtering_repetitions: number of repetitions while filtering test cases """
    executor_taskset: int = 0
    """ executor_taskset: id of the CPU core on which the executor is running test cases """
    enable_pre_run_flush: bool = True
    """ enable_pre_run_flush: if enabled, the executor will do its best to flush
    the microarchitectural state before running test cases """

    # ==============================================================================================
    # Analyser
    analyser: str = 'chi2'
    """ analyser: type of the analyser """
    analyser_subsets_is_violation: bool = False
    """ analyser_subsets_is_violation: [only for analyser='sets' or analyser='bitmaps']
    if False, the analyser will not label hardware traces as mismatching if they form
    a subset relation """
    analyser_outliers_threshold: float = 0.1
    """ analyser_outliers_threshold: [only for analyser='sets' or analyser='bitmaps']
    analyser will ignore the htraces that appear in less than this percentage of the repetitions.
    I.e., a htrace passes the filter if it is observed at least
        (analyser_outliers_threshold * len(htrace)) times """
    analyser_stat_threshold: float = 0.5
    """ analyser_stat_threshold: [only for analyser='chi2' and analyser='mwu']
    Threshold for the statistical tests. If a pair of hardware traces has the (normalized)
    statistics below the threshold, then the traces are considered equivalent.

    Note: The threshold default value (0.5) is conservative and avoids false positives
    at cost of false negatives. For more precise results, set the threshold to a lower value.

    For the chi2 test, the threshold is the statistics / (len(htrace1) + len(htrace2))
    For the mwu test, the threshold is the p-value """

    # ==============================================================================================
    # Coverage
    coverage_type: str = 'none'
    """ coverage_type: coverage type """

    # ==============================================================================================
    # Minimizer
    minimizer_retries: int = 1
    """ minimizer_retries: number of attempts to reproduce the violation when minimizing """

    # ==============================================================================================
    # Output
    multiline_output: bool = False
    """ multiline_output: """
    logging_modes: List[str] = ["info", "stat"]
    """ logging_modes: """
    color: bool = False

    # ==============================================================================================
    # Alternatives for config options (also extended by ISA-specific config.py)
    _option_values: Dict[str, List[str]] = {
        "fuzzer": ["basic", "architectural", "archdiff"],
        "generator": ["random"],
        "instruction_set": ["x86-64", "arm64"],
        "data_generator": ["random"],
        "model_backend": ["dummy", "unicorn", "dynamorio"],
        "contract_execution_clause": [
            "seq", "no_speculation", "seq-assist", "cond", "conditional_br_misprediction", "bpas",
            "nullinj-fault", "nullinj-assist", "delayed-exception-handling", "div-zero",
            "div-overflow", "meltdown", "fault-skip", "noncanonical", "vspec-ops-div",
            "vspec-ops-memory-faults", "vspec-ops-memory-assists", "vspec-ops-gp", "vspec-all-div",
            "vspec-all-memory-faults", "vspec-all-memory-assists"
        ],
        "contract_observation_clause": [
            "none", "l1d", "pc", "memory", "ct", "loads+stores+pc", "ct-nonspecstore", "ctr",
            "arch", "tct", "tcto", "ct-ni"
        ],
        "executor": ["x86-64-intel", "x86-64-amd", "arm64"],
        'executor_mode': [
            'P+P',
            'F+R',
            'E+R',
            'PP+P',
            'TSC',
            # 'GPR' is intentionally left out
        ],
        'faults_allowlist': [
            'div-by-zero',
            'div-overflow',
            'opcode-undefined',
            'breakpoint',
            'debug-register',
            'non-canonical-access',
            'user-to-kernel-access',
        ],
        "analyser": ["bitmaps", "sets", "mwu", "chi2"],
        "coverage_type": ["none", "model_instructions"],
        "logging_modes": [
            "info",
            "stat",
            "dbg_generator",
            "dbg_timestamp",
            "dbg_violation",
            "dbg_dump_htraces",
            "dbg_dump_ctraces",
            "dbg_dump_traces_unlimited",
            "dbg_model",
            "dbg_coverage",
            "dbg_priming",
            "dbg_executor_raw",
            "dbg_isa_filter",
        ],
    }

    # ==============================================================================================
    # Internal
    _borg_shared_state: Dict[Any, Any] = {}
    _no_generation: bool = False
    _handled_faults: List[str]  # set by ISA-specific config.py
    _generator_fault_to_fault_name: Dict[str, str]  # set by ISA-specific config.py
    _actors: ActorsConf
    _actor_default: ActorConf
    _config_path: str = ""

    def __init__(self) -> None:
        """ Attach the instance to the state shared by all instances (Borg pattern) """
        # all instances use one and the same attribute dictionary
        self.__dict__ = self._borg_shared_state
        # create the actor table only if the shared state has none yet (or has an empty one)
        existing_actors = getattr(self, '_actors', None)
        if not existing_actors:
            self._actors = OrderedDict()

    def load(self, config_path: str, include_dir: str = "") -> None:
        """
        Load configuration options from a YAML file, apply them, and run the sanity checks.

        The file is parsed with IncludeLoader, hence it may contain `!include` statements.
        An empty file is treated as an empty set of options.

        :param config_path: path to the YAML configuration file
        :param include_dir: optional additional directory to search for included files
        :raises ConfigException: if the file is not valid YAML, or if its top-level element
            is not a mapping
        """
        self._config_path = config_path
        with open(config_path, "r") as f:
            loader = IncludeLoader(f, include_dir)
            try:
                loaded = loader.get_single_data()
            except yaml.YAMLError as e:
                # YAMLError is the base of all PyYAML errors (scanner, parser, constructor, ...)
                raise ConfigException(
                    f"Error parsing the configuration file {config_path}:\nError: {e}") from e
            finally:
                loader.dispose()  # type: ignore

        # an empty YAML document is loaded as None
        config_update: Dict[str, Any] = {} if loaded is None else loaded
        if not isinstance(config_update, dict):
            raise ConfigException(
                f"The configuration file {config_path} must contain a mapping of options")

        self._load_from_dict(config_update)
        self._value_sanity_check()

    def _load_from_dict(self, config_update: Dict[str, Any]) -> None:
        # make sure to set the architecture-dependent defaults first
        if 'instruction_set' in config_update:
            self.instruction_set = config_update['instruction_set']
            self.set_to_arch_defaults()
            config_update.pop('instruction_set')

        # recursively load included files
        file_keys = []
        for k, v in config_update.items():
            if "file_" in k:
                self._load_from_dict(v)
                file_keys.append(k)
        for k in file_keys:  # remove the `file_*` keys as they have already been processed
            config_update.pop(k)

        # set the rest of the options
        for var, value in config_update.items():
            # print(f"CONF: setting {var} to {value}")
            if var == "faults_allowlist":
                self.update_handled_faults_with_generator_faults(value)
                self.safe_set(var, value)
                continue
            if var == "instruction_blocklist_append":
                self.instruction_blocklist.extend(value)
                continue
            if var == "actors":
                self.set_actor_properties(value)
                continue
            if var == "instruction_categories":
                backend = config_update.get("model_backend", self.model_backend)
                if backend == "unicorn":
                    options_name = "unicorn_instruction_categories"
                elif backend == "dynamorio":
                    options_name = "dr_instruction_categories"
                else:
                    options_name = "dr_instruction_categories"
                self.safe_set(var, value, options_name)

            self.safe_set(var, value)

    def safe_set(self, name: str, value: Any, options_name: str = "") -> None:
        assert name not in ["instruction_set"]

        # sanity checks
        if name[0] == "_":
            raise ConfigException(f"Attempting to set an internal configuration variable {name}.")
        if getattr(self, name, None) is None:
            raise ConfigException(f"Unknown configuration variable {name}.\n"
                                  f"It's likely a typo in the configuration file.")
        if type(self.__getattribute__(name)) != type(value):
            raise ConfigException(f"Wrong type of the configuration variable {name}.\n"
                                  f"It's likely a typo in the configuration file.")

        if options_name:
            self._check_options(options_name, value)
        else:
            self._check_options(name, value)
        setattr(self, name, value)

    def _check_options(self, name: str, value: Any) -> None:
        if name not in self._option_values:
            return
        options = self._option_values[name]

        invalid_value = None
        if isinstance(value, str):
            invalid_value = value if value not in options else None
        elif isinstance(value, List):
            for v in value:
                if v in options:
                    continue
                if isinstance(v, Dict):
                    for k in v:
                        if k not in options:
                            break
                    else:
                        continue
                invalid_value = v
                break
        else:
            raise ConfigException(f"Unexpected type of config variable {name}")

        if invalid_value:
            raise ConfigException(f"Unknown value '{invalid_value}' of config variable '{name}'\n"
                                  f"Possible options: {options}")
        return

    def _value_sanity_check(self) -> None:
        """
        Check if the configuration values make sense
        """
        if self.data_generator_entropy_bits > 32:
            raise ConfigException("data_generator_entropy_bits must be less or equal to 32 bits")
        if self.min_successors_per_bb > self.max_successors_per_bb:
            raise ConfigException("min_successors_per_bb is larger than max_successors_per_bb")

    def set_to_arch_defaults(self) -> None:
        """
        Set config options according to the architecture-specific defaults.

        The defaults are read from the ISA-specific config module selected by
        `instruction_set`. Only module attributes that do not start with a double underscore
        and hold a plain bool, int, float, str, dict or list are considered.

        :raises ConfigException: if the architecture is unknown, or if the ISA-specific module
            does not define `_option_values`
        """
        config: ModuleType
        if self.instruction_set == "x86-64":
            config = x86_config
        elif self.instruction_set == "arm64":
            config = arm64_config
        else:
            raise ConfigException(f"Unknown architecture {self.instruction_set}")

        # collect the defaults; `dir` yields the names in alphabetical order
        plain_types = (bool, int, float, str, dict, list)
        config_defaults = {}
        for attribute in dir(config):
            if attribute.startswith("__"):
                continue
            default = getattr(config, attribute)
            if type(default) in plain_types:
                config_defaults[attribute] = default

        if "_option_values" not in config_defaults:
            raise ConfigException("ISA-specific config.py must define _option_values")

        for name, value in config_defaults.items():
            if name == "faults_allowlist":
                # only the derived list of handled faults is updated for this option
                self.update_handled_faults_with_generator_faults(value)
            elif name == "_actor_default":
                # a new template discards all actors but a fresh copy of `main`
                self._actor_default = deepcopy(value)
                self._actors = OrderedDict()
                self._actors['main'] = deepcopy(value)
            elif name == "_option_values":
                # ISA-specific option groups extend (and may override) the existing ones
                self._option_values.update(value)
            else:
                setattr(self, name, value)

    def update_handled_faults_with_generator_faults(self, new: List[str]) -> None:
        for gen_fault in new:
            if not gen_fault:
                continue
            if gen_fault not in self._generator_fault_to_fault_name:
                raise ConfigException(f"Unknown generator fault {gen_fault}")
            fault = self._generator_fault_to_fault_name[gen_fault]
            if fault not in self._handled_faults:
                self._handled_faults.append(fault)

    def set_actor_properties(self, new: List[Dict[str, List[Dict[ActorConfKey, Any]]]]) -> None:
        for actor_dict in new:
            name = next(iter(actor_dict))
            self._check_options("actor", actor_dict[name])
            update = {k: v for tmp_dict in actor_dict[name] for k, v in tmp_dict.items()}

            if name == "main":
                if update.get('mode', 'host') != 'host':
                    raise ConfigException("The main actor must be in 'host' mode")
                if update.get('privilege_level', 'kernel') != 'kernel':
                    raise ConfigException("The main actor must have 'kernel' privilege_level")

            if name in self._actors:
                entry = self._actors[name]
            else:
                entry = deepcopy(self._actor_default)
                entry["name"] = name

            for k, v in update.items():
                if k == "mode" and v not in self._option_values["actor_mode"]:
                    raise ConfigException(f"Unsupported actor mode {v}")
                if k == "privilege_level" and v not in self._option_values["actor_privilege_level"]:
                    raise ConfigException(f"Unsupported actor privilege_level {v}")

                if k == "data_properties":
                    for property_ in v:
                        for p_key, p_value in property_.items():
                            if p_key not in self._option_values["actor_data_properties"]:
                                raise ConfigException(
                                    f"Unsupported actor data_properties value {p_key}")
                            entry[k][p_key] = p_value
                    continue
                if k == "data_ept_properties":
                    if update.get('mode', 'host') != 'guest':
                        raise ConfigException("data_ept_properties can only be used in guest mode")
                    for property_ in v:
                        for p_key, p_value in property_.items():
                            if p_key not in self._option_values["actor_data_ept_properties"]:
                                raise ConfigException(
                                    f"Unsupported actor data_ept_properties value {p_key}")
                            entry[k][p_key] = p_value
                    continue
                if k == "instruction_blocklist" or k == "fault_blocklist":
                    if v:
                        entry[k].update(v)
                    continue

                entry[k] = v
            self._actors[name] = entry

    def disable_generation(self) -> None:
        """ Disable random-generation mode """
        self._no_generation = True

    def is_generation_enabled(self) -> bool:
        """ Check if the generation is globally enabled """
        return not self._no_generation

    def get_actors_conf(self) -> ActorsConf:
        """ Get the configuration dictionary describing all actors """
        return self._actors


# Module-level configuration object. Conf implements the Borg pattern, so every other
# `Conf()` instance shares its attribute values with this one.
CONF = Conf()
# Apply the ISA-specific defaults for the current value of `instruction_set`
CONF.set_to_arch_defaults()


================================================
FILE: rvzr/data_generator.py
================================================
"""
File: Input Generation.

      An input is a sequence of bytes that is used to initialize memory and registers in
      the model or executor before running a test case program. The input generator
      is responsible for generating random inputs for the test cases.

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
import os
import random
from typing import List, Tuple, Final

import numpy as np

from .tc_components.test_case_data import InputData, InputTaint
from .config import CONF
from .logs import inform

# 2 ** 32
POW32 = pow(2, 32)


class DataGenerator:
    """
    Class responsible for generating random inputs for test cases.

    Every input is produced from an integer state (seed), and the state is advanced by one
    after each generated or loaded input.
    """

    # state (i.e., seed) that will be used to generate the next regular input
    _state: int = 0
    # state used while producing boosted inputs; synchronized with `_state` at the end of
    # generate() and load(), and at the start of generate_boosted()
    _boosting_state: int = 0
    # largest unsigned 64-bit value; used as the "max" special register value
    _max_gpr_value: Final[int] = pow(2, 64) - 1

    def __init__(self, seed: int):
        """
        :param seed: initial state of the generator; if zero, a random state is selected
            on the first call to generate() or load()
        """
        # exclusive upper bound of the randomly generated values
        self.max_input_value = pow(2, CONF.data_generator_entropy_bits)
        self._state = seed

        # the two thresholds below are cumulative: a roll below `_probability_of_zero` selects
        # zero, and a roll between the two thresholds selects the max value
        self._skip_special_values = CONF.input_gen_probability_of_special_value == 0
        self._probability_of_zero = CONF.input_gen_probability_of_special_value
        self._probability_of_max = CONF.input_gen_probability_of_special_value * 2
        assert self._probability_of_max < 1, \
            "The sum of probabilities of special values must be less than 1."

    def get_state(self) -> int:
        """
        Return the current state of the generator.
        State is the seed value that will be used to generate the next input.
        """
        return self._state

    def _reset_boosting_state(self) -> None:
        """ Reset the state (i.e., seed) of the generator to the last state before boosting """
        self._boosting_state = self._state

    def generate(self, count: int, n_actors: int) -> List[InputData]:
        """
        Generate a list of random inputs.
        :param count: The number of inputs to generate
        :param n_actors: The number of actors in each of the generated inputs
        :return: A list of generated inputs
        """
        # if it's the first invocation and the seed is zero - use random seed
        if self._state == 0:
            self._state = random.randint(0, pow(2, 32) - 1)
            inform("data_gen", f"Setting input seed to: {self._state}")

        generated_inputs = []
        for _ in range(count):
            input_, self._state = self._generate_one(self._state, n_actors)
            generated_inputs.append(input_)

        # make sure that boosted inputs will continue from the updated state
        self._boosting_state = self._state
        return generated_inputs

    def generate_boosted(self, inputs: List[InputData], taints: List[InputTaint],
                         inputs_per_class: int) -> List[InputData]:
        """
        Extend the given input sequence with new inputs such that the new inputs should produce
        the same contract traces as the original inputs. This is achieved by copying the original
        inputs and modifying them based on the taints collected by the model while tracing the
        test case with the original inputs (i.e., non-tainted values are replaced with random
        values, and the tainted values are copied).

        For example, if the original inputs are [A, B, C] and inputs_per_class=3,
        then the new sequence will be [A, B, C, A', B', C', A'', B'', C''],
        where A, A', and A'' produce the same contract traces, and so on.

        NOTE: The function is idempotent, i.e., calling it multiple times with the same inputs
        and taints will produce the same sequence of new inputs. This is because the state of the
        generator is reset to the last state before boosting every time the function is called.

        :param inputs: The original inputs
        :param taints: The taints of the original inputs; taints[i] corresponds to inputs[i]
        :param inputs_per_class: The total number of inputs per original input, including
            the original itself
        :return: The original inputs followed by the newly generated ones; an empty list
            if `inputs` is empty
        """
        if not inputs:
            return []
        assert len(inputs) == len(taints), "Error: Cannot extend inputs. The number of taints" \
                                           " does not match the number of inputs."
        n_actors = len(inputs[0])
        input_size = InputData.n_data_entries_per_actor()

        self._reset_boosting_state()
        boosted_inputs = list(inputs)  # make a copy
        for _ in range(inputs_per_class - 1):
            for i, input_ in enumerate(inputs):
                # Generate new, fully random input
                new_input, self._boosting_state = self._generate_one(self._boosting_state, n_actors)

                # Copy tainted values from the original input
                for actor_id in range(n_actors):
                    taint = taints[i].linear_view(actor_id)
                    input_old = input_.linear_view(actor_id)
                    input_new = new_input.linear_view(actor_id)
                    for j in range(input_size):
                        if taint[j]:
                            input_new[j] = input_old[j]

                # Add the new input to the sequence
                boosted_inputs.append(new_input)
        return boosted_inputs

    def load(self, input_paths: List[str]) -> List[InputData]:
        """
        Load a sequence of inputs from the given binary input files.
        :param input_paths: Paths to the binary files, one file per input
        :return: A list of the loaded inputs, in the order of `input_paths`
        :raises ValueError: if the size of a file does not match the expected size of an input
            with the configured number of actors
        """
        # mirror the state update in generate() as 'load' function is used for reproducing
        # violations, which requires the generator state to be identical to the one during
        # fuzzing
        if self._state == 0:
            self._state = random.randint(0, pow(2, 32) - 1)
            inform("data_gen", f"Setting input seed to: {self._state}")

        inputs = []
        n_actors = len(CONF.get_actors_conf())
        for input_path in input_paths:
            input_ = InputData(n_actors)

            # check that the file is not corrupted
            size = os.path.getsize(input_path)
            expected = input_.itemsize * n_actors
            if size != expected:
                raise ValueError(f"Incorrect size of input `{input_path}` "
                                 f"({size} B, expected {expected} B)")

            input_.load(input_path)
            inputs.append(input_)
            # advance the state as if the input had been generated
            self._state += 1

        self._boosting_state = self._state
        return inputs

    def _generate_one(self, state: int, n_actors: int) -> Tuple[InputData, int]:
        """
        Generate a single input from the given state.
        :param state: seed of the random number generator; also recorded as the input's seed
        :param n_actors: number of actors in the input
        :return: a tuple (generated input, next state), where the next state is `state + 1`
        """
        input_ = InputData(n_actors)
        input_.seed = state

        # number of 8-byte words to generate per actor (load() likewise treats `itemsize`
        # as the size of one actor's data in bytes)
        per_actor_data_size = input_.itemsize // 8
        # NOTE(review): if `input_[0]['gpr']` is a numpy array, `.itemsize` is the size of one
        # element in bytes rather than the number of elements - confirm that this value is
        # the intended number of registers
        n_registers = input_[0]['gpr'].itemsize

        rng = np.random.default_rng(seed=state)
        for i in range(n_actors):
            # generate random data
            data = rng.integers(
                self.max_input_value, size=per_actor_data_size, dtype=np.uint64)  # type: ignore

            # copy lower 32-bits to upper 32-bits, for every 8-byte word
            data = (data << np.uint64(32)) + data

            # for each of the registers, set the register to zero or to max value;
            # each case has a probability of CONF.input_gen_probability_of_special_value
            # NOTE(review): the special values are written before set_actor_data() is called
            # below - confirm that set_actor_data() does not overwrite them
            if not self._skip_special_values:
                for reg_id in range(n_registers):
                    roll = rng.random()
                    if roll < self._probability_of_zero:
                        input_[i]['gpr'][reg_id] = 0
                    elif roll < self._probability_of_max:
                        input_[i]['gpr'][reg_id] = self._max_gpr_value

            input_.set_actor_data(i, data)

        return input_, state + 1


================================================
FILE: rvzr/elf_parser.py
================================================
"""
File: Parsing of ELF files to populate sections of a TestCaseCode object.

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from __future__ import annotations

import re
from typing import TYPE_CHECKING, Dict, List, Tuple, TypedDict, NamedTuple, Final
from subprocess import run
from elftools.elf.elffile import ELFFile, SymbolTableSection  # type: ignore

from rvzr.tc_components.test_case_binary import SymbolTable, SymbolTableEntry, TestCaseBinary
from rvzr.tc_components.actor import ActorPL, ActorMode
from rvzr.tc_components.instruction import Instruction
from rvzr.config import CONF

if TYPE_CHECKING:
    from rvzr.tc_components.test_case_code import TestCaseProgram, CodeSection
    from rvzr.tc_components.test_case_binary import InstructionMap
    from rvzr.target_desc import TargetDesc


class _ParsingError(Exception):
    """ Raised when the ELF file or the objdump output cannot be interpreted """

    def __init__(self, message: str):
        # prefix the issue with a fixed header identifying the parser
        super().__init__(f"[ELFParser] Error while parsing assembly\n       Issue: {message}")


# ==================================================================================================
# Private: ELF Symbol Table Parser
# ==================================================================================================
class _ELFData(TypedDict):
    """ Layout information collected from the symbol table of a test case object file """
    # descriptors of the `.data.*` sections, keyed by section ID
    section_data: Dict[int, _SectionData]
    # value of the symbol whose name contains `.test_case_exit`
    exit_addr: int


class _SectionData(TypedDict):
    """ Descriptor of one `.data.*` section of the object file """
    # section ID; initially the index of the section in the ELF file, later replaced
    # with a consecutive ID by _SymtabParser._sort_elf_data
    id_: int
    # the third dot-separated component of the ELF section name (`.data.<name>`)
    name: str
    # `sh_offset` of the section
    offset: int
    # `sh_size` of the section
    size: int
    # functions located in the section, keyed by symbol name
    functions: Dict[str, _FunctionData]


class _FunctionData(TypedDict):
    """ Descriptor of one function symbol (a symbol whose name starts with `.function`) """
    # function ID; -1 until assigned by _SymtabParser._sort_elf_data
    id_: int
    # name of the symbol
    name: str
    # `st_value` of the symbol
    offset: int


class _SymtabParser:
    """ Extracts the layout of sections and functions from the symbol table of an ELF file """

    def parse(self, obj_file: str) -> _ELFData:
        """
        Parse the ELF symbol table to get the addresses of all functions and sections.
        The section and function IDs are assigned in the order they appear in the ELF file.
        :param obj_file: path to the ELF file
        :return: a dictionary containing the section data and the exit address
        """
        parsed = self._get_unsorted_data(obj_file)
        self._sort_elf_data(parsed)
        return parsed

    def _get_unsorted_data(self, obj_file: str) -> _ELFData:
        """
        Collect the `.data.*` sections, the `.function*` symbols and the exit address.
        At this stage, sections are keyed by their index in the ELF file and
        the function IDs are not assigned yet (-1).
        """
        elf_data: _ELFData = {"section_data": {}, "exit_addr": -1}
        sections = elf_data["section_data"]

        with open(obj_file, "rb") as f:
            data = ELFFile(f)

            # sanity check: we build test cases in such a way that there should be no segments
            assert data.num_segments() == 0, f"{data.num_segments()}"

            # collect section info; only the `.data.<name>` sections are of interest
            for s_id, section in enumerate(data.iter_sections()):
                if not section.name.startswith(".data."):
                    continue
                sections[s_id] = {
                    "id_": s_id,
                    "name": section.name.split(".")[2],
                    "offset": section['sh_offset'],
                    "size": section['sh_size'],
                    "functions": {}
                }

            # get addresses of functions and macros
            symtab: SymbolTableSection = data.get_section_by_name(".symtab")  # type: ignore
            for symbol in symtab.iter_symbols():
                symbol_name = symbol.name
                if symbol_name.startswith(".function"):
                    f_entry: _FunctionData = {
                        "id_": -1,  # will be assigned later
                        "name": symbol_name,
                        "offset": symbol.entry.st_value
                    }
                    # attach the function to the section the symbol is defined in
                    owner_id = symbol['st_shndx']
                    sections[owner_id]["functions"][symbol_name] = f_entry

                if ".test_case_exit" in symbol_name:
                    elf_data["exit_addr"] = symbol.entry.st_value

        assert elf_data["exit_addr"] != -1, "Failed to find exit address"
        return elf_data

    def _sort_elf_data(self, elf_data: _ELFData) -> None:
        """ Renumber sections and functions in the order of their appearance in the ELF file """

        # sections get consecutive IDs, following the order of their original IDs
        original = elf_data["section_data"]
        renumbered = {}
        for position, original_id in enumerate(sorted(original)):
            section = original[original_id]
            renumbered[position] = section
            section["id_"] = position
        elf_data["section_data"] = renumbered

        # functions get consecutive IDs that are unique across all sections;
        # within a section, the functions are ordered by their offset
        next_function_id = 0
        for section_id in sorted(renumbered):
            functions = renumbered[section_id]["functions"]
            for function in sorted(functions.values(), key=lambda entry: entry["offset"]):
                function["id_"] = next_function_id
                next_function_id += 1


# ==================================================================================================
# Private: Objdump Output Parser
# ==================================================================================================
# Name of a section; the part that follows `.data.` in the ELF section name
_SectionName = str
# Address of an instruction, as printed by objdump
_InstructionAddr = int
# Addresses of all instructions of each section, in the order of the objdump output
_InstrAddrMap = Dict[_SectionName, List[_InstructionAddr]]


class _ObjdumpSectionDesc(NamedTuple):
    """ Description of the section announced by a section header in the objdump output """
    # name that follows `.data.` in the section name; empty for all other sections
    name: str
    # True if the instruction lines of the section are to be ignored (`.note.gnu*` sections)
    skip: bool


class _ObjdumpOutputParser:
    """ Collects the addresses of all instructions from the disassembly printed by objdump """

    # an instruction line of the objdump output contains `<hex address>:` preceded by a space
    _INSTRUCTION_LINE = re.compile(r" [0-9a-f]+:")

    def __init__(self) -> None:
        self._objdump_flags = "--no-show-raw-insn -D -M intel -m i386:x86-64"
        if CONF.instruction_set == "arm64":
            self._objdump_flags = "--no-show-raw-insn -D -m aarch64"

    def parse(self, obj_file: str) -> _InstrAddrMap:
        """
        Parse the output of objdump to get the addresses of all instructions
        :param obj_file: path to the ELF file
        :return: a dictionary mapping section names to lists of its instruction addresses
        :raises subprocess.CalledProcessError: if objdump exits with a non-zero status
        :raises _ParsingError: if the name of a `.data.*` section cannot be extracted
        """
        # Run objdump directly, without a shell: the path is passed verbatim (even if it
        # contains spaces or shell metacharacters), and `check=True` observes the exit status
        # of objdump itself rather than the status of the last command of a shell pipeline
        dump = run(
            ["objdump", *self._objdump_flags.split(), obj_file],
            check=True,
            capture_output=True)
        relevant_lines = self._select_relevant_lines(dump.stdout.decode(errors="replace"))

        # Prepare for parsing
        instruction_addresses: Dict[_SectionName, List[_InstructionAddr]] = {}
        section_desc = _ObjdumpSectionDesc("", False)

        # Loop over output lines, keeping track of the latest section header,
        # and recording addresses of instructions for each section
        for line in relevant_lines:
            # Enter a new section
            if "section" in line:
                section_desc = self._parse_section_header(line)
                assert section_desc.name not in instruction_addresses
                instruction_addresses[section_desc.name] = []
                continue

            # Skip instruction in ignored sections
            if section_desc.skip:
                continue

            # Parse instruction addresses; the trailing colon is not a part of the address
            assert section_desc.name != "", "Failed to parse objdump output (section_name)"
            instruction_addresses[section_desc.name].append(int(line[:-1], 16))

        return instruction_addresses

    @staticmethod
    def _select_relevant_lines(objdump_output: str) -> List[str]:
        """
        Reduce the objdump output to the lines required for parsing, in their original order:
        - for a line that contains an instruction address: its first whitespace-separated field
        - for a line that contains the word `section`: the complete line
        A line that satisfies both conditions contributes both entries, in this order.
        (This replicates `awk '/ [0-9a-f]+:/{print $1} /section/{print $0}'`.)
        """
        selected: List[str] = []
        for raw_line in objdump_output.split("\n"):
            if _ObjdumpOutputParser._INSTRUCTION_LINE.search(raw_line):
                selected.append(raw_line.split()[0])
            if "section" in raw_line:
                selected.append(raw_line)
        return selected

    def _parse_section_header(self, line: str) -> _ObjdumpSectionDesc:
        """
        Translate a section header of the objdump output into a section descriptor.
        :param line: a line of the objdump output that contains the word `section`
        :return: the descriptor with the name that follows `.data.`; sections that are not
            `.data.*` sections get an empty name, and `.note.gnu*` sections are marked as skipped
        :raises _ParsingError: if the line mentions `.data.` but no section name follows it
        """
        if ".note.gnu" in line:
            return _ObjdumpSectionDesc("", True)
        if ".data." not in line:
            return _ObjdumpSectionDesc("", False)

        # Use regex to find .data.<section_name> pattern anywhere in the line
        match = re.search(r'\.data\.(\w+)', line)
        if match:
            section_name = match.group(1)
            return _ObjdumpSectionDesc(section_name, False)

        # no match found
        raise _ParsingError("Failed to parse objdump output (section_name)\n"
                            f"       Could not find .data.<section_name> pattern in: '{line}'")


# ==================================================================================================
# Public Interface: Parser Class
# ==================================================================================================
class ELFParser:
    """
    ELF parser that extracts the following data from the ELF file:
    - Section data
    - Function data
    - Instruction addresses
    - Macros
    """
    _target_desc: Final[TargetDesc]

    def __init__(self, target_desc: TargetDesc) -> None:
        """
        :param target_desc: target description; its macro specs are consulted when macros
                            are converted to symbol table entries and validated
        """
        self._target_desc = target_desc

        # number of consecutive instruction addresses occupied by one macro:
        # three when the configured instruction set is arm64, one otherwise
        if CONF.instruction_set == 'arm64':
            self._instruction_per_macro = 3
        else:
            self._instruction_per_macro = 1

    # ----------------------------------------------------------------------------------------------
    # Public Methods
    def populate_elf_data(self, test_case_bin: TestCaseBinary,
                          test_case_code: TestCaseProgram) -> None:
        """
        Parse the ELF file of a test case binary (TestCaseBinary.obj_path) and hand the
        resulting symbol table and instruction map over to the TestCaseBinary object.

        The parsed data is validated before it is assigned: every section of the test case
        must have received its ELF data, and all macros must be well-formed.

        :param test_case_bin: binary whose object file is parsed and which receives the data
        :param test_case_code: the program the binary was built from
        """
        # collect metadata from the ELF file and the objdump output
        parsed = self._assign_bin_metadata(test_case_bin.obj_path, test_case_code)
        symbols, instr_map = parsed

        # sanity checks on the collected data
        self._validate_sections(test_case_code.get_sections(), instr_map)
        self._validate_macros(test_case_code, symbols)

        # everything is consistent; attach the data to the binary
        test_case_bin.assign_elf_data(symbols, instr_map)

    # ----------------------------------------------------------------------------------------------
    # Private: Assignment of metadata to Section -> Function -> Instruction

    def _assign_bin_metadata(self, obj_file: str,
                             test_case_code: TestCaseProgram) -> Tuple[SymbolTable, InstructionMap]:
        """
        Build the symbol table and the instruction map of a test case binary.

        The method combines the section/function data produced by `_SymtabParser` with the
        per-section instruction addresses produced by `_ObjdumpOutputParser`. Sections and
        functions are visited in the order of their `id_`. While doing so, the method also
        assigns ELF data to the sections of `test_case_code` and binary properties to its
        instructions.

        :param obj_file: path to the object file to parse
        :param test_case_code: the program whose sections, functions and instructions receive
                               the metadata
        :return: a tuple (symbol table sorted by section id and offset,
                 instruction map indexed by section id and then by instruction address)
        """
        # pylint: disable=too-many-locals
        # NOTE: the check is disabled because I haven't found a way to reduce the number of locals

        # Initialize data structures
        symbol_table: SymbolTable = []
        instruction_map: InstructionMap = {}

        # Extract data from the ELF file and objdump output
        elf_data = _SymtabParser().parse(obj_file)
        instr_addr_map = _ObjdumpOutputParser().parse(obj_file)

        # Use the data to construct the symbol table and instruction map
        sorted_sections = sorted(elf_data["section_data"].values(), key=lambda x: x["id_"])
        # functions of all sections; macros may reference functions from any section
        all_functions = [f for s in sorted_sections for f in s["functions"].values()]
        for section_data in sorted_sections:
            # Assign section metadata
            section_obj = test_case_code.find_section(name=section_data["name"])
            self._assign_section_metadata(section_data, section_obj)

            # Assign function metadata
            sorted_functions = sorted(section_data["functions"].values(), key=lambda x: x["id_"])
            for func_data in sorted_functions:
                self._assign_function_metadata(func_data, section_data, symbol_table)

            # Create a local instruction map for the section
            instruction_map[section_data["id_"]] = {}

            # Assign instruction metadata
            # `cursor` is the index of the next unassigned address in the section's address list
            cursor = 0
            for func_data in sorted_functions:
                function_object = test_case_code.find_function(func_data["name"])
                assert function_object.get_owner() == section_obj.owner
                # the function must start exactly at the address the cursor points to
                assert func_data["offset"] == instr_addr_map[section_data["name"]][cursor], \
                    f"offsets: {func_data['offset']} {instr_addr_map[section_data['name']][cursor]}"

                # walk all basic blocks of the function, followed by its exit basic block
                for bb in list(function_object) + [function_object.get_exit_bb()]:
                    for inst in list(bb) + bb.terminators:
                        self._assign_instruction_metadata(inst, instr_addr_map, cursor,
                                                          section_data, instruction_map)
                        if inst.name != "macro":
                            cursor += 1
                            continue

                        # Assign metadata for macros
                        self._assign_macro_metadata(inst, sorted_sections, all_functions,
                                                    symbol_table)
                        # a macro may occupy several addresses; skip all of them
                        cursor += self._instruction_per_macro

        # Fixup: the last instruction in .data.main is the test case exit, and it must map to a NOP
        # NOTE(review): the fixup combines instr_addr_map["main"] with sorted_sections[0] and
        # instruction_map[0], and uses len(instruction_map[0]) as the cursor; this presumably
        # relies on `main` being the section with id 0 -- confirm
        exit_nop = Instruction("nop", "BASE-NOP", is_instrumentation=True)
        instr_addr_map["main"].append(elf_data["exit_addr"])
        self._assign_instruction_metadata(exit_nop, instr_addr_map, len(instruction_map[0]),
                                          sorted_sections[0], instruction_map)

        # Sort symbols in the symbol table by section id and offset within the section
        symbol_table.sort(key=lambda x: (x.sid, x.offset))

        return symbol_table, instruction_map

    @staticmethod
    def _assign_section_metadata(section_data: _SectionData, section_obj: CodeSection) -> None:
        section_obj.assign_elf_data(
            offset=section_data["offset"], size=section_data["size"], id_=section_data["id_"])

    @staticmethod
    def _assign_function_metadata(func_data: _FunctionData, section_data: _SectionData,
                                  symbol_table: SymbolTable) -> None:
        """
        Append a symbol describing a function to the symbol table.

        :param func_data: data parsed from the ELF file for the function
        :param section_data: data parsed from the ELF file for the section owning the function
        :param symbol_table: symbol table to extend (modified in place)
        """
        # function symbols have type 0 and carry the function id as their argument
        symbol_table.append(
            SymbolTableEntry(
                sid=section_data["id_"],
                type_=0,
                offset=func_data["offset"],
                arg=func_data["id_"],
            ))

    def _assign_instruction_metadata(self, inst: Instruction, instr_addr_map: _InstrAddrMap,
                                     cursor: int, section_data: _SectionData,
                                     instr_map: InstructionMap) -> None:
        section_name = section_data["name"]
        instr_addr_map_in_sec = instr_addr_map[section_name]

        # get instruction info
        address = instr_addr_map_in_sec[cursor]
        if cursor + 1 < len(instr_addr_map_in_sec):
            size = instr_addr_map_in_sec[cursor + 1] - address
        else:
            size = 0

        # assign instruction metadata
        inst.assign_binary_properties(section_id=section_data["id_"], offset=address, size=size)

        # add instruction to the instruction map
        instr_map[section_data["id_"]][address] = inst

        # if the instruction is a macro, it may span several instructions;
        # make it look like it does by adding NOPs to the instruction map
        if inst.name == "macro":
            for i in range(1, self._instruction_per_macro):
                address = instr_addr_map_in_sec[cursor + i]
                nop_placeholder = Instruction("nop", "BASE-NOP")
                nop_placeholder.is_macro_placeholder = True
                instr_map[section_data["id_"]][address] = nop_placeholder

    def _assign_macro_metadata(self, inst: Instruction, sections_data: List[_SectionData],
                               functions_data: List[_FunctionData],
                               symbol_table: SymbolTable) -> None:
        """
        Convert a macro instruction to a symbol table entry by parsing its symbolic arguments
        according to the macro specification (see x86_target_desc.py). Add the resulting
        symbol to the symbol table.

        Every argument occupies one 16-bit slot of the compressed symbol argument; the slot
        index equals the position of the argument in the macro.

        Example:
        - Input (macro instruction): MACRO 1, .main.function_1
        - Processing:
            type: 1 (actor switch)
            arg 1: main -> 0 (ID of section main)
            arg 2: function_1 -> 12 (ID of function function_1)
            arg 3: none
            arg 4: none
            compressed macro argument: 0 + (12 << 16) + (0 << 32) + (0 << 48) = 786432
        - Output (symbol table entry): SymbolTableEntry(0, 1, 0, 786432)

        :param inst: the macro instruction; its binary properties must already be assigned
        :param sections_data: parsed data of all sections (used to resolve actor names)
        :param functions_data: parsed data of all functions (used to resolve function names)
        :param symbol_table: symbol table to extend (modified in place)
        :raises _ParsingError: if the macro is unknown, has more arguments than its
                               specification, or references an unknown actor or function
        :raises ValueError: if the macro specification contains an unsupported argument type
        """

        # pylint: disable=too-many-locals
        # NOTE: the check is disabled because I haven't found a way to reduce the number of locals

        def section_name_to_id(name: str) -> int:
            for entry in sections_data:
                if entry["name"] == name:
                    return entry["id_"]
            raise _ParsingError(f"Macro references an unknown actor {name}")

        def function_name_to_id(name: str) -> int:
            for entry in functions_data:
                if entry["name"] == name:
                    return entry["id_"]
            raise _ParsingError(f"Macro references an unknown function {name}")

        assert inst.name == "macro"

        # find the spec for this macro arguments
        macro_name = inst.operands[0].value[1:].lower()
        try:
            macro_spec = self._target_desc.macro_specs[macro_name]
        except (KeyError, IndexError) as e:
            # a lookup by name in a mapping fails with KeyError (not IndexError);
            # both are caught so that an unknown macro is always reported as a parsing error
            raise _ParsingError(f"Unknown macro {macro_name} in {inst}") from e

        # convert macro operands to compressed symbol arguments
        str_args = inst.operands[1].value.split('.')[1:]
        symbol_args: int = 0
        for i, str_arg in enumerate(str_args):
            # the macro must not have more arguments than its specification has slots
            if i >= len(macro_spec.args):
                raise _ParsingError(f"Too many arguments for macro {macro_name} in {inst}")

            str_arg = str_arg.lower()
            if macro_spec.args[i] == "":
                continue
            if macro_spec.args[i] == "actor_id":
                actor_id = section_name_to_id(str_arg)
                symbol_args += (actor_id << i * 16)
                continue
            if macro_spec.args[i] == "function_id":
                # function names are looked up with a leading dot
                symbol_args += (function_name_to_id("." + str_arg) << i * 16)
                continue
            if macro_spec.args[i] == "int":
                # integer arguments are truncated to the 16 bits available in a slot
                if str_arg.startswith("0x"):
                    val = int(str_arg, 16) & 0xFFFF
                else:
                    val = int(str_arg) & 0xFFFF
                symbol_args += (val << i * 16)
                continue
            raise ValueError(f"Invalid macro argument {macro_spec.args[i]}")

        # add the macro to the symbol table
        symbol_table.append(
            SymbolTableEntry(
                sid=inst.section_id(),
                type_=macro_spec.type_,
                offset=inst.section_offset(),
                arg=symbol_args,
            ))

    # ----------------------------------------------------------------------------------------------
    # Private: Validation of the parsed data
    def _validate_sections(self, sections: List[CodeSection],
                           instruction_map: InstructionMap) -> None:
        """
        Validate that all sections in the test case have been populated with ELF data
        :param sections: list of sections in the test case
        :param instruction_map: constructed InstructionMap
        :return: None
        :raises _ParsingError: if at least one section was not populated
        :raises _ParsingError: if the instruction map does not match the sections
        """
        if len(instruction_map) != len(sections):
            raise _ParsingError(
                "InstructionMap does not have the same number of sections as the test case")

        for section_obj in sections:
            try:
                _ = section_obj.get_elf_data()  # will throw an exception if the section is not set
            except AssertionError as e:
                raise _ParsingError(f"Failed to find section for actor `{section_obj.name}`") from e

    def _validate_macros(self, test_case: TestCaseProgram, symbol_table: SymbolTable) -> None:
        """ Validate that all macros in the test case are well-formed """
        for symbol in symbol_table:
            if symbol.type_ == 0:  # function
                continue
            macro_spec = self._target_desc.get_macro_spec_from_type(symbol.type_)

            # validate that the actor id is valid
            for i in range(4):
                if macro_spec.args[i] != "actor_id":
                    continue
                target_actor_id = (symbol.arg >> (i * 16)) & 0xFFFF

                # check that the actor exists
                try:
                    actor = test_case.find_actor(actor_id=target_actor_id)
                except KeyError as e:
                    raise _ParsingError(
                        f"Macro references an unknown actor id {target_actor_id}") from e

                # validate that the actor type matches the macro
                if macro_spec.name == "set_k2u_target" and \
                   actor.privilege_level != ActorPL.USER and actor.mode != ActorMode.HOST:
                    raise _ParsingError("Macro set_k2u_target expects a user actor")
                if macro_spec.name == "set_u2k_target" and \
                   actor.privilege_level != ActorPL.KERNEL and actor.mode != ActorMode.HOST:
                    raise _ParsingError("Macro set_u2k_target expects a kernel actor")
                if macro_spec.name == "set_h2g_target" and \
                   actor.mode != ActorMode.HOST and actor.privilege_level != ActorPL.KERNEL:
                    raise _ParsingError("Macro set_h2g_target expects a host actor")
                if macro_spec.name == "set_g2h_target" and \
                   actor.mode != ActorMode.GUEST and actor.privilege_level != ActorPL.KERNEL:
                    raise _ParsingError("Macro set_g2h_target expects a guest actor")


================================================
FILE: rvzr/executor.py
================================================
"""
File: Architecture-independent parts of the adaptor to the executor kernel module

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from __future__ import annotations
from typing import TYPE_CHECKING, List, Tuple, Set, Generator, Optional, Final
from abc import ABC

import sys
import subprocess
import os.path

import numpy as np
import numpy.typing as npt

from rvzr.logs import ExecutorLogger, warning
from rvzr.config import CONF, ConfigException
from rvzr.sandbox import BaseAddrTuple
from rvzr.stats import FuzzingStats
from rvzr.traces import HTrace, RawHTraceSample, HTraceType
from rvzr.tc_components.test_case_data import save_input_sequence_as_rdbf

if TYPE_CHECKING:
    from rvzr.tc_components.test_case_code import TestCaseProgram
    from rvzr.tc_components.test_case_data import InputData

KMOutputLine = Tuple[int, int, int, int, int, int]
ReadingsArray = npt.NDArray[np.void]

STAT = FuzzingStats()


# ==================================================================================================
# Helper functions
# ==================================================================================================
def km_write(value: str, path: str) -> None:
    """
    Configure the executor kernel module by writing a value into one of its files
    (typically located in the /sys filesystem).

    The write is delegated to the shell (`echo -n`), i.e., no trailing newline is added.

    :param value: text to write
    :param path: path of the file to write to
    :raises subprocess.CalledProcessError: if the shell command exits with a non-zero status
    """
    command = f"echo -n {value} > {path}"
    subprocess.run(command, shell=True, check=True)


def _is_smt_enabled() -> bool:
    """
    Check if SMT is enabled on the current CPU.

    The check is based on the "Thread(s) per core" line of the `lscpu` output. If `lscpu`
    fails or the line is missing, SMT is conservatively reported as enabled.

    :return: False if lscpu reports exactly one thread per core, True otherwise
    """
    try:
        out = subprocess.run("lscpu", shell=True, check=True, capture_output=True)
    except subprocess.CalledProcessError:
        warning("executor", "Could not check if SMT is enabled. Is lscpu installed?")
        return True

    for line in out.stdout.decode().split("\n"):
        if line.startswith("Thread(s) per core:"):
            # compare the whole value after the colon rather than only the last character,
            # so that trailing whitespace or counts such as "11" are not misclassified
            threads_per_core = line.split(":", 1)[1].strip()
            return threads_per_core != "1"
    return True


def _can_set_reserved() -> bool:
    """
    Check if the reserved bits requested by the actor configuration can be set on this CPU.

    :return: True if no actor requests a reserved bit, or if the CPU reports at most
             51 physical address bits; False on ARM64 and on CPUs with wider addresses
    """

    def is_requested(properties) -> bool:  # type: ignore
        return 'reserved_bit' in properties and bool(properties['reserved_bit'])

    # nothing to check if no actor asks for a reserved bit
    actors_conf = CONF.get_actors_conf()
    reserved_requested = any(
        is_requested(actors_conf[a]['data_properties'])
        or is_requested(actors_conf[a]['data_ept_properties'])
        for a in actors_conf)
    if not reserved_requested:
        return True

    if CONF.instruction_set == 'arm64':
        return False  # reserved bits are not (yet?) supported on ARM64

    assert CONF.instruction_set == 'x86-64'

    # query the width of physical addresses from lscpu
    lscpu = subprocess.run(
        "lscpu | grep 'Address sizes' | awk '{print $3}'",
        shell=True,
        check=True,
        capture_output=True)
    physical_bits = int(lscpu.stdout.decode().strip())
    return physical_bits <= 51


def _is_kernel_module_installed() -> bool:
    """ Check whether the `trace` file of the executor exists under /sys/rvzr_executor """
    trace_file = "/sys/rvzr_executor/trace"
    return os.path.isfile(trace_file)


def _configure_kernel_module() -> None:
    """
    Pass the executor-related configuration options (number of warm-up rounds, pre-run
    flush flag, measurement mode) to the kernel module.
    """
    warmups = str(CONF.executor_warmups)
    km_write(warmups, '/sys/rvzr_executor/warmups')

    pre_run_flush = "1" if CONF.enable_pre_run_flush else "0"
    km_write(pre_run_flush, "/sys/rvzr_executor/enable_pre_run_flush")

    measurement_mode = CONF.executor_mode
    km_write(measurement_mode, "/sys/rvzr_executor/measurement_mode")


def _read_trace(n_reps: int,
                n_inputs: int,
                arch_mode: bool = False) -> Generator[Tuple[int, int, KMOutputLine], None, None]:
    """
    Generator function that reads and parses the output of the kernel module.
    The generator handles the batched output of the kernel module and yields the traces one by one.
    The traces are read in reverse order.

    Example:
    Assume the kernel module output for n_reps=2 and n_inputs=2 is:
    ```
    htrace1, pfc0, .., pfc4
    htrace0, pfc0, .., pfc4
    done
    htrace1, pfc0, .., pfc4
    htrace0, pfc0, .., pfc4
    done
    ```
    then the generator will yield the following tuples:
    ```
    (0, 1, [htrace1, pfc0, .., pfc4])
    (0, 0, [htrace0, pfc0, .., pfc4])
    (1, 1, [htrace1, pfc0, .., pfc4])
    (1, 0, [htrace0, pfc0, .., pfc4])
    ```

    :param n_reps: number of repetitions of the measurements
    :param n_inputs: number of inputs
    :param arch_mode: if True, the kernel module is in architecture mode
    :return: a generator that yields tuples (repetition, input_id, (htrace, pfc0, ..., pfc4))
    :raises IOError: if the kernel module output is malformed (a non-integer value,
                     an unexpected number of values, or a zero trace outside of arch mode)
    """
    if n_inputs <= 0:
        return

    rep_id = 0
    last_input_id = n_inputs - 1
    while rep_id < n_reps:
        input_id: int = last_input_id
        reading_finished: bool = False
        while not reading_finished:
            # read the next batch of traces from the kernel module
            output = subprocess.check_output(
                f"taskset -c {CONF.executor_taskset} cat /sys/rvzr_executor/trace", shell=True)
            lines = output.decode().split("\n")

            # parse the output
            for line in lines:
                # skip empty lines
                if not line:
                    continue

                # we reached the end of the batch? read the next batch
                if 'done' in line:
                    reading_finished = True
                    break

                # transform the line into a sequence of ints;
                # a value that is not an integer means that the output is malformed
                try:
                    line_ints = tuple(int(x) for x in line.split(","))
                except ValueError as e:
                    warning("executor", f"Unexpected non-integer value in line: {line}")
                    _rewind_km_output_to_end()
                    raise IOError("Malformed kernel module output: non-integer value") from e

                # if the line width is unexpected, it's an error
                if len(line_ints) != 6:
                    warning("executor", f"Unexpected line width: {len(line_ints)}")
                    _rewind_km_output_to_end()
                    raise IOError(
                        f"Malformed kernel module output: unexpected line width {len(line_ints)}")

                # if the hardware trace is zero, it's an error (except for arch mode)
                if line_ints[0] == 0 and not arch_mode:
                    warning("executor", "Kernel module error; see dmesg for details")
                    _rewind_km_output_to_end()
                    raise IOError("Kernel module error; see dmesg for details")

                # yield the trace
                yield rep_id, input_id, line_ints

                # move to next input
                input_id -= 1
                if input_id < 0:
                    # if we reached the end of a repetition, restart the input counter
                    input_id = last_input_id
                    rep_id += 1

        # a batch must always end on a repetition boundary
        assert input_id == last_input_id, f"input_id: {input_id}, rep_id: {rep_id}"


def _rewind_km_output_to_end() -> None:
    """
    Consume the remaining output of the kernel module: keep reading the trace file
    until a read returns output that contains 'done'.
    """
    read_cmd = f"taskset -c {CONF.executor_taskset} cat /sys/rvzr_executor/trace"
    output = subprocess.check_output(read_cmd, shell=True)
    while 'done' not in output.decode():
        output = subprocess.check_output(read_cmd, shell=True)


# ==================================================================================================
# Public: Implementation of the python adapter to the executor kernel module
# ==================================================================================================
class Executor(ABC):
    """
    Interface for the executor module. The executor is a module responsible for executing
    test cases on the CPU-under-test and collecting the corresponding hardware traces.

    The high-level workflow is as follows:
    1. Load the test case code into the kernel module.
    2. Load the test case data (i.e., input sequence) into the kernel module.
    3. Run the measurements by calling the kernel module (see _get_raw_measurements). Each
       measurement is repeated `n_reps` times.
    4. Aggregate the measurements into sets of traces (see _aggregate_measurements).
    """

    _curr_test_case: Optional[TestCaseProgram] = None
    _ignore_list: Set[int]
    _log: Final[ExecutorLogger]
    _TSC_MASK: Final[np.uint64] = np.uint64(0x0FFFFFFFFFFFFFF0)

    _enable_mismatch_check_mode: Final[bool]
    """ mismatch_check_mode: If True, the executor will return GPR values instead of
    hardware traces, which is used to check for mismatches between the model and the executor """

    def __init__(self, enable_mismatch_check_mode: bool = False, skip_setup: bool = False):
        """
        :param enable_mismatch_check_mode: if True, the executor returns GPR values instead
                                           of hardware traces
        :param skip_setup: if True, neither the environment checks nor the kernel module
                           configuration are performed
        :raises ConfigException: if reserved bits are requested but cannot be set on this CPU
        """
        super().__init__()
        self._enable_mismatch_check_mode = enable_mismatch_check_mode
        self._log = ExecutorLogger()
        self._ignore_list = set()

        if skip_setup:
            warning("executor", "Executor starting without setting up the kernel module")
            return

        # Environment checks
        smt_enabled = _is_smt_enabled()
        if smt_enabled and not enable_mismatch_check_mode:
            warning("executor", "SMT is on! You may experience false positives.")
        reserved_ok = _can_set_reserved()
        if not reserved_ok:
            raise ConfigException("Cannot set reserved bits on this CPU")

        # Kernel module setup; abort if the module is not available
        if not _is_kernel_module_installed():
            print("x86 executor: kernel module not installed\n\n"
                  "Go to https://microsoft.github.io/side-channel-fuzzer/quick-start/ for "
                  "installation instructions.")
            sys.exit(1)
        _configure_kernel_module()
        self._set_vendor_specific_features()

    # ==============================================================================================
    # Public Interface: Test Case Loading and Tracing
    def load_test_case(self, test_case: TestCaseProgram) -> None:
        """
        Load a test case into the executor.
        This function must be called before calling `trace_test_case`.

        Before the test case is written, the function passes the mismatch check mode flag
        to the kernel module. The order matters: the kernel module links the test case code
        with different measurement functions based on this flag.

        Loading a test case also clears the ignore list, since the IDs collected for the
        previous program are not relevant for the new one.

        :param test_case: the test case object to load
        :return: None
        """
        # the flag goes first (see above)
        dbg_gpr_flag = "1" if self._enable_mismatch_check_mode else "0"
        km_write(dbg_gpr_flag, "/sys/rvzr_executor/enable_dbg_gpr_mode")

        # send the test case binary to the kernel module
        binary = test_case.get_obj()
        binary.save_rcbf('/sys/rvzr_executor/test_case')
        self._curr_test_case = test_case

        # start with a fresh ignore list
        self._ignore_list = set()

    def trace_test_case(self, inputs: List[InputData], n_reps: int) -> List[HTrace]:
        """ Call the executor kernel module to collect the hardware traces for
         the test case (previously loaded with `load_test_case`) and the given inputs.

        :param inputs: list of inputs to be used for the test case
        :param n_reps: number of times to repeat each measurement
        :return: a list of HTrace objects, one for each input
        :raises IOError: if the kernel module output is malformed
        """
        # Skip if it's a dummy call
        if not inputs:
            return []
        n_inputs = len(inputs)

        # Skip if all inputs are ignored
        if n_inputs <= len(self._ignore_list):
            warning("executor", "All inputs are ignored. Skipping measurements")
            return [HTrace.empty_trace() for _ in range(n_inputs)]

        # Store statistics
        STAT.executor_reruns += n_reps * n_inputs

        # Transfer inputs to the kernel module
        # TODO: that's a quick-and-dirty optimization to reduce the number of KM calls;
        # it should be rewritten
        input_sequence = inputs if n_reps % 5 != 0 or n_inputs >= 1000 else inputs * 5
        save_input_sequence_as_rdbf(input_sequence, '/sys/rvzr_executor/inputs')

        # Check that the transfer was successful
        with open('/sys/rvzr_executor/inputs', 'r') as f:
            if f.readline() != '1\n':
                raise IOError("Error writing inputs to the kernel module")

        # Call the kernel module and read traces
        all_readings: ReadingsArray = np.ndarray(shape=(n_inputs, n_reps), dtype=RawHTraceSample)
        for rep_id, input_id, readings in \
                _read_trace(n_reps, n_inputs, arch_mode=self._enable_mismatch_check_mode):
            all_readings[input_id][rep_id] = readings

        # Post-process results and return a list of HTrace objects
        traces = self._raw_readings_to_traces(all_readings, n_inputs)
        self._log.dbg_dump_raw_traces(traces)
        return traces

    def _identify_trace_type(self) -> HTraceType:
        """ Identify the type of the traces based on the configuration """
        if self._enable_mismatch_check_mode:
            return "reg"
        if CONF.executor_mode == 'TSC':
            return "tsc"
        return "cache"

    def _raw_readings_to_traces(self, all_readings: ReadingsArray, n_inputs: int) -> List[HTrace]:
        """ Convert the raw readings into HTrace objects and perform post-processing if needed """
        traces = []
        trace_type = self._identify_trace_type()
        for input_id in range(n_inputs):
            raw = all_readings[input_id]

            # No post-processing in mismatch check mode
            if self._enable_mismatch_check_mode:
                traces.append(HTrace(raw, trace_type))
                continue

            # Zero-out traces for ignored inputs
            if input_id in self._ignore_list:
                traces.append(HTrace.invalid_trace(trace_type))
                continue

            # When using TSC mode, we need to mask the lower 4 bits of the trace
            if CONF.executor_mode == 'TSC':
                raw['trace'] &= self._TSC_MASK

            traces.append(HTrace(raw, trace_type))
        return traces

    # ==============================================================================================
    # Public Interface: Base Addresses
    def read_base_addresses(self) -> BaseAddrTuple:
        """
        Query the executor kernel module for the base addresses of the two sandbox regions
        (data and code). The addresses are read as hexadecimal strings and converted to ints.

        This data is primarily used to synchronize the memory layout between the executor
        and the model.

        :return: a tuple with the base addresses of the data and code regions
        """
        sysfs_files = ('/sys/rvzr_executor/print_data_base', '/sys/rvzr_executor/print_code_base')

        # read both files first, convert afterwards
        first_lines = []
        for path in sysfs_files:
            with open(path, 'r') as f:
                first_lines.append(f.readline())

        data_base, code_base = (int(line, 16) for line in first_lines)
        return data_base, code_base

    # ==============================================================================================
    # Public Interface: Ignore List
    def set_ignore_list(self, ignore_list: List[int]) -> None:
        """
        Sets a list of inputs IDs that should be ignored by the executor.
        The executor will executed the inputs with these IDs as normal (in case they are
        necessary for priming the uarch state), but their htraces will be set to zero

        :param ignore_list: a list of input IDs to ignore
        """
        self._ignore_list = set(ignore_list)

    def extend_ignore_list(self, ignore_list: List[int]) -> None:
        """
        Add a list of new inputs IDs to the current ignore list.

        :param ignore_list: a list of input IDs to add to the ignore list
        """
        self._ignore_list.update(ignore_list)

    # ==============================================================================================
    # Public Interface: Quick and Dirty Mode
    def set_quick_and_dirty(self, state: bool) -> None:
        """
        Switch the quick and dirty mode of the executor on or off. In this mode, the executor
        will skip some of the stabilization phases, which will make the measurements faster but
        less reliable.

        :param state: True to enable the quick and dirty mode, False to disable it
        """
        flag = "1" if state else "0"
        km_write(flag, "/sys/rvzr_executor/enable_quick_and_dirty_mode")

    # ==============================================================================================
    # Private Interface: Vendor-specific Features
    def _set_vendor_specific_features(self) -> None:
        """
        Set vendor-specific features in the kernel module.

        This implementation does nothing. The method is invoked at the end of `__init__`,
        after the kernel module has been configured (it is not invoked when the setup
        is skipped).
        NOTE(review): presumably meant to be overridden by vendor-specific subclasses -- confirm
        """


================================================
FILE: rvzr/executor_km/.clang-format
================================================
ColumnLimit: 100
IndentWidth: 4
BreakBeforeBraces: Linux
AllowShortIfStatementsOnASingleLine: false
AlignConsecutiveMacros:
  Enabled: true
  AcrossEmptyLines: false
  AcrossComments: false


================================================
FILE: rvzr/executor_km/.gitignore
================================================
.tmp*
*.o
*.cmd
*.symvers
*.order
*.ko
*.mod
*.mod.c
start_qemu.sh
update_module.sh

================================================
FILE: rvzr/executor_km/Makefile
================================================
NAME = rvzr_executor
KDIR=/lib/modules/$(shell uname -r)/build

# ==================================================================================================
# HW configuration
# ==================================================================================================
# Determine CPU vendor
ifneq ($(shell grep "Intel" /proc/cpuinfo),)
VENDOR_ID = 1
else ifneq ($(shell grep "AMD" /proc/cpuinfo),)
VENDOR_ID = 2
else ifneq ($(shell lscpu | grep "aarch64"),)
VENDOR_ID = 3
else
$(error "Unknown CPU vendor")
endif

# Physical address width
PHYSICAL_WIDTH = $(shell grep -m1 "bits physical," /proc/cpuinfo | awk '{print $$4}')

# Cache configuration
ifeq ($(shell ls /sys/devices/system/cpu/cpu0/cache/index0/ways_of_associativity 2>/dev/null),)
$(error "Cache info not found")
endif
L1D_ASSOCIATIVITY=$(shell cat /sys/devices/system/cpu/cpu0/cache/index0/ways_of_associativity)
L1D_SIZE_KB=$(shell cat /sys/devices/system/cpu/cpu0/cache/index0/size | sed 's/[^0-9]*//g')

# Check if VMBUILD is required
ifndef VMBUILD
sys_vendor = $(shell cat /sys/devices/virtual/dmi/id/sys_vendor)
is_vm_vendor = 'no'
ifeq ($(sys_vendor), QEMU)
is_vm_vendor = 'yes'
endif
ifeq ($(sys_vendor), Microsoft Corporation)
is_vm_vendor = 'yes'
endif
endif

# ==================================================================================================
# Files
# ==================================================================================================
# Object files
# Architecture-independent sources
SRC_ = input_parser.c \
	test_case_parser.c \
	code_loader.c \
	data_loader.c \
	sandbox_manager.c \
	measurement.c \
	main.c \
	macro_expansion.c \
	page_tables_host.c

# x86-only sources (shared by the Intel and AMD builds)
SRC_X86 = x86/vmx.c \
	x86/svm.c \
	x86/perf_counters.c \
	x86/page_tables_guest.c \
	x86/special_registers.c \
	x86/idt.c \
	x86/macros.c
ASM_X86 = x86/fault_handlers.S

# ARM64-only sources
SRC_ARM64 = arm64/fault_handler.c \
	arm64/perf_counters.c \
	arm64/special_registers.c \
	arm64/page_tables_guest.c \
	arm64/macros.c
ASM_ARM64 = arm64/exception.S

# Append the architecture-specific lists: VENDOR_ID 1 and 2 select x86, 3 selects ARM64
ifneq ($(filter 1 2,$(VENDOR_ID)),)
SRC_ += $(SRC_X86)
ASM_ += $(ASM_X86)
else ifeq ($(VENDOR_ID), 3)
SRC_ += $(SRC_ARM64)
ASM_ += $(ASM_ARM64)
endif

# The module is linked from one object per C source and one per assembly source
obj-m += $(NAME).o
$(NAME)-objs += $(SRC_:.c=.o) $(ASM_:.S=.o)

# ==================================================================================================
# Flags
# ==================================================================================================
# Common build flags
# (include path, C dialect and warning tweaks, debug info, and the HW parameters
# detected above, exported to the sources as preprocessor definitions)
COMMON_CFLAGS := -I$(src)/include \
	-std=gnu11 -Wno-declaration-after-statement -Wno-comment \
	-g -DDEBUG \
	-DVENDOR_ID=$(VENDOR_ID) \
	-DFORCE_SMAP_OFF \
	-DPHYSICAL_WIDTH=$(PHYSICAL_WIDTH) \
	-DL1D_ASSOCIATIVITY=$(L1D_ASSOCIATIVITY) \
	-DL1D_SIZE_KB=$(L1D_SIZE_KB)

# x86 builds (VENDOR_ID 1 or 2) additionally get -msse2
ifneq ($(filter 1 2,$(VENDOR_ID)),)
COMMON_CFLAGS += -msse2
endif

# Forward VMBUILD to the sources when it was set on the command line
ifdef VMBUILD
COMMON_CFLAGS += -DVMBUILD
endif

# Set both EXTRA_CFLAGS (old kernels) and ccflags-y (new kernels) for compatibility
EXTRA_CFLAGS += $(COMMON_CFLAGS)
ccflags-y += $(COMMON_CFLAGS)

# Flags for the assembly sources: same include path and HW parameters as for C
COMMON_AFLAGS := -I$(src)/include \
	-DVENDOR_ID=$(VENDOR_ID) -DPHYSICAL_WIDTH=$(PHYSICAL_WIDTH) \
	-DL1D_ASSOCIATIVITY=$(L1D_ASSOCIATIVITY) -DL1D_SIZE_KB=$(L1D_SIZE_KB)

# Set both EXTRA_AFLAGS (old kernels) and asflags-y (new kernels) for compatibility
EXTRA_AFLAGS += $(COMMON_AFLAGS)
asflags-y += $(COMMON_AFLAGS)

# ==================================================================================================
# Workarounds
# ==================================================================================================
# Suppress objtool warnings - a lot of code in the module violates the checks intentionally,
# so it's impossible to fix
# GREP_FILTER is an extended regular expression; the `all` target pipes the build output
# through `grep -vE`, so every output line matching one of the alternatives is dropped.
# NOTE(review): "undefined stack stae" looks like a misspelling of "undefined stack state",
# which is listed as well - confirm and remove the misspelled alternative.
GREP_FILTER = "return found in RETHUNK|indirect call found in RETPOLINE|call without frame pointer|undefined stack stae|return with modified stack frame|unsupported instruction in callable|undefined stack state|ENDBR: "
# kbuild switch that excludes the objects of this directory from objtool validation
OBJECT_FILES_NON_STANDARD := y

# File-specific flags
CFLAGS_code_loader.o := -Wno-attribute-warning # workaround for __write_overflow_field warning

# ==================================================================================================
# build targets
# ==================================================================================================
# None of the targets below produces a file named after the target
.PHONY: all clean install uninstall

# Build the kernel module against the headers of the running kernel.
# Unless VMBUILD is set, the build is refused when the HW detection above found a VM vendor.
# The recursive build uses $(MAKE) so that the command-line flags and variables of the outer
# make are forwarded to the kernel build the way GNU make expects for sub-makes.
# NOTE: the output is filtered through grep, hence the exit status of the recipe is the one
# of grep, not of the kernel build.
all:
ifndef VMBUILD
ifeq ($(is_vm_vendor), 'yes')
	$(error ERROR: VM or WSL environment detected; use `make VMBUILD=1`)
endif
endif
	$(MAKE) -C $(KDIR) M=$(PWD) -j modules 2>&1 | grep -vE $(GREP_FILTER)

# Remove the build products via the kernel build system
clean:
	$(MAKE) -C $(KDIR) M=$(PWD) clean

# Load the built module into the running kernel
install:
	sudo insmod $(NAME).ko

# Unload the module; a failure (e.g., the module is not loaded) is ignored
uninstall:
	sudo rmmod $(NAME) || true

# --------------- debugging crashes ---------------
# Extract the debug info of the module into $(NAME).dbg and print the content of
# /sys/module/$(NAME)/sections/.text (the address to pass to gdb, see below)
dbg_symbols:
	objcopy --only-keep-debug $(NAME).o $(NAME).dbg
	sudo cat /sys/module/$(NAME)/sections/.text
# continue manually with gdb:
# (if the executor is in a VM):
#       scp vm:revizor_dir/rvzr_executor.dbg .
# gdb -ex "target remote localhost:1234" -ex "set substitute-path /home/revizor_dir /home/revizor_dir"
#   target remote localhost:1234
#   add-symbol-file rvzr_executor.dbg <addr>  # addr is the address printed by the cat command above
#   b run_experiment  # or any other function that you want to debug
#   (if guest VM path does not match the host path):
#       set substitute-path /home/revizor_dir /home/revizor_dir
#   c


================================================
FILE: rvzr/executor_km/arm64/asm_snippets.h
================================================
/// File: Building blocks for creating macros; ARM64 version
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#ifndef _ARM64_ASM_SNIPPETS_H_
#define _ARM64_ASM_SNIPPETS_H_

#include "hardware_desc.h"
#include "measurement.h"
#include "registers.h"

/// State machine of the tracing process
/// SET_SR_STARTED and SET_SR_ENDED clear bits [7:0] of STATUS_REGISTER_32 and then OR the
/// corresponding STATUS_* constant into it; the remaining bits are preserved.
/// TEST_SR_ENDED copies STATUS_REGISTER into x16, masks it down to the low byte and compares
/// it with STATUS_ENDED, leaving the result in the condition flags.
///   clobber (TEST_SR_ENDED only): x16, nzcv
#define SET_SR_STARTED()                                                                           \
    "and " STATUS_REGISTER_32 ", " STATUS_REGISTER_32 ", #0xFFFFFF00 \n"                           \
    "orr " STATUS_REGISTER_32 ", " STATUS_REGISTER_32 ", " xstr(STATUS_STARTED) " \n"
#define SET_SR_ENDED()                                                                             \
    "and " STATUS_REGISTER_32 ", " STATUS_REGISTER_32 ", #0xFFFFFF00 \n"                           \
    "orr " STATUS_REGISTER_32 ", " STATUS_REGISTER_32 ", " xstr(STATUS_ENDED) " \n"
#define TEST_SR_ENDED()                                                                            \
    "mov x16, " STATUS_REGISTER " \n"                                                              \
    "and x16, x16, #0xFF \n"                                                                       \
    "cmp x16, " xstr(STATUS_ENDED) " \n"

/// ================================================================================================
/// Shortcuts
/// ================================================================================================
// SPEC_FENCE: a data synchronization barrier (dsb SY) followed by an instruction
//             synchronization barrier (isb)
// CACHE_FLUSH: `dc civac` applied to the address held in the register ADDR
#define SPEC_FENCE()      "dsb SY \n isb \n"
#define CACHE_FLUSH(ADDR) "dc civac, " ADDR "\n"

// mov_imm_to_reg: load the 64-bit constant SRC into the register DEST in four 16-bit chunks;
// movz writes bits [15:0] and zeroes the rest of DEST, the three movk instructions then
// insert bits [31:16], [47:32] and [63:48] without touching the other bits.
// DEST is a string literal with the register name; SRC is stringified with xstr().
// clang-format off
#define mov_imm_to_reg(DEST, SRC)                                                                      \
    "movz " DEST ", #(" xstr(SRC) ") & 0xFFFF, lsl #0 \n"                                          \
    "movk " DEST ", #(" xstr(SRC) " >> 16) & 0xFFFF, lsl #16 \n"                                   \
    "movk " DEST ", #(" xstr(SRC) " >> 32) & 0xFFFF, lsl #32 \n"                                   \
    "movk " DEST ", #(" xstr(SRC) " >> 48) & 0xFFFF, lsl #48 \n"
// clang-format on

/// ================================================================================================
/// MSR and Performance Counter accessors
/// ================================================================================================

// READ_MSR_START: after a speculation fence, set DEST to the negated value of the system
//                 register ID (DEST = 0 - ID); paired with READ_MSR_END
// clobber: x16
#define READ_MSR_START(ID, DEST)                                                                   \
    SPEC_FENCE()                                                                                   \
    "mov " DEST ", #0 \n"                                                                          \
    "mrs x16, " ID " \n"                                                                           \
    "sub " DEST ", " DEST ", x16 \n"

// READ_MSR_END: after a speculation fence, add the current value of the system register ID
//               to DEST; when DEST was initialized by READ_MSR_START, it ends up holding
//               the difference between the two reads
// clobber: x16
#define READ_MSR_END(ID, DEST)                                                                     \
    SPEC_FENCE()                                                                                   \
    "mrs x16, " ID " \n"                                                                           \
    "add " DEST ", " DEST ", x16 \n"

// READ_ONE_PFC: select the performance counter number ID by writing it to pmselr_el0,
//               then read the selected counter (pmxevcntr_el0) into DEST
// clobber: DEST, pmselr_el0
#define READ_ONE_PFC(ID, DEST)                                                                     \
    "mov " DEST ", " ID " \n"                                                                      \
    "msr pmselr_el0, " DEST " \n"                                                                  \
    "mrs " DEST ", pmxevcntr_el0 \n"

// READ_PFC_START: zero PFC0-PFC2, then subtract the current values of the performance
//                 counters 1 and 2 from PFC0 and PFC1, respectively (PFC2 stays zero)
// clobber: x16, PFC0, PFC1, PFC2, pmselr_el0
// clang-format off
#define READ_PFC_START() \
        SPEC_FENCE() \
        "mov " PFC0 ", #0 \n" \
        "mov " PFC1 ", #0 \n" \
        "mov " PFC2 ", #0 \n" \
        READ_ONE_PFC("1", "x16") \
        "sub " PFC0 ", " PFC0 ", x16 \n" \
        READ_ONE_PFC("2", "x16") \
        "sub " PFC1 ", " PFC1 ", x16 \n"

// READ_PFC_END: add the current values of the performance counters 1 and 2 to PFC0 and
//               PFC1; after a preceding READ_PFC_START, PFC0/PFC1 hold the counter deltas
// clobber: x16, PFC0, PFC1, pmselr_el0
#define READ_PFC_END() \
        SPEC_FENCE() \
        READ_ONE_PFC("1", "x16") \
        "add " PFC0 ", " PFC0 ", x16 \n" \
        READ_ONE_PFC("2", "x16") \
        "add " PFC1 ", " PFC1 ", x16 \n"
// clang-format on

/// ================================================================================================
/// Detection of Interrupts
/// ================================================================================================
/// @brief Start monitoring SMIs by reading the current value of the SMI counter (MSR ???)
///        and storing it in the STATUS_REGISTER[63:32]
///        NOTE: not implemented on ARM64 yet; the macro currently expands to nothing
///  clobber: none (empty expansion)
#define READ_SMI_START() // FIXME: unimplemented

/// @brief End monitoring SMIs by reading the current value of the SMI counter (MSR ???)
///        and storing the difference between the current and the previous value
///        in the STATUS_REGISTER[31:0]
///        NOTE: not implemented on ARM64 yet; the macro currently expands to nothing
/// clobber: none (empty expansion)
#define READ_SMI_END() // FIXME: unimplemented

/// ================================================================================================
/// Pre- and Post- measurement macros
/// ================================================================================================

/// @brief Loading of register values from the main actor's memory
///        The macro temporarily points sp at MEMORY_BASE_REGISTER + REG_INIT_OFFSET and pops
///        eight 64-bit values from there into x0-x7; the seventh value (x6) is also written
///        to the condition flags (nzcv) and the eighth value (x7) becomes the new sp.
///        Expands to a complete `asm volatile(...);` statement (including the semicolon).
/// clobber: x0-x7, nzcv, sp
// clang-format off
#define SET_REGISTER_FROM_INPUT() \
    asm volatile("\n"   \
    "mov x0, #"xstr(REG_INIT_OFFSET)" \n" \
    "add sp, "MEMORY_BASE_REGISTER", x0 \n" \
    "ldp x0, x1, [sp], #16\n" \
    "ldp x2, x3, [sp], #16\n" \
    "ldp x4, x5, [sp], #16\n" \
    "ldp x6, x7, [sp], #16\n" \
    "msr nzcv, x6\n" \
    "mov sp, x7\n");
// clang-format on

/// ================================================================================================
/// Measurement primitives
/// ================================================================================================

// clang-format off
// PRIME_ONE_SET(BASE, OFFSET, TMP, ACC): perform L1D_ASSOCIATIVITY loads, the first one from
// BASE + OFFSET (+ ACC) and each following one L1D_CONFLICT_DISTANCE bytes (+ ACC) further.
// Every loaded value is placed into ACC and added to the next address, which chains
// the loads through a data dependency.
// clobber: TMP, ACC
//
// The expansion is assembled from the following internal building blocks:
//   PRIME_FIRST_WAY_  - compute the first address and load from it
//   PRIME_NEXT_WAY_   - advance by L1D_CONFLICT_DISTANCE and load again
//   PRIME_TWO_WAYS_   - two consecutive PRIME_NEXT_WAY_
//   PRIME_FOUR_WAYS_  - four consecutive PRIME_NEXT_WAY_
#define PRIME_FIRST_WAY_(BASE, OFFSET, TMP, ACC) \
    "mov "TMP", "BASE" \n" \
    "add "TMP", "TMP", "OFFSET" \n" \
    "add "TMP", "TMP", "ACC" \n" \
    "ldr "ACC", ["TMP"]\n"
#define PRIME_NEXT_WAY_(TMP, ACC) \
    "add "TMP", "TMP", #"xstr(L1D_CONFLICT_DISTANCE)" \n" \
    "add "TMP", "TMP", "ACC" \n" \
    "ldr "ACC", ["TMP"]\n"
#define PRIME_TWO_WAYS_(TMP, ACC) \
    PRIME_NEXT_WAY_(TMP, ACC) \
    PRIME_NEXT_WAY_(TMP, ACC)
#define PRIME_FOUR_WAYS_(TMP, ACC) \
    PRIME_TWO_WAYS_(TMP, ACC) \
    PRIME_TWO_WAYS_(TMP, ACC)

#if L1D_ASSOCIATIVITY == 2
// 1 + 1 loads
#define PRIME_ONE_SET(BASE, OFFSET, TMP, ACC) \
    PRIME_FIRST_WAY_(BASE, OFFSET, TMP, ACC) \
    PRIME_NEXT_WAY_(TMP, ACC)
#elif L1D_ASSOCIATIVITY == 4
// 1 + 1 + 2 loads
#define PRIME_ONE_SET(BASE, OFFSET, TMP, ACC) \
    PRIME_FIRST_WAY_(BASE, OFFSET, TMP, ACC) \
    PRIME_NEXT_WAY_(TMP, ACC) \
    PRIME_TWO_WAYS_(TMP, ACC)
#elif L1D_ASSOCIATIVITY == 8
// 1 + 1 + 2 + 4 loads
#define PRIME_ONE_SET(BASE, OFFSET, TMP, ACC) \
    PRIME_FIRST_WAY_(BASE, OFFSET, TMP, ACC) \
    PRIME_NEXT_WAY_(TMP, ACC) \
    PRIME_TWO_WAYS_(TMP, ACC) \
    PRIME_FOUR_WAYS_(TMP, ACC)
#else
#error "Unsupported L1D_ASSOCIATIVITY"
#endif
// clang-format on

/// @brief Prime part of the Prime+Probe attack
///        Repeats MAX_REPS times: walk OFFSET from 0 up to (but excluding)
///        L1D_CONFLICT_DISTANCE in steps of 64 bytes and apply PRIME_ONE_SET to
///        BASE + OFFSET in every step. DEPENDENCY_REGISTER is reset to 0 at the start of
///        each repetition and serves as the accumulator of PRIME_ONE_SET.
///        Uses the local numeric labels 1 and 2.
// clobber: REP_COUNTER, OFFSET, TMP, DEPENDENCY_REGISTER, nzcv
// clang-format off
#define PRIME(BASE, OFFSET, TMP, DEPENDENCY_REGISTER, REP_COUNTER, MAX_REPS) \
    SPEC_FENCE() \
    "mov "REP_COUNTER", "MAX_REPS"\n" \
    "1: \n" \
        "mov "OFFSET", 0 \n" \
        "mov "DEPENDENCY_REGISTER", 0 \n" \
        "2: \n" \
            SPEC_FENCE() \
            PRIME_ONE_SET(BASE, OFFSET, TMP, DEPENDENCY_REGISTER) \
            "add "OFFSET", "OFFSET", #64 \n" \
            "cmp "OFFSET", #"xstr(L1D_CONFLICT_DISTANCE)" \n" \
            "b.lt 2b \n" \
        "sub "REP_COUNTER", "REP_COUNTER", #1 \n" \
        "cmp "REP_COUNTER", xzr \n" \
        "b.ne 1b \n" \
    SPEC_FENCE()
// clang-format on

// clang-format off
/// @brief Probe part of the Prime+Probe attack
///        Walks OFFSET from L1D_CONFLICT_DISTANCE - 64 down to 0 in steps of 64 bytes.
///        In every step, performance counter 0 is read before and after re-accessing the
///        addresses of PRIME_ONE_SET at BASE + OFFSET; if the two readings differ, bit 0 of
///        TRACE is set. TRACE is then rotated right by one bit, so each step contributes one
///        bit to the resulting trace.
///        Uses the local numeric labels 1 and 2.
// clobber: TRACE, DEPENDENCY_REGISTER, OFFSET, EVICT_COUNT, TMP, pmselr_el0, nzcv
// clang-format off
#define PROBE(BASE, OFFSET, DEPENDENCY_REGISTER, EVICT_COUNT, TMP, TRACE) \
    "mov "TRACE", 0 \n" \
    "mov "DEPENDENCY_REGISTER", 0 \n" \
    "mov "OFFSET", #"xstr(L1D_CONFLICT_DISTANCE)" \n" \
    "sub "OFFSET", "OFFSET", #64 \n" \
    "1: \n" \
        SPEC_FENCE() \
        READ_ONE_PFC("0", EVICT_COUNT) \
        SPEC_FENCE() \
        PRIME_ONE_SET(BASE, OFFSET, TMP, DEPENDENCY_REGISTER) \
        SPEC_FENCE() \
        READ_ONE_PFC("0", TMP) \
        "cmp "TMP", "EVICT_COUNT" \n" \
        "b.eq 2f \n" \
        "  orr "TRACE", "TRACE", #1 \n" \
        "2: \n" \
        "mov "TRACE", "TRACE", ror #1 \n" \
        "sub "OFFSET", "OFFSET", #64 \n" \
        "cmp "OFFSET", xzr \n" \
        "b.ge 1b \n" \
    SPEC_FENCE()
// clang-format on

/// @brief Flush part of the Flush+Reload
///        Applies CACHE_FLUSH (dc civac) to every 64-byte step of the 0x1000-byte range
///        starting at BASE, followed by a speculation fence.
///        Uses the local numeric label 1.
// clobber: OFFSET, TMP, nzcv
// clang-format off
#define FLUSH(BASE, OFFSET, TMP) \
    "mov "OFFSET", #0 \n" \
    "1: \n" \
        "add "TMP", "BASE", "OFFSET" \n" \
        CACHE_FLUSH(TMP) \
        "add "OFFSET", "OFFSET", #64 \n" \
        "cmp "OFFSET", #0x1000\n" \
        "b.lt 1b \n" \
    SPEC_FENCE()
// clang-format on

/// @brief Reload part of the Flush+Reload
///        Walks OFFSET from 0 up to (but excluding) 0x1000 in steps of 64 bytes.
///        In every step, performance counter 0 is read before and after a load from
///        BASE + OFFSET; TRACE is shifted left by one bit and its bit 0 is set if the two
///        readings are equal. Each step thus contributes one bit to the resulting trace.
///        Uses the local numeric labels 1 and 2.
// clobber: OFFSET, TRACE, EVICT_COUNT, TMP, pmselr_el0, nzcv
// clang-format off
#define RELOAD(BASE, OFFSET, TMP, EVICT_COUNT, TRACE) \
    "mov "OFFSET", 0 \n" \
    "mov "TRACE", 0 \n" \
    "1: \n" \
        SPEC_FENCE() \
        READ_ONE_PFC("0", EVICT_COUNT) \
        SPEC_FENCE() \
        "add "TMP", "BASE", "OFFSET" \n" \
        "ldr "TMP", ["TMP"] \n" \
        SPEC_FENCE() \
        READ_ONE_PFC("0", TMP) \
        "mov "TRACE", "TRACE", lsl #1 \n" \
        "cmp "TMP", "EVICT_COUNT" \n" \
        "b.ne 2f \n" \
        "  orr "TRACE", "TRACE", #1 \n" \
        "2: \n" \
        "add "OFFSET", "OFFSET", #64 \n" \
        "cmp "OFFSET", #0x1000 \n" \
        "b.lt 1b \n" \
    SPEC_FENCE()
// clang-format on

#endif // _ARM64_ASM_SNIPPETS_H_


================================================
FILE: rvzr/executor_km/arm64/entry_exit_points.h
================================================
/// File: Test case entry and exit points; used by code_loader.c
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

// -----------------------------------------------------------------------------------------------
// Note on registers.
// Some of the registers are reserved for a specific purpose and should never be overwritten.
// See ./docs/registers.md for more information.

#ifndef _ENTRY_EXIT_H_
#define _ENTRY_EXIT_H_

#include "asm_snippets.h"

// Marker values that the template functions below embed into their code with `.quad`;
// each marker occupies TEMPLATE_MARKER_SIZE (8) bytes.
// NOTE(review): presumably code_loader.c searches for these values to find the boundaries
// of the template and the insertion point of the test case - confirm against code_loader.c
#define TEMPLATE_START                     0x0000111100001111
#define TEMPLATE_INSERT_TC                 0x0000222200002222
#define TEMPLATE_DEFAULT_EXCEPTION_LANDING 0x0000333300003333
#define TEMPLATE_END                       0x0000444400004444
#define TEMPLATE_MARKER_SIZE               8

// clang-format off
/// @brief Entry sequence of the measurement code.
///        1. pushes x16-x30 onto the current stack;
///        2. derives the sandbox base registers from the first argument (x0);
///        3. stores the resulting sp at UTIL_BASE_REGISTER + STORED_RSP_OFFSET so that the
///           epilogue can restore it;
///        4. zeroes x0-x15 and initializes HTRACE_REGISTER and STATUS_REGISTER;
///        5. moves sp down by 0x1000 bytes.
///        The sequence is written purely in assembly and does not return to C code in
///        between, hence the register handling is done manually.
static inline void prologue(void)
{
    // As we don't use a compiler to track clobbering,
    // we have to save the callee-saved regs
    // (x16-x30 are pushed; the epilogue pops them in the reverse order)
    asm volatile("" \
        "stp x16, x17, [sp, #-16]!\n"
        "stp x18, x19, [sp, #-16]!\n"
        "stp x20, x21, [sp, #-16]!\n"
        "stp x22, x23, [sp, #-16]!\n"
        "stp x24, x25, [sp, #-16]!\n"
        "stp x26, x27, [sp, #-16]!\n"
        "stp x28, x29, [sp, #-16]!\n"
        "str x30, [sp, #-16]!\n"

        // x20 = main_area of actor 0 (passed in x0, the first argument of measurement_code)
        "mov "MEMORY_BASE_REGISTER", x0\n"

        // x21 = sandbox->util (x20 - UTIL_REL_TO_MAIN)
        "mov "UTIL_BASE_REGISTER", "MEMORY_BASE_REGISTER"\n"
        mov_imm_to_reg("x0", UTIL_REL_TO_MAIN)
        "sub "UTIL_BASE_REGISTER", "UTIL_BASE_REGISTER", x0\n"

        // sandbox->util->stored_rsp = sp
        // (the value of sp after the pushes above)
        "mov x0, sp\n"
        "mov x1, #"xstr(STORED_RSP_OFFSET)"\n"
        "add x1, "UTIL_BASE_REGISTER", x1\n"
        "str x0, [x1]\n"

        // clear the rest of the registers
        "mov x0, 0\n"
        "mov x1, 0\n"
        "mov x2, 0\n"
        "mov x3, 0\n"
        "mov x4, 0\n"
        "mov x5, 0\n"
        "mov x6, 0\n"
        "mov x7, 0\n"
        "mov x8, 0\n"
        "mov x9, 0\n"
        "mov x10, 0\n"
        "mov x11, 0\n"
        "mov x12, 0\n"
        "mov x13, 0\n"
        "mov x14, 0\n"
        "mov x15, 0\n"

        // initialize special registers
        "mov "HTRACE_REGISTER", 0\n"
        mov_imm_to_reg(STATUS_REGISTER, STATUS_UNINITIALIZED)

        // create space on stack
        // "mov rbp, rsp\n"
        "sub sp, sp, #0x1000\n"

        // start monitoring interrupts
        READ_SMI_START()
    );


}

/// @brief Exit sequence of the measurement code.
///        Stores the measurement results (HTrace, PFC0-PFC2, two zeroed slots and the status
///        register) as seven consecutive 64-bit values at UTIL_BASE_REGISTER +
///        MEASUREMENT_OFFSET, restores the sp saved by the prologue, pops x16-x30 and
///        returns to the caller with x0 = 0.
static inline void epilogue(void)
{
    asm volatile(""
        READ_SMI_END()

        // x0 = &latest_measurement
        "mov x0, "UTIL_BASE_REGISTER"\n"
        mov_imm_to_reg("x1", MEASUREMENT_OFFSET)
        "add x0, x0, x1\n"

        // Store the results
        "str "HTRACE_REGISTER", [x0]\n"     // HTrace
        "str "PFC0", [x0, #8]\n"            // PFC0
        "str "PFC1", [x0, #16]\n"           // PFC1
        "str "PFC2", [x0, #24]\n"           // PFC2
        "str xzr, [x0, #32]\n"              // PFC3 (unused)
        "str xzr, [x0, #40]\n"              // PFC4 (unused)
        "str "STATUS_REGISTER", [x0, #48]\n" // Measurement status

        // sp = sandbox->util->stored_rsp
        mov_imm_to_reg("x1", STORED_RSP_OFFSET)
        "add x1, "UTIL_BASE_REGISTER", x1\n"
        "ldr x0, [x1]\n"
        "mov sp, x0\n"

        // restore registers
        // (reverse order of the pushes in the prologue)
        "ldr x30, [sp], #16\n"
        "ldp x28, x29, [sp], #16\n"
        "ldp x26, x27, [sp], #16\n"
        "ldp x24, x25, [sp], #16\n"
        "ldp x22, x23, [sp], #16\n"
        "ldp x20, x21, [sp], #16\n"
        "ldp x18, x19, [sp], #16\n"
        "ldp x16, x17, [sp], #16\n"

        // return 0
        "mov x0, 0\n"
        "ret\n"
    );
}

/// @brief Debugging variant of the exit sequence.
///        Instead of the HTrace and performance counters, it stores the final values of
///        x0-x5 (followed by the status register) as seven consecutive 64-bit values at
///        UTIL_BASE_REGISTER + MEASUREMENT_OFFSET. x7 and x8 are used as scratch registers.
///        The stack restoration and the return (x0 = 0) are the same as in epilogue().
static inline void epilogue_dbg_gpr(void)
{
    asm volatile(""
        READ_SMI_END()

        // x7 = &latest_measurement
        "mov x7, "UTIL_BASE_REGISTER"\n"
        mov_imm_to_reg("x8", MEASUREMENT_OFFSET)
        "add x7, x7, x8\n"

        // Store the results
        // (general-purpose registers x0-x5, then the measurement status)
        "str x0, [x7]\n"
        "str x1, [x7, #8]\n"
        "str x2, [x7, #16]\n"
        "str x3, [x7, #24]\n"
        "str x4, [x7, #32]\n"
        "str x5, [x7, #40]\n"
        "str "STATUS_REGISTER", [x7, #48]\n"

        // sp = sandbox->util->stored_rsp
        mov_imm_to_reg("x0", STORED_RSP_OFFSET)
        "add x0, "UTIL_BASE_REGISTER", x0\n"
        "ldr x0, [x0]\n"
        "mov sp, x0\n"

        // restore registers
        // (reverse order of the pushes in the prologue)
        "ldr x30, [sp], #16\n"
        "ldp x28, x29, [sp], #16\n"
        "ldp x26, x27, [sp], #16\n"
        "ldp x24, x25, [sp], #16\n"
        "ldp x22, x23, [sp], #16\n"
        "ldp x20, x21, [sp], #16\n"
        "ldp x18, x19, [sp], #16\n"
        "ldp x16, x17, [sp], #16\n"

        // return 0
        "mov x0, 0\n"
        "ret\n"
    );
}
// clang-format on

/// @brief Template of the code that runs a test case and records the measurement.
///        Layout: TEMPLATE_START marker, prologue, register initialization, fenced
///        TEMPLATE_INSERT_TC marker (placeholder of the test case), the
///        TEMPLATE_DEFAULT_EXCEPTION_LANDING marker, epilogue, TEMPLATE_END marker.
///        The markers are data words; the function is a template, not directly callable code.
static void main_segment_template(void)
{
    // --- beginning of the template ---
    asm volatile(".quad " xstr(TEMPLATE_START));
    prologue();

    SET_REGISTER_FROM_INPUT();

    // --- placeholder of the test case, fenced on both sides ---
    asm volatile("isb\n dsb SY \n");
    asm volatile(".quad " xstr(TEMPLATE_INSERT_TC) "\n");
    asm volatile("isb\n dsb SY \n");

    // --- default exception landing ---
    // the fall-through path branches over the marker to the local label 1
    asm volatile("b 1f\n"
                 ".quad " xstr(TEMPLATE_DEFAULT_EXCEPTION_LANDING) "\n"
                 "nop\n"
                 "1:nop\n");

    // --- end of the template ---
    epilogue();
    asm volatile(".quad " xstr(TEMPLATE_END));
}

/// @brief Debugging variant of main_segment_template: identical layout, but the exit
///        sequence is epilogue_dbg_gpr(), which records x0-x5 instead of the HTrace and
///        performance counters.
static void main_segment_template_dbg_gpr(void)
{
    // --- beginning of the template ---
    asm volatile(".quad " xstr(TEMPLATE_START));
    prologue();

    SET_REGISTER_FROM_INPUT();

    // --- placeholder of the test case, fenced on both sides ---
    asm volatile("isb\n dsb SY \n");
    asm volatile(".quad " xstr(TEMPLATE_INSERT_TC) "\n");
    asm volatile("isb\n dsb SY \n");

    // --- default exception landing ---
    // the fall-through path branches over the marker to the local label 1
    asm volatile("b 1f\n"
                 ".quad " xstr(TEMPLATE_DEFAULT_EXCEPTION_LANDING) "\n"
                 "nop\n"
                 "1:nop\n");

    // --- end of the template ---
    epilogue_dbg_gpr();
    asm volatile(".quad " xstr(TEMPLATE_END));
}

#endif // _ENTRY_EXIT_H_


================================================
FILE: rvzr/executor_km/arm64/exception.S
================================================
// File: Low-level exception handling code for ARM64
//
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#include <asm/asm-bug.h>
// #include <asm/exception.h>

#include "sandbox_constants.h"
#include "registers.h"

.extern _printk
.extern set_outer_fault_handlers
.extern unset_outer_fault_handlers
.extern run_experiment
.extern orig_vector_table_ptr
.extern loaded_test_case_entry

.extern fault_handler
.extern is_nested_fault

// =================================================================================================
// Global variables
// =================================================================================================
.data

// Stack pointer saved by run_experiment_outer before it calls run_experiment;
// the recovery path reloads sp from here after a fault
recovery_sp:
.quad 0

// Message used by the `unreachable` macro
.Lunreachable_msg:
.asciz	"ERROR: rvzr_executor: unreachable code\n"
.align

// printk format string used when fallback_handler catches a fault; takes four 64-bit
// arguments (error syndrome, fault address, address of run_experiment, sp).
// NOTE(review): the leading "\001" + "3" is presumably the printk log-level prefix
// (KERN_SOH followed by level 3, i.e., KERN_ERR) - confirm against kern_levels.h
.Lunexpected_fault_msg:
.asciz	"\0013 ERROR: [fallback_handler] Unexpected fault in run_experiment: \n\
1 [Error Syndrome]:\t0x%llx\n\
2 [Fault Address]:\t0x%llx\n\
  (run_experiment start:\t0x%llx)\n\
3 [SP]:\t0x%llx\n"
.align

// printk format string used when test_case_handler takes its default path; same arguments
// as above, except that the third one is the value of loaded_test_case_entry
.Ldefault_fault_msg:
.asciz	"\0013 ERROR: [test_case_handler] Unhandled fault in the test case: \n\
1 [Error Syndrome]:\t0x%llx\n\
2 [Fault Address]:\t0x%llx\n\
  (test case start:\t0x%llx)\n\
3 [SP]:\t0x%llx\n"
.align


// =================================================================================================
// Macros
// =================================================================================================
// Marks a code location that must never execute: loads the address of .Lunreachable_msg
// into x0, copies the link register into x2 and branches to `panic`
.macro unreachable
    adr	x0, .Lunreachable_msg
    mov	x2, lr
    b panic
.endm


// =================================================================================================
// Custom vector tables
// =================================================================================================
.text

/// @brief The vector table used for catching bugs in run_experiment function
///        This table exists purely for convenience during the development process and
///        should be unreachable during normal operation
///        Layout: 16 entries of 0x80 bytes each, the table itself is aligned to 2048 bytes.
///        Every group of four entries handles, in this order, Synchronous, IRQ, FIQ and
///        SError exceptions.
.global outer_vector_table
.balign 2048
outer_vector_table:
    // Interrupts/exceptions from EL1 to EL1; using SP_EL0 as sp (EL1t)
        b fallback_handler
    .balign 0x80
        b fallback_handler
    .balign 0x80
        b fallback_handler
    .balign 0x80
        b fallback_handler
    // Interrupts/exceptions from EL1 to EL1; using SP_ELx (i.e., SP_EL1) as sp (EL1h)
    .balign 0x80
        b fallback_handler
    .balign 0x80
        b fallback_handler
    .balign 0x80
        b fallback_handler
    .balign 0x80
        b fallback_handler
    // Interrupts/exceptions from EL0 to EL1; in AArch64 mode
    .balign 0x80
        b fallback_handler
    .balign 0x80
        b fallback_handler
    .balign 0x80
        b fallback_handler
    .balign 0x80
        b fallback_handler
    // Interrupts/exceptions from EL0 to EL1; in AArch32 mode
    // (not expected to happen at all, hence `unreachable` instead of fallback_handler)
    .balign 0x80
        unreachable
    .balign 0x80
        unreachable
    .balign 0x80
        unreachable
    .balign 0x80
        unreachable

/// @brief The vector table used for redirecting exceptions in tests cases to the recovery code
///        In contrast to the outer_vector_table, this table is actively used during normal
///        operation, especially when testing for Meltdown-like vulnerabilities
///        Layout: 16 entries of 0x80 bytes each, the table itself is aligned to 2048 bytes.
///        All entries branch to test_case_handler.
.global inner_vector_table
.balign 2048
inner_vector_table:
    // Interrupts/exceptions from EL1 to EL1; using SP_EL0 as sp (EL1t)
    .balign 0x80   // Synchronous
        b test_case_handler
    .balign 0x80  // IRQ
        b test_case_handler
    .balign 0x80  // FIQ
        b test_case_handler
    .balign 0x80  // SError
        b test_case_handler
    // Interrupts/exceptions from EL1 to EL1; using SP_ELx (i.e., SP_EL1) as sp (EL1h)
    .balign 0x80  // Synchronous
        // Handle all other exceptions
        b test_case_handler
    .balign 0x80  // IRQ
        b test_case_handler
    .balign 0x80  // FIQ
        b test_case_handler
    .balign 0x80  // SError
        b test_case_handler
    // Interrupts/exceptions from EL0 to EL1; in AArch64 mode
    .balign 0x80   // Synchronous
        b test_case_handler
    .balign 0x80  // IRQ
        b test_case_handler
    .balign 0x80  // FIQ
        b test_case_handler
    .balign 0x80  // SError
        b test_case_handler
    // Interrupts/exceptions from EL0 to EL1; in AArch32 mode
    .balign 0x80   // Synchronous
        b test_case_handler
    .balign 0x80  // IRQ
        b test_case_handler
    .balign 0x80  // FIQ
        b test_case_handler
    .balign 0x80  // SError
        b test_case_handler

// =================================================================================================
// Handlers
// =================================================================================================
.text

/// @brief The default handler that terminates the tracing process
///        by directly jumping to the exit point of the run_experiment function
///        Before returning from the exception, the handler prepares the arguments of the
///        error message printed by the recovery code:
///          x1 = ESR_EL1, x2 = FAR_EL1, x3 = address of run_experiment, x4 = sp,
///          x5 = address of the format string (moved to x0 by the recovery code)
///        clobber: x0-x5, elr_el1
.global fallback_handler
fallback_handler:
    mrs x1, esr_el1
    mrs x2, far_el1  // FIXME: this doesn't work for many exception types
    adr x3, run_experiment
    mov x4, sp
    adr x5, .Lunexpected_fault_msg

    // set the return address to the recovery code
    // (eret then continues at .run_experiment_recovery instead of the faulting instruction)
    adr x0, .run_experiment_recovery
    msr elr_el1, x0
    eret


/// @brief A handler for all exceptions that occur during the test case execution
///        - first exception (is_nested_fault == 0) with a registered handler
///          (fault_handler != 0): set is_nested_fault to 1 and return from the exception
///          to the address stored in fault_handler;
///        - nested exception (is_nested_fault != 0) or no registered handler: prepare the
///          arguments of the error message (x1 = ESR_EL1, x2 = FAR_EL1,
///          x3 = loaded_test_case_entry, x4 = sp, x5 = format string) and return from the
///          exception to .run_experiment_recovery
///        clobber: TMP_REG1_, TMP_REG2_, nzcv, elr_el1; on the default path also x0-x5
.global test_case_handler
test_case_handler:
    // check for nested faults
    // (the flag is reset by set_inner_fault_handlers and raised on the first fault)
    adr TMP_REG1_, is_nested_fault
    ldr TMP_REG2_, [TMP_REG1_]
    cmp TMP_REG2_, #0
    b.ne .test_case_handler.default
    mov TMP_REG2_, #1
    str TMP_REG2_, [TMP_REG1_]

    // check if a custom handler is registered
    adr TMP_REG2_, fault_handler
    ldr TMP_REG2_, [TMP_REG2_]
    cmp TMP_REG2_, #0
    b.eq .test_case_handler.default

    // resume execution at the registered handler
    .test_case_handler.registered_handler:
    msr elr_el1, TMP_REG2_
    eret

    // report the fault and abort the experiment
    .test_case_handler.default:
    mrs x1, esr_el1
    mrs x2, far_el1  // FIXME: this doesn't work for many exception types
    adr x3, loaded_test_case_entry
    ldr x3, [x3]
    mov x4, sp
    adr x5, .Ldefault_fault_msg

    adr x0, .run_experiment_recovery
    msr elr_el1, x0
    eret


// =================================================================================================
// run_experiment_outer: Fault-tolerant wrapper for run_experiment
// =================================================================================================
.text

/// @brief A wrapper over run_experiment that ensures that any bugs that cause an
///        exception will be handled gracefully and won't crash the system
///        Flow:
///          1. push x1-x30 and remember the resulting sp in recovery_sp;
///          2. install the outer fault handlers and call run_experiment;
///          3a. normal exit: x0 is left as set by run_experiment;
///          3b. recovery (entered via eret from fallback_handler/test_case_handler):
///              reload sp from recovery_sp, print the error message prepared by the handler
///              and set x0 to 1;
///          4. restore the original vector table, pop x1-x30 and return.
/// @param void
.global run_experiment_outer
run_experiment_outer:
    // A bug in run_experiment may corrupt the CPU state, so we need to save the current state
    // before calling run_experiment
    stp x1, x2, [sp, -16]!
    stp x3, x4, [sp, -16]!
    stp x5, x6, [sp, -16]!
    stp x7, x8, [sp, -16]!
    stp x9, x10, [sp, -16]!
    stp x11, x12, [sp, -16]!
    stp x13, x14, [sp, -16]!
    stp x15, x16, [sp, -16]!
    stp x17, x18, [sp, -16]!
    stp x19, x20, [sp, -16]!
    stp x21, x22, [sp, -16]!
    stp x23, x24, [sp, -16]!
    stp x25, x26, [sp, -16]!
    stp x27, x28, [sp, -16]!
    stp x29, x30, [sp, -16]!

    // ??? no idea why this is needed ???
    mov x21, sp

    // Save the SP into a global variables so that we can recover it after a destructive bug
    mov x0, sp
    adr x1, recovery_sp
    str x0, [x1]

    // Set up a custom vector table
    bl set_outer_fault_handlers

    // Call run_experiment
    bl run_experiment
    b .run_experiment_normal_exit
.run_experiment_recovery:
    // Overwrite SP with recovery_sp
    adr TMP_REG1_, recovery_sp
    ldr TMP_REG2_, [TMP_REG1_]
    mov sp, TMP_REG2_

    // ??? no idea why this is needed ???
    mov x21, sp

    // Print an error message
    // x1 already contains the fault code from the fault handler
    // (x2-x4 hold the remaining arguments and x5 the format string, see the handlers)
    mov x0, x5
    bl _printk
    mov x0, #1

.run_experiment_normal_exit:
    // Restore the original vector table
    // (x0 holds the return value, so it is preserved across the call)
    stp x0, x1, [sp, -16]!
    bl unset_outer_fault_handlers
    ldp x0, x1, [sp], 16

    // Restore the CPU state in case run_experiment has corrupted it
    // (reverse order of the pushes at the entry)
    ldp x29, x30, [sp], 16
    ldp x27, x28, [sp], 16
    ldp x25, x26, [sp], 16
    ldp x23, x24, [sp], 16
    ldp x21, x22, [sp], 16
    ldp x19, x20, [sp], 16
    ldp x17, x18, [sp], 16
    ldp x15, x16, [sp], 16
    ldp x13, x14, [sp], 16
    ldp x11, x12, [sp], 16
    ldp x9, x10, [sp], 16
    ldp x7, x8, [sp], 16
    ldp x5, x6, [sp], 16
    ldp x3, x4, [sp], 16
    ldp x1, x2, [sp], 16

    ret


================================================
FILE: rvzr/executor_km/arm64/fault_handler.c
================================================
/// File: Fault handling and vector table management on ARM64 (i.e., aarch64)
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#include <linux/interrupt.h>

#include "code_loader.h"
#include "main.h"
#include "measurement.h"
#include "sandbox_manager.h"
#include "shortcuts.h"
#include "test_case_parser.h"

#include "fault_handler.h"

typedef uint32_t opcode_t; // opcodes in ARM64 are 32-bit

/// One entry of a vector table: 32 opcodes, i.e., 128 (0x80) bytes
typedef struct {
    opcode_t code[32];
} __attribute__((packed)) vector_table_entry_t;

/// A complete vector table: 16 entries, i.e., 2048 bytes
typedef struct {
    vector_table_entry_t vector_table[16];
} __attribute__((packed)) vector_table_t;

extern vector_table_t outer_vector_table;
extern vector_table_t inner_vector_table;

uint32_t handled_faults = 0;  // global
char *fault_handler = NULL;   // global
uint64_t is_nested_fault = 0; // shared with exception.S

vector_table_t *orig_vector_table_ptr = NULL;

// =================================================================================================
// Vector table management
// =================================================================================================
/// @brief Read the vector base address register of EL1 (VBAR_EL1)
/// @return The address currently stored in VBAR_EL1, as a pointer to a vector table
static inline vector_table_t *vbar_el1_read(void)
{
    vector_table_t *current_table;

    asm volatile("mrs %0, vbar_el1" : "=r"(current_table));
    return current_table;
}

/// @brief Write the vector base address register of EL1 (VBAR_EL1)
///        The write is followed by an ISB: a change of a system register is only guaranteed
///        to affect the following instructions after a context synchronization event.
///        The "memory" clobber keeps the compiler from moving memory accesses (e.g., the
///        reset of is_nested_fault) across the switch of the vector table.
/// @param vbar_el1 Address of the vector table to install
static inline void vbar_el1_write(vector_table_t *vbar_el1)
{
    asm volatile("msr vbar_el1, %0\n"
                 "isb\n"
                 :
                 : "r"(vbar_el1)
                 : "memory");
}

/// @brief Install outer_vector_table as the active vector table; the previously active
///        table is remembered in orig_vector_table_ptr for unset_outer_fault_handlers()
void set_outer_fault_handlers(void)
{
    // Save the original vector table
    orig_vector_table_ptr = vbar_el1_read();

    // Set VBAR to point to our custom vector table
    vbar_el1_write(&outer_vector_table);
}

/// @brief Reinstall the vector table saved by set_outer_fault_handlers()
///        NOTE: orig_vector_table_ptr is written to VBAR_EL1 without any check, so this
///        function must only be called after set_outer_fault_handlers()
void unset_outer_fault_handlers(void)
{
    // Restore the original vector table
    vbar_el1_write(orig_vector_table_ptr);
}

/// @brief Install inner_vector_table as the active vector table
///        The nested-fault flag (shared with exception.S) is cleared first, so the next
///        exception is treated as the first one
void set_inner_fault_handlers(void)
{
    is_nested_fault = 0;
    vbar_el1_write(&inner_vector_table);
}

/// @brief Switch from the inner vector table back to outer_vector_table
///        (not to the original table of the kernel)
void unset_inner_fault_handlers(void) { vbar_el1_write(&outer_vector_table); }

// =================================================================================================
/// @brief Reset the fault handling configuration: handled_faults is set to
///        HANDLED_FAULTS_DEFAULT and no custom fault handler is registered
/// @return Always 0
int init_fault_handler(void)
{
    handled_faults = HANDLED_FAULTS_DEFAULT;
    fault_handler = NULL;
    return 0;
}

/// @brief Counterpart of init_fault_handler(); currently has nothing to release
void free_fault_handler(void) {}


================================================
FILE: rvzr/executor_km/arm64/macros.c
================================================
/// File: Management of test case macros
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#include "asm_snippets.h"
#include "fault_handler.h"
#include "macro_expansion.h"
#include "main.h"
#include "sandbox_manager.h"
#include "shortcuts.h"

// =================================================================================================
// Convenience shortcuts for writing constants to memory
// =================================================================================================
// NOTE: all APPEND_* macros expect two variables in the calling scope:
//   - `dest`:   uint8_t pointer to the beginning of the output buffer
//   - `cursor`: integer offset of the next free byte in `dest`; advanced by the macro
// Every macro expands to a single statement (do { } while (0)), so it is safe to use
// as the body of an unbraced if/else, and must be followed by a semicolon.

/// Append a single byte
#define APPEND_U8_TO_DEST(value)                                                                   \
    do {                                                                                           \
        dest[cursor++] = (value);                                                                  \
    } while (0)

/// Append a 16-bit value in the host byte order
#define APPEND_U16_TO_DEST(value)                                                                  \
    do {                                                                                           \
        *((uint16_t *)(dest + cursor)) = (value);                                                  \
        cursor += 2;                                                                               \
    } while (0)

/// Append a 32-bit value in the host byte order (e.g., one A64 instruction)
#define APPEND_U32_TO_DEST(value)                                                                  \
    do {                                                                                           \
        *((uint32_t *)(dest + cursor)) = (value);                                                  \
        cursor += 4;                                                                               \
    } while (0)

/// Append a 64-bit value in the host byte order
#define APPEND_U64_TO_DEST(value)                                                                  \
    do {                                                                                           \
        *((uint64_t *)(dest + cursor)) = (value);                                                  \
        cursor += 8;                                                                               \
    } while (0)

/// Append an arbitrary list of byte constants, in the order given
#define APPEND_BYTES_TO_DEST(...)                                                                  \
    do {                                                                                           \
        static const uint8_t bytes[] = {__VA_ARGS__};                                              \
        for (size_t i = 0; i < sizeof(bytes); i++) {                                               \
            dest[cursor++] = bytes[i];                                                             \
        }                                                                                          \
    } while (0)

// =================================================================================================
// Instruction opcodes
// =================================================================================================
/// @brief Encode `movz rd, #imm16, lsl #(16 * shift)` (64-bit variant)
/// @param rd Destination register ID
/// @param imm16 16-bit immediate
/// @param shift Index of the 16-bit slot the immediate is placed in
/// @return Encoded instruction
static inline uint32_t movz(uint8_t rd, uint16_t imm16, uint8_t shift)
{
    const uint32_t base = 0xd2800000;
    const uint32_t slot_field = (uint32_t)shift << 21;          // bits 21+: slot selector
    const uint32_t imm_field = (uint32_t)(imm16 & 0xffff) << 5; // bits 5-20: immediate
    return base | slot_field | imm_field | rd;                  // bits 0-4: destination
}

/// @brief Encode `movk rd, #imm16, lsl #(16 * shift)` (64-bit variant)
/// @param rd Destination register ID
/// @param imm16 16-bit immediate
/// @param shift Index of the 16-bit slot the immediate is placed in
/// @return Encoded instruction
static inline uint32_t movk(uint8_t rd, uint16_t imm16, uint8_t shift)
{
    const uint32_t base = 0xf2800000;
    const uint32_t slot_field = (uint32_t)shift << 21;          // bits 21+: slot selector
    const uint32_t imm_field = (uint32_t)(imm16 & 0xffff) << 5; // bits 5-20: immediate
    return base | slot_field | imm_field | rd;                  // bits 0-4: destination
}

/// @brief Encode `mov sp, <reg>`
/// @param rd ID of the register whose value is copied into sp
///           (despite its name, this parameter is the source operand)
/// @return Encoded instruction
static inline uint32_t mov_to_sp(uint8_t rd)
{
    uint32_t opcode = 0x9100001f; // destination field (bits 0-4) is fixed to sp
    opcode |= rd << 5;            // bits 5-9: source register
    return opcode;
}

/// @brief Encode an unconditional PC-relative branch, `b <pc + offset>`
/// @param offset Byte distance from the branch instruction to its target, as a 32-bit
///               two's complement value (i.e., a backward branch is passed as (uint32_t)-N)
/// @return Encoded instruction
/// @note The instruction holds a 26-bit signed word offset, so only targets within
///       +-128 MiB are representable; a larger distance is silently truncated
static inline uint32_t b_imm(uint32_t offset)
{
    // The immediate counts 4-byte instructions (words), not bytes.
    // Dropping the two low bits and keeping the low 26 bits of the two's complement value
    // yields the correct imm26 for both forward and backward branches; no explicit
    // sign handling is needed (and none is possible on an unsigned argument).
    const uint32_t imm26 = (offset >> 2) & 0x3FFFFFF;

    return 0x14000000 | imm26;
}

/// @brief mov rd, rn
/// @param rd Destination register ID
/// @param rn Source register ID
/// @return Encoded instruction
static inline uint32_t mov_reg(uint8_t rd, uint8_t rn)
{
    // `mov rd, rn` is an alias of `orr rd, xzr, rn`: the base opcode already has xzr (0x1f)
    // in bits 5-9, and the register being copied is the second operand in bits 16-20.
    // ORing the source into bits 5-9 would be a no-op and always produce `mov rd, x0`.
    uint32_t opcode = 0xaa0003e0;
    opcode |= rd;                // set destination register
    opcode |= (rn & 0x1f) << 16; // set source register
    return opcode;
}

/// @brief add rd, rn, rm
/// @param rd Destination register ID
/// @param rn First source register ID
/// @param rm Second source register ID
/// @return Encoded instruction
static inline uint32_t add_reg(uint8_t rd, uint8_t rn, uint8_t rm)
{
    const uint32_t base = 0x8b000000;
    const uint32_t rm_field = (uint32_t)(rm & 0x1f) << 16; // bits 16-20
    const uint32_t rn_field = (uint32_t)(rn & 0x1f) << 5;  // bits 5-9
    return base | rm_field | rn_field | rd;                // rd occupies bits 0-4
}

/// @brief str rt, [rn]
/// @param rt ID of the register holding the value to store
/// @param rn ID of the register holding the address
/// @return Encoded instruction
static inline uint32_t str_reg(uint8_t rt, uint8_t rn)
{
    const uint32_t base = 0xf9000000;
    const uint32_t rn_field = (uint32_t)(rn & 0x1f) << 5; // bits 5-9: base register
    return base | rn_field | rt;                          // bits 0-4: stored register
}

/// @brief ldr rt, [rn]
/// @param rt ID of the register receiving the loaded value
/// @param rn ID of the register holding the address
/// @return Encoded instruction
static inline uint32_t ldr_reg(uint8_t rt, uint8_t rn)
{
    const uint32_t base = 0xf9400000;
    const uint32_t rn_field = (uint32_t)(rn & 0x1f) << 5; // bits 5-9: base register
    return base | rn_field | rt;                          // bits 0-4: loaded register
}

// =================================================================================================
// Helper functions
// =================================================================================================
/// @brief Insert a sequence of instructions into dest that moves a 64-bit immediate value
///        into a register
/// @param rd Destination register (0-31)
/// @param value 64-bit immediate value
/// @param dest Pointer to the destination of the code sequence
/// @param cursor Current position in the destination buffer
/// @return Number of bytes written to the destination buffer (always four instructions)
static inline uint64_t mov_uint64_to_reg(uint8_t rd, uint64_t value, uint8_t *dest, uint64_t cursor)
{
    // Keep the starting position in the same 64-bit type as the cursor;
    // storing it in an int would truncate large cursors and corrupt the returned size
    const uint64_t start = cursor;

    // The value is loaded in four 16-bit slots: movz writes the lowest slot (and zeroes
    // the rest of the register), then movk patches each of the remaining three slots
    for (uint8_t slot = 0; slot < 4; slot++) {
        const uint16_t chunk = (value >> (16 * slot)) & 0xffff;
        const uint32_t opcode = (slot == 0) ? movz(rd, chunk, slot) : movk(rd, chunk, slot);
        APPEND_U32_TO_DEST(opcode);
    }

    return cursor - start;
}

/// @brief Compute the virtual address of a test case function
/// @param section_id ID of the code section containing the function
/// @param function_id Index of the function in the test case symbol table
/// @return Virtual address of the function
static uint64_t get_function_addr(int section_id, int function_id)
{
    const uint64_t section_start = (uint64_t)sandbox->code[section_id].section;

    // Only the main actor's section (ID 0) starts with a hardcoded prologue;
    // symbol offsets are relative to the code that follows it
    const uint64_t prologue_size = (section_id == 0) ? get_main_prologue_size() : 0;

    return section_start + prologue_size + test_case->symbol_table[function_id].offset;
}

/// @brief Insert a sequence of instructions into dest that updates memory base register
///        to point to the base address of the memory owned by actor with `section_id`
/// @param section_id ID of the section
/// @param dest Pointer to the destination of the code sequence
/// @param cursor Current position in the destination buffer
/// @return Number of bytes written to the destination buffer
static uint64_t update_memory_base_reg(int section_id, uint8_t *dest, uint64_t cursor)
{
    // The new register value is the address of the actor's main data area
    const uint64_t new_val = (uint64_t)sandbox->data[section_id].main_area;

    // This function emits exactly one immediate load, so its size is the size of that load.
    // (Returning it directly avoids keeping the start position in a narrower int.)
    return mov_uint64_to_reg(MEMORY_BASE_REGISTER_ID, new_val, dest, cursor);
}

/// @brief Insert a sequence of instructions into dest that updates memory base register
///        and sp to match the actor owning section_id
/// @param section_id ID of the section
/// @param dest Pointer to the destination of the code sequence
/// @param cursor Current position in the destination buffer
/// @return Number of bytes written to the destination buffer
/// @note The generated code overwrites TMP_REG1
static uint64_t update_mem_base_and_sp(int section_id, uint8_t *dest, uint64_t cursor)
{
    // Same 64-bit type as the cursor; an int would truncate large cursors
    const uint64_t start = cursor;

    cursor += update_memory_base_reg(section_id, dest, cursor);

    // sp cannot be the target of a movz/movk sequence, so the new value is
    // first materialized in a temporary register
    const uint64_t new_sp = (uint64_t)sandbox->data[section_id].main_area + LOCAL_RSP_OFFSET;
    cursor += mov_uint64_to_reg(TMP_REG1_ID, new_sp, dest, cursor);

    // ASM: mov sp, TMP_REG1
    const uint32_t opcode = mov_to_sp(TMP_REG1_ID);
    APPEND_U32_TO_DEST(opcode);

    return cursor - start;
}

/// @brief Insert a sequence of instructions into dest that updates x21 (util base register)
///        to point to the base address of the util region
/// @param section_id ID of the section (currently unused: the util region is
///        taken from sandbox->util regardless of the section)
/// @param dest Pointer to the destination of the code sequence
/// @param cursor Current position in the destination buffer
/// @return Number of bytes written to the destination buffer
static uint64_t update_util_base_reg(int section_id, uint8_t *dest, uint64_t cursor)
{
    const uint64_t new_val = (uint64_t)sandbox->util;

    // This function emits exactly one immediate load, so its size is the size of that load.
    // (Returning it directly avoids keeping the start position in a narrower int.)
    return mov_uint64_to_reg(UTIL_BASE_REGISTER_ID, new_val, dest, cursor);
}

// =================================================================================================
// Macro implementations
//
// Note: A macro consists of two parts: it starts with the dynamically-generated part,
// and the main body is static.
// The dynamic part is generated by the start_macro* functions, and the generated code
// can be configured according to the macro arguments.
// The body_macro* functions are not configurable, and are copied directly into the test case
// macro memory.
// =================================================================================================

// MEASUREMENT_START and MEASUREMENT_END -----------------------------------------------------------
// Prime+Probe variants
/// @brief Static body of the PRIME macro (also registered for TYPE_EVICT in macro_descriptors).
///        The code between the MACRO_START and MACRO_END markers saves the flags, primes the
///        area at UTIL_BASE_REGISTER + L1D_PRIMING_OFFSET, and restores the flags.
/// NOTE(review): the last PRIME argument ("8") is presumably a repetition count; confirm
///               against asm_snippets.h
static void __attribute__((noipa)) body_macro_prime(void)
{
    asm volatile(".quad " xstr(MACRO_START));
    asm volatile(""                                                               //
                 "mrs " TMP_REG6 ", nzcv \n"                                      // save flags
                 "mov " TMP_REG1 ", " UTIL_BASE_REGISTER "\n"                     //
                 "add " TMP_REG1 ", " TMP_REG1 ", " xstr(L1D_PRIMING_OFFSET) "\n" // priming area
                 PRIME(TMP_REG1, TMP_REG2, TMP_REG3, TMP_REG4, TMP_REG5, "8")     //
                 READ_PFC_START()                                                 //
                 SET_SR_STARTED()                                                 //
                 "msr nzcv, " TMP_REG6 "\n"                                       // restore flags
                 SPEC_FENCE()                                                     //
    );
    asm volatile(".quad " xstr(MACRO_END));
}

/// @brief Static body of the FAST_PRIME macro. Identical to body_macro_prime() except that
///        the last PRIME argument is "1" instead of "8".
/// NOTE(review): that argument is presumably a repetition count; confirm against asm_snippets.h
static void __attribute__((noipa)) body_macro_fast_prime(void)
{
    asm volatile(".quad " xstr(MACRO_START));
    asm volatile(""                                                               //
                 "mrs " TMP_REG6 ", nzcv \n"                                      // save flags
                 "mov " TMP_REG1 ", " UTIL_BASE_REGISTER "\n"                     //
                 "add " TMP_REG1 ", " TMP_REG1 ", " xstr(L1D_PRIMING_OFFSET) "\n" // priming area
                 PRIME(TMP_REG1, TMP_REG2, TMP_REG3, TMP_REG4, TMP_REG5, "1")     //
                 READ_PFC_START()                                                 //
                 SET_SR_STARTED()                                                 //
                 "msr nzcv, " TMP_REG6 "\n"                                       // restore flags
                 SPEC_FENCE()                                                     //
    );
    asm volatile(".quad " xstr(MACRO_END));
}

/// @brief Static body of the PROBE macro (also used as the body of TYPE_FAULT_AND_PROBE).
///        Probes the area at UTIL_BASE_REGISTER + L1D_PRIMING_OFFSET into HTRACE_REGISTER,
///        unless the status already indicates that the measurement has ended.
static void __attribute__((noipa)) body_macro_probe(void)
{
    // pseudocode:
    // tmp_reg6 = NZCV  // ensure that the macro doesn't corrupt flags
    // if (status != STATUS_ENDED)  // ensure that macro is executed only once
    //    read_pfc_end()
    //    htrace_register = probe(sandbox->util.l1d_priming_area)
    //    status = STATUS_ENDED
    // NZCV = tmp_reg6

    asm volatile(".quad " xstr(MACRO_START));
    asm volatile(""                                                                       //
                 "mrs " TMP_REG6 ", nzcv \n"                                              //
                 TEST_SR_ENDED()                                                          //
                 "b.eq 99f\n"                                                             // skip
                 READ_PFC_END()                                                           //
                 "mov " TMP_REG1 ", " UTIL_BASE_REGISTER "\n"                             //
                 "add " TMP_REG1 ", " TMP_REG1 ", " xstr(L1D_PRIMING_OFFSET) "\n"         //
                 PROBE(TMP_REG1, TMP_REG2, TMP_REG3, TMP_REG4, TMP_REG5, HTRACE_REGISTER) //
                 SET_SR_ENDED()                                                           //
                 "99:\n"                                                                  //
                 "msr nzcv, " TMP_REG6 "\n"                                               //
                 SPEC_FENCE()                                                             //
    );
    asm volatile(".quad " xstr(MACRO_END));
}

// Flush + Reload and variants
/// @brief Static body of the FLUSH macro. The code between the MACRO_START and MACRO_END
///        markers saves the flags, applies FLUSH starting at MEMORY_BASE_REGISTER, and
///        restores the flags.
static void __attribute__((noipa)) body_macro_flush(void)
{
    asm volatile(".quad " xstr(MACRO_START));
    asm volatile(""                                             //
                 "mrs " TMP_REG6 ", nzcv \n"                    // save flags
                 "mov " TMP_REG1 ", " MEMORY_BASE_REGISTER "\n" //
                 FLUSH(TMP_REG1, TMP_REG2, TMP_REG3)            //
                 READ_PFC_START()                               //
                 SET_SR_STARTED()                               //
                 "msr nzcv, " TMP_REG6 "\n"                     // restore flags
                 SPEC_FENCE()                                   //
    );
    asm volatile(".quad " xstr(MACRO_END));
}

/// @brief Static body of the RELOAD macro (also used as the body of TYPE_FAULT_AND_RELOAD).
///        Applies RELOAD starting at MEMORY_BASE_REGISTER and collects the result in
///        HTRACE_REGISTER, unless the status already indicates that the measurement has ended.
static void __attribute__((noipa)) body_macro_reload(void)
{
    // pseudocode:
    // tmp_reg6 = NZCV  // ensure that the macro doesn't corrupt flags
    // if (status != STATUS_ENDED)  // ensure that macro is executed only once
    //    read_pfc_end()
    //    htrace_register = reload(sandbox->main)
    //    status = STATUS_ENDED
    // NZCV = tmp_reg6

    asm volatile(".quad " xstr(MACRO_START));
    asm volatile(""                                                              //
                 "mrs " TMP_REG6 ", nzcv \n"                                     //
                 TEST_SR_ENDED()                                                 //
                 "b.eq 99f\n"                                                    // skip
                 READ_PFC_END()                                                  //
                 "mov " TMP_REG1 ", " MEMORY_BASE_REGISTER "\n"                  //
                 RELOAD(TMP_REG1, TMP_REG2, TMP_REG3, TMP_REG4, HTRACE_REGISTER) //
                 SET_SR_ENDED()                                                  //
                 "99:\n"                                                         //
                 "msr nzcv, " TMP_REG6 "\n"                                      //
                 SPEC_FENCE()                                                    //
    );
    asm volatile(".quad " xstr(MACRO_END));
}

// FAULT_HANDLER -------------------------------------------------------------------------------
/// @brief Generate the configurable prefix of the FAULT_HANDLER macro family and record
///        its location in the global `fault_handler`
/// @param args Macro arguments; the macro must be owned by the main actor (owner == 0)
/// @param dest Pointer to the destination of the code sequence
/// @return Number of bytes written to the destination buffer
static inline size_t start_macro_fault_handler(macro_args_t args, uint8_t *dest)
{
    // Only the main actor may own the fault handler
    ASSERT(args.owner == 0, "inject_macro_configurable_part");

    // The handler begins at the very first byte generated here
    fault_handler = (char *)dest;

    // A fault may arrive while another actor is running, so re-establish the main
    // actor's sp, memory base, and util base before the rest of the handler executes
    size_t written = update_mem_base_and_sp(0, dest, 0);
    written += update_util_base_reg(0, dest, written);

    return written;
}

// MACRO_SWITCH ------------------------------------------------------------------------------------
/// @brief Generate the code of the SWITCH macro: re-point the memory base register and sp
///        at the target actor's data area, then branch to the target function
/// @param args Macro arguments; arg1 is the target section ID, arg2 the target function ID
/// @param dest Pointer to the destination of the code sequence
/// @return Number of bytes written to the destination buffer
static inline size_t start_macro_switch(macro_args_t args, uint8_t *dest)
{
    // Update the memory base register and sp to addresses within the new actor's memory
    size_t cursor = update_mem_base_and_sp(args.arg1, dest, 0);

    // The branch is PC-relative, so the offset is measured from the slot
    // where the branch instruction itself is about to be written
    const uint64_t branch_addr = (uint64_t)dest + cursor;
    const uint32_t relative_offset = get_function_addr(args.arg1, args.arg2) - branch_addr;

    // Jump to the target address (in a different actor)
    APPEND_U32_TO_DEST(b_imm(relative_offset));

    return cursor;
}

// =================================================================================================
// Macro descriptors
// =================================================================================================
// Table of macro implementations, indexed by macro type.
//   .start - generator of the dynamic (argument-dependent) part of the macro, or NULL
//   .body  - function holding the static part of the macro, or NULL
// Entries with both fields NULL have no ARM64 implementation in this file.
// Note that TYPE_EVICT reuses the PRIME body.
macro_descr_t macro_descriptors[] = {
    [TYPE_UNDEFINED] = {.start = NULL, .body = NULL},
    [TYPE_PRIME] = {.start = NULL, .body = body_macro_prime},
    [TYPE_FAST_PRIME] = {.start = NULL, .body = body_macro_fast_prime},
    [TYPE_PARTIAL_PRIME] = {.start = NULL, .body = NULL},
    [TYPE_FAST_PARTIAL_PRIME] = {.start = NULL, .body = NULL},
    [TYPE_PROBE] = {.start = NULL, .body = body_macro_probe},
    [TYPE_FLUSH] = {.start = NULL, .body = body_macro_flush},
    [TYPE_EVICT] = {.start = NULL, .body = body_macro_prime},
    [TYPE_RELOAD] = {.start = NULL, .body = body_macro_reload},
    [TYPE_TSC_START] = {.start = NULL, .body = NULL},
    [TYPE_TSC_END] = {.start = NULL, .body = NULL},
    [TYPE_FAULT_HANDLER] = {.start = start_macro_fault_handler, .body = NULL},
    [TYPE_FAULT_AND_PROBE] = {.start = start_macro_fault_handler, .body = body_macro_probe},
    [TYPE_FAULT_AND_RELOAD] = {.start = start_macro_fault_handler, .body = body_macro_reload},
    [TYPE_FAULT_AND_TSC_END] = {.start = NULL, .body = NULL},
    [TYPE_SWITCH] = {.start = start_macro_switch, .body = NULL},
    [TYPE_SET_K2U_TARGET] = {.start = NULL, .body = NULL},
    [TYPE_SWITCH_K2U] = {.start = NULL, .body = NULL},
    [TYPE_SET_U2K_TARGET] = {.start = NULL, .body = NULL},
    [TYPE_SWITCH_U2K] = {.start = NULL, .body = NULL},
    [TYPE_SET_H2G_TARGET] = {.start = NULL, .body = NULL},
    [TYPE_SWITCH_H2G] = {.start = NULL, .body = NULL},
    [TYPE_SET_G2H_TARGET] = {.start = NULL, .body = NULL},
    [TYPE_SWITCH_G2H] = {.start = NULL, .body = NULL},
    [TYPE_LANDING_K2U] = {.start = NULL, .body = NULL},
    [TYPE_LANDING_U2K] = {.start = NULL, .body = NULL},
    [TYPE_LANDING_H2G] = {.start = NULL, .body = NULL},
    [TYPE_LANDING_G2H] = {.start = NULL, .body = NULL},
    [TYPE_SET_DATA_PERMISSIONS] = {.start = NULL, .body = NULL},
};


================================================
FILE: rvzr/executor_km/arm64/page_tables_guest.c
================================================
/// File:
///  - Guest page table management
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

// #include <asm/io.h>
// #include <asm/msr.h>

#include "page_tables_guest.h"
#include "actor.h"
#include "main.h"
#include "sandbox_manager.h"
#include "shortcuts.h"
#include "page_tables_guest.h"

// eptp_t *ept_ptr = NULL; // global

// =================================================================================================
// Page table management interface
// =================================================================================================

/// @brief Not implemented on ARM64; invokes UNIMPLEMENTED and returns `err`
/// NOTE(review): whether UNIMPLEMENTED modifies `err` or returns early is not visible here;
///               check its definition
/// @param void
/// @return Value of `err` (initialized to 0)
int map_sandbox_to_guest_memory(void)
{
    int err = 0;
    UNIMPLEMENTED("map_sandbox_to_guest_memory");
    return err;
}

/// @brief Set permissions on the faulty page based on the actor's metadata (for each actor).
///        Currently a no-op in the ARM64 build.
/// @param void
void set_faulty_page_guest_permissions(void)
{
    // nothing to do
}

/// @brief Counterpart of set_faulty_page_guest_permissions().
///        Currently a no-op in the ARM64 build.
/// @param void
void restore_faulty_page_guest_permissions(void)
{
    // nothing to do
}

/// @brief Set EPT permissions on the faulty page based on the actor's metadata (for each actor).
///        Currently a no-op in the ARM64 build.
/// @param void
void set_faulty_page_ept_permissions(void)
{
    // nothing to do
}

/// @brief Counterpart of set_faulty_page_ept_permissions().
///        Currently a no-op in the ARM64 build.
/// @param void
void restore_faulty_page_ept_permissions(void)
{
    // nothing to do
}

// =================================================================================================
// Debugging Interfaces
// =================================================================================================

/// @brief Dump the guest page tables for a given actor.
///        Currently a stub in the ARM64 build: nothing is dumped.
/// @param actor_id ID of the actor (ignored)
/// @return Always 0
int dbg_dump_guest_page_tables(int actor_id)
{
    const int status = 0;
    return status;
}

/// @brief Dump the EPT for a given actor.
///        Currently a stub in the ARM64 build: nothing is dumped.
/// @param actor_id ID of the actor (ignored)
/// @return Always 0
int dbg_dump_ept(int actor_id)
{
    const int status = 0;
    return status;
}

// =================================================================================================
/// @brief Allocate guest page tables.
///        Currently a stub in the ARM64 build: nothing is allocated.
/// @param void
/// @return Always 0
int allocate_guest_page_tables(void)
{
    const int status = 0;
    return status;
}

/// @brief Counterpart of allocate_guest_page_tables(); intentionally empty because
///        allocate_guest_page_tables() does not allocate anything
void free_guest_page_tables(void) {}


================================================
FILE: rvzr/executor_km/arm64/perf_counters.c
================================================
/// File: Configuration and use of performance counters
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#include <linux/kernel.h>
#include <linux/types.h>

#include "main.h"
#include "shortcuts.h"

#include "perf_counters.h"
#include "shortcuts.h"

#define REQUIRED_N_COUNTERS 3

// =================================================================================================
// Constants and event IDs

// Performance Monitor Events
// (event IDs written into the event type registers by configure_events)
#define EVENT_L1D_CACHE_REFILL 0x03
#define EVENT_INST_RETIRED     0x08
#define EVENT_INST_SPEC        0x1b

// Perf counter controls
// PMCR_* are bits of PMCR_EL0; PMCR_N_COUNTER_START/MASK select the field that
// enable_all_counters compares against REQUIRED_N_COUNTERS
#define PMCR_ENABLE           BIT_(0)
#define PMCR_EVENT_CNTR_RESET BIT_(1)
#define PMCR_CYCLE_CNTR_RESET BIT_(2)
#define PMCR_DP               BIT_(5)
#define PMCR_N_COUNTER_START  11
#define PMCR_N_COUNTER_MASK   0b11111
// MDCR_* are bits of MDCR_EL2 (see pmu_enable_el2)
#define MDCR_HPME             BIT_(7)
#define MDCR_HPMD             BIT_(17)
// PMCNTENSET_* are bits of PMCNTENSET_EL0: event counters 0-2 and the cycle counter
#define PMCNTENSET_P0         BIT_(0)
#define PMCNTENSET_P1         BIT_(1)
#define PMCNTENSET_P2         BIT_(2)
#define PMCNTENSET_C          BIT_(31)
// Filter bit written to PMCCFILTR_EL0 and to the event type registers
#define PMCCFILTR_NSH         BIT_(27)
// PMSELR_EL0 value that selects the cycle counter
#define PMSELR_CYCLE_CNTR     0x1f

// =================================================================================================
// Private module-level functions
// =================================================================================================

/// @brief Get the current exception level (EL)
/// @param void
/// @return Exception level, extracted from bits [3:2] of CurrentEL
static inline int get_current_exception_level(void)
{
    int current_el = 0;
    read_msr("CurrentEL", current_el);

    // The level is stored in bits [3:2]; drop the two low bits and keep two
    return (current_el >> 2) & 0b11;
}

/// @brief Enable the Performance Monitoring Unit in EL2
///        by setting MDCR_EL2.HPME and clearing MDCR_EL2.HPMD
/// @param void
/// @return Always 0
static inline int pmu_enable_el2(void)
{
    uint64_t mdcr_el2 = 0;
    read_msr("MDCR_EL2", mdcr_el2);

    mdcr_el2 |= MDCR_HPME;    // MDCR_EL2.HPME = 1
    mdcr_el2 &= (~MDCR_HPMD); // MDCR_EL2.HPMD = 0

    write_msr("MDCR_EL2", mdcr_el2);
    return 0;
}

/// @brief Enable the Performance Monitoring Unit
///        by setting PMCR_EL0.E and clearing PMCR_EL0.DP
/// @param void
/// @return Always 0
static inline int pmu_enable(void)
{
    uint64_t control = 0;
    read_msr("PMCR_EL0", control);

    control |= PMCR_ENABLE; // turn the counters on
    control &= (~PMCR_DP);  // clear the DP bit

    write_msr("PMCR_EL0", control);
    return 0;
}

/// @brief Reset the Performance Monitoring Unit
///        by setting the event-counter and cycle-counter reset bits of PMCR_EL0
/// @param void
/// @return Always 0
static inline int pmu_reset(void)
{
    uint64_t control = 0;
    read_msr("PMCR_EL0", control);

    // Request a reset of both the event counters and the cycle counter
    control |= PMCR_EVENT_CNTR_RESET | PMCR_CYCLE_CNTR_RESET;

    write_msr("PMCR_EL0", control);
    return 0;
}

/// @brief Enable event counters 0-2 and the cycle counter
/// @param void
/// @return 0 on success; the behavior on a failed check is determined by ASSERT
static inline int enable_all_counters(void)
{
    // The hardware must implement at least as many event counters as we use
    uint64_t pmcr = 0;
    read_msr("PMCR_EL0", pmcr);
    uint64_t pmcr_n = (pmcr >> PMCR_N_COUNTER_START) & PMCR_N_COUNTER_MASK;
    ASSERT(pmcr_n >= REQUIRED_N_COUNTERS, "pmu_enable");

    // Build the enable mask: the cycle counter plus the three event counters
    uint64_t counter_mask = PMCNTENSET_C;
    counter_mask |= PMCNTENSET_P0 | PMCNTENSET_P1 | PMCNTENSET_P2;
    write_msr("PMCNTENSET_EL0", counter_mask);

    return 0;
}

/// @brief Disable all PMU filtering
///        by writing PMCCFILTR_EL0 with only the NSH bit set
/// @param void
/// @return Always 0
static inline int disable_filtering(void)
{
    write_msr("PMCCFILTR_EL0", PMCCFILTR_NSH);
    return 0;
}

/// @brief Set perf events to the expected values
/// Currently, the events are hardcoded to:
///   - cycle counter: no event; only the NSH filter bit is set
///   - counter 0: L1D_CACHE_REFILL (with the NSH filter bit)
///   - counter 1: INST_SPEC
///   - counter 2: INST_RETIRED
/// NOTE(review): an earlier version of this comment listed counters 1 and 2 in the opposite
///               order, and only counter 0 carries PMCCFILTR_NSH; confirm that both are intended
/// @param void
/// @return Always 0
static inline int configure_events(void)
{
    // Each counter is configured indirectly: PMSELR_EL0 selects the counter,
    // and the following write to PMXEVTYPER_EL0 sets its event type

    // Configure the cycle counter
    write_msr("PMSELR_EL0", PMSELR_CYCLE_CNTR);
    write_msr("PMXEVTYPER_EL0", PMCCFILTR_NSH);

    // Configure event counters
    write_msr("PMSELR_EL0", 0);
    write_msr("PMXEVTYPER_EL0", (PMCCFILTR_NSH | EVENT_L1D_CACHE_REFILL));

    write_msr("PMSELR_EL0", 1);
    write_msr("PMXEVTYPER_EL0", EVENT_INST_SPEC);

    write_msr("PMSELR_EL0", 2);
    write_msr("PMXEVTYPER_EL0", EVENT_INST_RETIRED);

    return 0;
}

// =================================================================================================
// Public interface
// =================================================================================================
/// @brief Configure and start the performance counters.
///        The whole sequence is compiled out when VBUILD is defined, in which case
///        the function only returns 0.
/// @param void
/// @return 0 on success; on failure, the value propagated by CHECK_ERR
/// NOTE(review): all helpers called here currently return 0 unconditionally, so the
///               CHECK_ERR calls can only trigger if that changes
int pfc_configure(void)
{
    // NOTE: the below implementation is based on the instructions from
    // "Arm Architecture Reference Manual for A-profile architecture"
    // Section "D13.1 About the Performance Monitors"

    int err = 0;

#ifndef VMBUILD
    // MDCR_EL2 is only touched when running at EL2 or above
    if (get_current_exception_level() >= 2) {
        err = pmu_enable_el2();
        CHECK_ERR("pmu_enable_el2");
    }

    err = configure_events();
    CHECK_ERR("configure_events");

    err = pmu_reset();
    CHECK_ERR("pmu_reset");

    err = disable_filtering();
    CHECK_ERR("disable_filtering");

    err = enable_all_counters();
    CHECK_ERR("enable_all_counters");

    // The global enable bit is set last, after everything else is configured
    err = pmu_enable();
    CHECK_ERR("pmu_enable");

#endif // VMBUILD

    return err;
}

// =================================================================================================
/// @brief Initialize the performance counter module; there is no state to set up
/// @param void
/// @return Always 0
int init_perf_counters(void)
{
    const int status = 0;
    return status;
}
/// @brief Counterpart of init_perf_counters(); intentionally empty because
///        init_perf_counters() does not allocate anything
void free_perf_counters(void) {}


================================================
FILE: rvzr/executor_km/arm64/registers.h
================================================
/// File: Symbolic names for pre-allocated registers; ARM64 version
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#ifndef _ARM64_REGISTERS_H_
#define _ARM64_REGISTERS_H_

/// Reserved registers
/// Naming convention used below:
///   NAME     - register name as a string literal, for pasting into inline assembly strings
///   NAME_    - the same register as a bare token
///   NAME_ID  - the register number (e.g., 0x14 == 20 for x20), for code that
///              builds instruction encodings by hand
#define STATUS_REGISTER         "x12"
#define STATUS_REGISTER_32      "w12"

#define HTRACE_REGISTER         "x13"

#define MEMORY_BASE_REGISTER    "x20"
#define MEMORY_BASE_REGISTER_ID 0x14

#define UTIL_BASE_REGISTER      "x21"
#define UTIL_BASE_REGISTER_     x21
#define UTIL_BASE_REGISTER_ID   0x15

#define TMP_REG1                "x28"
#define TMP_REG1_               x28
#define TMP_REG1_ID             0x1c

#define TMP_REG2                "x27"
#define TMP_REG2_               x27
#define TMP_REG2_ID             0x1b

#define TMP_REG3                "x26"
#define TMP_REG3_               x26

#define TMP_REG4                "x25"
#define TMP_REG4_               x25

#define TMP_REG5                "x24"
#define TMP_REG5_               x24

#define TMP_REG6                "x23"
#define TMP_REG6_               x23

// NOTE: x16 is used internally by some of the code in asm_snippets.h; avoid using it

/// Performance counter registers
/// (note the descending order: PFC0 is x10, PFC1 is x9, PFC2 is x8)
#define PFC0 "x10"
#define PFC1 "x9"
#define PFC2 "x8"

#endif // _ARM64_REGISTERS_H_


================================================
FILE: rvzr/executor_km/arm64/special_registers.c
================================================
/// File:
///  - Management of model-specific registers (MSRs)
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#include "special_registers.h"
#include "fault_handler.h"
#include "main.h"
#include "shortcuts.h"
#include "test_case_parser.h"

special_registers_t *orig_special_registers_state = NULL; // global

/// @brief Prepare the buffer for the original special register values.
///        At the moment no register is actually read (the reads below are commented out);
///        the buffer is only zeroed.
/// @param void
/// @return 0 on success; the behavior on an unallocated buffer is determined by ASSERT
static int store_special_registers(void)
{
    // The buffer is allocated by init_special_register_manager()
    ASSERT(orig_special_registers_state != NULL, "store_special_registers");
    memset(orig_special_registers_state, 0, sizeof(special_registers_t));

    // read_msr("SPSR_EL1", orig_special_registers_state->spsr_el1);
    // read_msr("SP_EL0", orig_special_registers_state->sp_el0);
    // read_msr("SP_EL1", orig_special_registers_state->sp_el1);
    // read_msr("ELR_EL1", orig_special_registers_state->elr_el1);
    return 0;
}

/// @brief Save the original special register state via store_special_registers().
///        No register is modified here.
/// @param void
/// @return 0 on success; on failure, the value propagated by CHECK_ERR
int set_special_registers(void)
{
    int err = store_special_registers();
    CHECK_ERR("set_special_registers");
    return err;
}

/// @brief Restore the special registers saved by set_special_registers().
///        At the moment no register is actually written back (the writes below are
///        commented out); the saved state is only cleared.
/// @param void
void restore_special_registers(void)
{
    // The buffer does not exist before init_special_register_manager() or after
    // free_special_register_manager(); there is nothing to restore or clear in that case
    if (orig_special_registers_state == NULL)
        return;

    // if (orig_special_registers_state->spsr_el1 != 0) {
    //     write_msr("SPSR_EL1", orig_special_registers_state->spsr_el1);
    // }
    // if (orig_special_registers_state->sp_el0 != 0) {
    //     write_msr("SP_EL0", orig_special_registers_state->sp_el0);
    // }
    // if (orig_special_registers_state->sp_el1 != 0) {
    //     write_msr("SP_EL1", orig_special_registers_state->sp_el1);
    // }
    // if (orig_special_registers_state->elr_el1 != 0) {
    //     write_msr("ELR_EL1", orig_special_registers_state->elr_el1);
    // }
    memset(orig_special_registers_state, 0, sizeof(special_registers_t));
}

// =================================================================================================
/// @brief Allocate the buffer that holds the original special register state
/// NOTE(review): CHECKED_ZALLOC presumably zero-initializes the buffer and handles the
///               allocation failure itself; confirm against its definition
/// @param void
/// @return 0 on success
int init_special_register_manager(void)
{
    orig_special_registers_state = CHECKED_ZALLOC(sizeof(special_registers_t));
    return 0;
}

/// @brief Release the buffer allocated by init_special_register_manager()
/// @param void
void free_special_register_manager(void)
{
    SAFE_FREE(orig_special_registers_state);
}


================================================
FILE: rvzr/executor_km/code_loader.c
================================================
/// File: Code loader; copies the test case sections into the sandbox code area
///      and expands their macros
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#include "code_loader.h"
#include "macro_expansion.h"
#include "main.h"
#include "sandbox_manager.h"
#include "shortcuts.h"

#include "fault_handler.h"

#ifdef ARCH_X86_64
#include "x86/entry_exit_points.h"
#elif defined(ARCH_ARM)
#include "arm64/entry_exit_points.h"
#endif

// =================================================================================================
// Local constants and declarations
// =================================================================================================

// Sum of the per-section size limits for the expanded code and for the expanded macros
#define PER_SECTION_ALLOC_SIZE (MAX_EXPANDED_SECTION_SIZE + MAX_EXPANDED_MACROS_SIZE)
// Upper bound on how far the loader scans a template for a marker before asserting
#define MAX_TEMPLATE_SIZE      0x1000 // for sanity checking

// Reset to NULL at the start of load_section_main()
uint8_t *loaded_test_case_entry = NULL; // global

static int load_section_main(void);
static int load_section(uint64_t section_id);
static tc_symbol_entry_t *get_section_macros_start(uint64_t section_id);
static int expand_section(uint64_t section_id, uint8_t *dest, uint8_t *macros_dest,
                          size_t *size_section, size_t *size_macros);

// =================================================================================================
// Code Loader logic
// =================================================================================================
/// @brief Load the code of all actors into the sandbox code area
/// @param void
/// @return 0 on success; otherwise the bitwise OR of the error codes of the failed sections
int load_sandbox_code(void)
{
    int status = 0;
    ASSERT(sandbox->code != NULL, "load_sandbox_code");

    // Start from a clean code area (filled with NOPs)
    reset_code_area();

    // Section 0 belongs to the main actor and gets the template treatment;
    // all other sections are loaded as-is. Errors are accumulated, not short-circuited.
    for (int id = 0; id < n_actors; id++)
        status |= (id == 0) ? load_section_main() : load_section(id);

    return status;
}

/// @brief Load a non-main section: expand its code and macros directly into the
///        section's code and macro areas of the sandbox
/// @param section_id ID of the section to load
/// @return 0 on success; on failure, the value propagated by CHECK_ERR
static int load_section(uint64_t section_id)
{
    // The resulting sizes are required by expand_section() but not needed here
    size_t size_section = 0;
    size_t size_macros = 0;

    int err = expand_section(section_id, sandbox->code[section_id].section,
                             sandbox->code[section_id].macros, &size_section, &size_macros);
    CHECK_ERR("load_section");

    return 0;
}

/// @brief Build the code of the main section (section 0) by instantiating the main segment
///        template around the test case code
///
/// The template is scanned byte by byte; at every position the next 8 bytes are compared with a
/// marker value (TEMPLATE_START, TEMPLATE_INSERT_TC, TEMPLATE_DEFAULT_EXCEPTION_LANDING,
/// TEMPLATE_END, in this order). The bytes between the markers are copied into the section
/// buffer of sandbox->code[0]; the markers themselves are replaced with, respectively, nothing,
/// the expanded test case, and the default fault handler macro.
///
/// Side effects: resets and (optionally) sets the global `fault_handler`, sets
/// `loaded_test_case_entry` to the beginning of the loaded section, and reports the prologue
/// size via set_main_prologue_size.
///
/// @return 0 on success; failures are reported through ASSERT and CHECK_ERR
///         (presumably as a non-zero return value -- see shortcuts.h)
static int load_section_main(void)
{
    int err = 0;

    // section 0 must be owned by the main actor (actor 0)
    ASSERT(test_case->metadata[0].owner == 0, "load_section_main");
    uint8_t *dest = (uint8_t *)&sandbox->code[0].section;
    uint8_t *macro_dest = sandbox->code[0].macros;

    uint64_t src_cursor = 0;    // read position in the template
    uint64_t dest_cursor = 0;   // write position in the section buffer
    uint64_t macros_cursor = 0; // write position in the macros buffer

    // reset globals
    fault_handler = NULL;
    loaded_test_case_entry = NULL;

    // select a template based on the debug mode
    uint8_t *src = (dbg_gpr_mode) ? (uint8_t *)main_segment_template_dbg_gpr
                                  : (uint8_t *)main_segment_template;

    // skip instructions inserted by the compiler and start at the TEMPLATE_START marker
    for (;; src_cursor++) {
        ASSERT(src_cursor < MAX_TEMPLATE_SIZE, "load_section_main; TEMPLATE_START");
        if (*(uint64_t *)&src[src_cursor] == TEMPLATE_START)
            break;
    }
    src_cursor += TEMPLATE_MARKER_SIZE;

    // copy the first part of the template
    for (;; src_cursor++, dest_cursor++) {
        ASSERT(src_cursor < MAX_TEMPLATE_SIZE, "load_section_main; TEMPLATE_INSERT_TC");
        if (*(uint64_t *)&src[src_cursor] == TEMPLATE_INSERT_TC)
            break;
        dest[dest_cursor] = src[src_cursor];
    }
    src_cursor += TEMPLATE_MARKER_SIZE;

    // notify Macro Loader about the prologue size of the main section
    set_main_prologue_size(dest_cursor);

    // copy the test case into the template and expand macros
    size_t size_section = 0, size_macros = 0;
    err = expand_section(0, &dest[dest_cursor], macro_dest, &size_section, &size_macros);
    CHECK_ERR("load_section_main");
    dest_cursor += size_section;
    macros_cursor += size_macros;

    // copy the template up to the default exception landing marker, and
    // set fault handler if the test case does not already declare an explicit one
    for (;; src_cursor++, dest_cursor++) {
        ASSERT(src_cursor < MAX_TEMPLATE_SIZE, "load_section_main; EXCEPTION_LANDING");
        if (*(uint64_t *)&src[src_cursor] == TEMPLATE_DEFAULT_EXCEPTION_LANDING) {

            // if the test case has an explicit fault handler, we just skip the macro
            // and leave the 8 NOP bytes for compatibility
            if (test_case->features.has_explicit_fault_handler) {
                dest_cursor += MACRO_PLACEHOLDER_SIZE;
                break;
            }

            // set the fault handler to the default one (end of the main actor)
            fault_handler = (char *)&dest[dest_cursor];

            // expand the macro for the default fault handler;
            // the symbol entry is synthesized here because this macro is not part of the test case
            tc_symbol_entry_t measurement_end = (tc_symbol_entry_t){
                .id = MACRO_FAULT_HANDLER_WITH_MEASUREMENT, .offset = 0, .owner = 0, .args = 0};
            size_macros = 0;
            err = expand_macro(&measurement_end, &dest[dest_cursor], &macro_dest[macros_cursor],
                               &size_macros);
            CHECK_ERR("load_section_main");

            macros_cursor += size_macros;
            dest_cursor += MACRO_PLACEHOLDER_SIZE;
            break;
        }
        dest[dest_cursor] = src[src_cursor];
    }
    src_cursor += TEMPLATE_MARKER_SIZE;

    // write the rest of the template
    for (;; src_cursor++, dest_cursor++) {
        ASSERT(src_cursor < MAX_TEMPLATE_SIZE, "load_section_main: TEMPLATE_END");
        if (*(uint64_t *)&src[src_cursor] == TEMPLATE_END)
            break;
        dest[dest_cursor] = src[src_cursor];
    }
    // NOTE(review): this bound is verified only after all bytes have already been written
    ASSERT(dest_cursor < MAX_EXPANDED_SECTION_SIZE, "load_section_main");

    loaded_test_case_entry = dest;
    return 0;
}

/// @brief Get the first macro in a section
///
/// Scans the symbol table of the current test case and returns the first entry that is owned by
/// the given section and is a macro (entries with `id == 0` are not macros and are skipped).
///
/// @param section_id ID of the section
/// @return Pointer to the first macro in the section, or NULL if there are no macros
///         (including the case of an empty symbol table)
static tc_symbol_entry_t *get_section_macros_start(uint64_t section_id)
{
    tc_symbol_entry_t *entry = test_case->symbol_table;
    // symbol_table_size is divided by the entry size, i.e., it is treated as a size in bytes
    tc_symbol_entry_t *end = entry + (test_case->symbol_table_size / sizeof(*entry));

    // The bounds are checked *before* an entry is dereferenced, so that an empty table
    // never causes a read past the end of the symbol table
    for (; entry < end; entry++) {
        if (entry->owner == section_id && entry->id != 0)
            return entry;
    }
    return NULL;
}

/// @brief Expand a section and its macros into destination buffers
/// @param[in] section_id ID of the section to expand
/// @param[in] dest Destination address for the expanded section code
/// @param[in] macros_dest Destination address for the expanded macros
/// @param[out] size_section Size of the expanded section
/// @param[out] size_macros Size of the expanded macros
/// @return 0 on success, -1 on failure
static int expand_section(uint64_t section_id, uint8_t *dest, uint8_t *macros_dest,
                          size_t *size_section, size_t *size_macros)
{
    int err = 0;
    uint64_t src_cursor = 0;
    uint64_t dest_cursor = 0;
    uint64_t macros_cursor = 0;

    // get the unexpanded section
    uint8_t *section = test_case->sections[section_id].code;
    size_t section_size = test_case->metadata[section_id].size;
    ASSERT(section_size <= MAX_SECTION_SIZE, "expand_section");

    // get the first macro in the section
    tc_symbol_entry_t *macro = get_section_macros_start(section_id);

    // If there are no macros to expand, just copy the code
    if (macro == NULL) {
        memcpy(dest, section, section_size);
        *size_section = section_size;
        *size_macros = 0;
        return 0;
    }

    // Otherwise, expand macros by iterating over the section and calling expand_macro
    // whenever we encounter a macro placeholder
    for (src_cursor = 0; src_cursor < section_size; src_cursor++, dest_cursor++) {
        // if a byte is *not* a macro placeholder, just copy it
        if (macro == NULL || src_cursor != macro->offset) {
            dest[dest_cursor] = section[src_cursor];
            continue;
        }
        // PRINT_ERR("macro id: %d, macro owner: %d, macro args: %d, offset: %d\n", macro->id,
        //   macro->owner, macro->args, macro->offset);

        // if we're here, we have a macro placeholder
        ASSERT(macro->owner == section_id, "expand_section");
        ASSERT(macro->id != 0, "expand_section");

        // expand the macro into the destination buffers
        size_t macro_size = 0;
        err = expand_macro(macro, &dest[dest_cursor], &macros_dest[macros_cursor], &macro_size);
        CHECK_ERR("expand_section");

        // move the cursors
        src_cursor += MACRO_PLACEHOLDER_SIZE - 1;  // -1 because it will be incremented in the loop
        dest_cursor += MACRO_PLACEHOLDER_SIZE - 1; // -1 because it will be incremented in the loop
        macros_cursor += macro_size;
        macro++;

        // if we're done with macros in this section, set the macro pointer to NULL
        if (macro->owner != section_id)
            macro = NULL;
    }

    // ensure that we did not have an overrun
    ASSERT(src_cursor == section_size, "expand_section");

    *size_section = dest_cursor;
    *size_macros = macros_cursor;
    return 0;
}

// =================================================================================================
/// @brief Initialize the code loader; currently there is nothing to set up
/// @return Always 0
int init_code_loader(void)
{
    // NOTE: we assume the sandbox is already allocated by sandbox_manager
    return 0;
}

/// @brief Release resources of the code loader; intentionally empty because
///        init_code_loader does not allocate anything
void free_code_loader(void) {}


================================================
FILE: rvzr/executor_km/data_loader.c
================================================
/// File:
///  - Parsing inputs and test cases
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#include "hardware_desc.h"

#include "actor.h"
#include "data_loader.h"
#include "input_parser.h"
#include "main.h"
#include "sandbox_manager.h"
#include "shortcuts.h"

/// @brief This function serves a dual purpose:
/// - it initializes the data area of the sandbox with the values from the current input
/// - it (indirectly) sets the microarchitectural state of some of the memory buffers (e.g., the
///   store buffer) to a state that depends on the current input; hence, we reduce the
///   non-determinism of the measurements
/// @param input_id Index of the input to load; it is passed to get_input_fragment_unsafe
///                 without any validation in this function
/// @return Always 0
int load_sandbox_data(int input_id)
{
    // NOTE: this function intentionally does not use memset (with a few exceptions), because
    // we found that direct initialization is more effective at priming the uarch state

    for (int actor_id = 0; actor_id < n_actors; actor_id++) {
        actor_data_t *dest = &sandbox->data[actor_id];
        input_fragment_t *source = get_input_fragment_unsafe(input_id, actor_id);

        // Zero-initialize the areas surrounding the sandbox
        // (skipped entirely in the quick-and-dirty mode)
        if (!quick_and_dirty_mode) {
            memset(&dest->underflow_pad[0], 0, UNDERFLOW_PAD_SIZE * sizeof(char));
            for (int j = 0; j < OVERFLOW_PAD_SIZE / 8; j += 1) {
                // ((uint64_t *) sandbox->underflow_pad)[j] = 0;
                ((uint64_t *)dest->overflow_pad)[j] = 0;
            }
        }

        // Initialize the main and faulty areas of the sandbox data
        // (copied in 8-byte words; the area sizes are assumed to be multiples of 8)
        uint64_t *main_src = (uint64_t *)source->main_area;
        uint64_t *main_dest = (uint64_t *)dest->main_area;
        for (int j = 0; j < MAIN_AREA_SIZE / 8; j += 1) {
            main_dest[j] = main_src[j];
        }

        uint64_t *faulty_src = (uint64_t *)source->faulty_area;
        uint64_t *faulty_dest = (uint64_t *)dest->faulty_area;
        for (int j = 0; j < FAULTY_AREA_SIZE / 8; j += 1) {
            faulty_dest[j] = faulty_src[j];
        }

        // Initial register values
        // (the registers will be set to these values in code_loader template)
        uint64_t *reg_src = (uint64_t *)source->reg_init_region;
        uint64_t *reg_dest = (uint64_t *)dest->reg_init_area;
        for (int j = 0; j < REG_INIT_AREA_SIZE / 8; j += 1) {
            reg_dest[j] = reg_src[j];
        }

        // - Ensure that the flags are valid (the flags value is stored in word 6)
        //   x86: 2263 == 0x8D7 keeps only bits 0, 2, 4, 6, 7 and 11 (CF, PF, AF, ZF, SF, OF)
        //        and bit 1; `| 2` forces bit 1, which always reads as 1 in RFLAGS
        //   ARM: the value is shifted left by 28 bits, presumably to place its low bits
        //        at the NZCV positions [31:28] -- TODO confirm
#if defined(ARCH_X86_64)
        reg_dest[6] = (reg_src[6] & 2263) | 2;
#elif defined(ARCH_ARM)
        reg_dest[6] = (reg_src[6] << 28);
#endif

        // Note: RSP and RBP do not take a value from the input,
        //       and are rather set to the stack base
    }

#if defined(ARCH_X86_64)
    // - Initialize SIMD registers
    // Note: GPRs will be initialized directly by the test case template; see code_loader.c
    // Note: the values are always taken from the fragment of actor 0, starting at
    //       byte offset 64 of its register initialization region
    uint64_t *simd_src = (uint64_t *)&get_input_fragment_unsafe(input_id, 0)->reg_init_region[64];
    asm volatile(""
                 "movq 0x00(%0), %%mm0\n"
                 "movq 0x08(%0), %%mm1\n"
                 "movq 0x10(%0), %%mm2\n"
                 "movq 0x18(%0), %%mm3\n"
                 "movq 0x20(%0), %%mm4\n"
                 "movq 0x28(%0), %%mm5\n"
                 "movq 0x30(%0), %%mm6\n"
                 "movq 0x38(%0), %%mm7\n"
                 // Note: overlap between YMM and MMX init values is intentional
                 "vmovdqa 0x00(%0), %%ymm0\n"
                 "vmovdqa 0x20(%0), %%ymm1\n"
                 "vmovdqa 0x40(%0), %%ymm2\n"
                 "vmovdqa 0x60(%0), %%ymm3\n"
                 "vmovdqa 0x80(%0), %%ymm4\n"
                 "vmovdqa 0xa0(%0), %%ymm5\n"
                 "vmovdqa 0xc0(%0), %%ymm6\n"
                 "vmovdqa 0xe0(%0), %%ymm7\n" ::"r"(&simd_src[0]));
#endif

    return 0;
}

// =================================================================================================
/// @brief Initialize the data loader; there is no state to set up
/// @return Always 0
int init_data_loader(void) { return 0; }

/// @brief Release resources of the data loader; intentionally empty because
///        init_data_loader does not allocate anything
void free_data_loader(void) {}


================================================
FILE: rvzr/executor_km/include/actor.h
================================================
/// File: Header describing actor metadata
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#ifndef _ACTOR_H_
#define _ACTOR_H_

#include <linux/types.h>

#define MAX_ACTORS 16

typedef uint64_t actor_id_t;
typedef uint64_t actor_mode_t;
typedef uint64_t actor_pl_t;

// Execution modes of an actor
// (presumably the values stored in actor_mode_t / actor_metadata_t.mode -- confirm)
enum {
    MODE_HOST = 0,
    MODE_GUEST = 1,
};

// Privilege levels of an actor
// (presumably the values stored in actor_pl_t / actor_metadata_t.pl -- confirm)
enum {
    PL_KERNEL = 0,
    PL_USER = 1,
};

// Description of a single actor; all fields are 64-bit wide
typedef struct {
    actor_id_t id;                // identifier of the actor
    actor_mode_t mode;            // presumably one of MODE_HOST / MODE_GUEST -- confirm
    actor_pl_t pl;                // presumably one of PL_KERNEL / PL_USER -- confirm
    uint64_t data_permissions;    // encoding is not defined in this header
    uint64_t data_ept_properties; // encoding is not defined in this header
    uint64_t code_permissions;    // encoding is not defined in this header
} actor_metadata_t;

extern size_t n_actors;
extern actor_metadata_t *actors;

#endif // _ACTOR_H_


================================================
FILE: rvzr/executor_km/include/asm_snippets.h
================================================
/// File: Building blocks for creating macros;
///       This file re-directs to the correct architecture-specific file.
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#ifndef _ASM_SNIPPETS_H_
#define _ASM_SNIPPETS_H_

#include "hardware_desc.h"

#if defined(ARCH_X86_64)
#include "../x86/asm_snippets.h"
#elif defined(ARCH_ARM)
#include "../arm64/asm_snippets.h"
#endif

#endif // _ASM_SNIPPETS_H_

================================================
FILE: rvzr/executor_km/include/code_loader.h
================================================
/// File: Header for code_loader.c
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#ifndef _CODE_LOADER_H_
#define _CODE_LOADER_H_

#include <linux/types.h>

extern uint8_t *loaded_test_case_entry;

int load_sandbox_code(void);

int init_code_loader(void);
void free_code_loader(void);

#endif // _CODE_LOADER_H_


================================================
FILE: rvzr/executor_km/include/data_loader.h
================================================
/// File: Header for data_loader.c
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#ifndef _DATA_LOADER_H_
#define _DATA_LOADER_H_

#include <linux/types.h>

int load_sandbox_data(int input_id);

int init_data_loader(void);
void free_data_loader(void);

#endif // _DATA_LOADER_H_


================================================
FILE: rvzr/executor_km/include/fault_handler.h
================================================
/// File: Header for fault handling
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#ifndef _FAULT_HANDLER_H_
#define _FAULT_HANDLER_H_

#include "hardware_desc.h"
#include <linux/interrupt.h>
#include <linux/version.h>

#if LINUX_VERSION_CODE < KERNEL_VERSION(5, 10, 0)
// Local definition of struct idt_data; it is compiled only for kernels older than 5.10
// (see the enclosing version check). NOTE(review): presumably mirrors the kernel-internal
// structure of the same name -- confirm against the targeted kernel sources
struct idt_data {
    unsigned int vector;
    unsigned int segment;
    struct idt_bits bits;
    const void *addr;
};
#endif

#ifdef ARCH_X86_64

#include <../arch/x86/include/asm/traps.h>

// By default, we handle General Protection Fault and Page Fault
#define HANDLED_FAULTS_DEFAULT ((1 << X86_TRAP_GP) | (1 << X86_TRAP_PF))

#elif defined(ARCH_ARM)

// FIXME: exception handling is not implemented for ARM
#define HANDLED_FAULTS_DEFAULT 0

#endif

extern char *fault_handler;
extern uint32_t handled_faults;

// x86-only globals
extern struct desc_ptr test_case_idtr;

void set_outer_fault_handlers(void);
void unset_outer_fault_handlers(void);
void set_inner_fault_handlers(void);
void unset_inner_fault_handlers(void);

int init_fault_handler(void);
void free_fault_handler(void);

#endif // _FAULT_HANDLER_H_


================================================
FILE: rvzr/executor_km/include/hardware_desc.h
================================================
/// File: Header for hardware configuration
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#ifndef _HARDWARE_DESC_H_
#define _HARDWARE_DESC_H_

#include <linux/types.h>

#ifndef VENDOR_ID
#error "Undefined VENDOR_ID"
#define VENDOR_ID 0
#endif

#if VENDOR_ID != 1 && VENDOR_ID != 2 && VENDOR_ID != 3
#error "Unsupported/corrupted VENDOR_ID"
#endif

#define VENDOR_INTEL_ 1
#define VENDOR_AMD_   2
#define VENDOR_ARM_   3
#undef VENDOR_INTEL
#undef VENDOR_AMD
#undef VENDOR_ARM

#if VENDOR_ID == VENDOR_INTEL_
#define ARCH_X86_64
#elif VENDOR_ID == VENDOR_AMD_
#define ARCH_X86_64
#elif VENDOR_ID == VENDOR_ARM_
#define ARCH_ARM
#endif

// =================================================================================================
// CPU identification
// =================================================================================================
#ifndef __ASSEMBLER__
#if defined(ARCH_X86_64)
typedef struct cpuinfo_x86 cpuinfo_t;
#elif defined(ARCH_ARM)
// ARM variant of cpuinfo_t (on x86-64, cpuinfo_t aliases struct cpuinfo_x86 instead).
// NOTE(review): the field names look like the fields of the MIDR_EL1 register -- confirm
typedef struct {
    int implementer;
    int variant;
    int architecture;
    int part;
    int revision;
} cpuinfo_t;
#endif
#endif // __ASSEMBLER__

// =================================================================================================
// Memory configuration
// =================================================================================================
#ifndef PHYSICAL_WIDTH
#define PHYSICAL_WIDTH 51 // unused in the build; used only for syntax highlighting
#error "PHYSICAL_WIDTH must be defined by the makefile"
#endif

#define MAX_PHYSICAL_ADDRESS ((1ULL << PHYSICAL_WIDTH) - 1)

// =================================================================================================
// Cache configuration
// =================================================================================================
#ifndef L1D_ASSOCIATIVITY
#error "Undefined L1D_ASSOCIATIVITY"
#define L1D_ASSOCIATIVITY 0
#elif L1D_ASSOCIATIVITY != 12 && L1D_ASSOCIATIVITY != 8 && L1D_ASSOCIATIVITY != 4 &&               \
    L1D_ASSOCIATIVITY != 2
#warning "Unsupported/corrupted L1D associativity. Falling back to 8-way"
#define L1D_ASSOCIATIVITY 8
#endif

#ifndef L1D_SIZE_KB
#error "Undefined L1D_SIZE"
#define L1D_SIZE_KB 32 // unused in the build; used only for syntax highlighting
#else
#endif

#define L1D_CONFLICT_DISTANCE (L1D_SIZE_KB * 1024 / L1D_ASSOCIATIVITY)

// =================================================================================================
// Misc.
// =================================================================================================

// Definitions of MSRs missing in the kernel
#define MSR_SYSCFG 0xc0010010

#endif // _HARDWARE_DESC_H_


================================================
FILE: rvzr/executor_km/include/input_parser.h
================================================
/// File: Header for the input parser
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#ifndef _INPUT_PARSER_H_
#define _INPUT_PARSER_H_

#include "sandbox_manager.h"

#define REG_INIT_AREA_SIZE_ALIGNED 4096

typedef uint64_t input_fragment_size_t;
typedef uint64_t input_fragment_reserved_field_t;

// Metadata of a single input fragment; two 64-bit fields (16 bytes)
typedef struct {
    input_fragment_size_t size;               // size of the fragment (units not shown here)
    input_fragment_reserved_field_t reserved; // reserved; no users are visible in this header
} input_fragment_metadata_entry_t;

// Input data for one actor; its total size equals FRAGMENT_SIZE_ALIGNED
typedef struct {
    char main_area[MAIN_AREA_SIZE];     // copied into the main area of the actor's sandbox data
    char faulty_area[FAULTY_AREA_SIZE]; // copied into the faulty area of the actor's sandbox data
    // initial register values; the region is padded to REG_INIT_AREA_SIZE_ALIGNED (4096) bytes
    char reg_init_region[REG_INIT_AREA_SIZE_ALIGNED];
} input_fragment_t;

// A batch of inputs: a metadata array and a data array of fragments
typedef struct {
    size_t metadata_size; // size of `metadata` (presumably in bytes -- confirm)
    size_t data_size;     // size of `data` (presumably in bytes -- confirm)
    input_fragment_metadata_entry_t *metadata;
    input_fragment_t *data;
} input_batch_t;

#define MAX_INPUTS            (1024 * 1024)
#define BATCH_HEADER_SIZE     16 // sizeof(n_actors) + sizeof(n_inputs)
#define FRAGMENT_SIZE_ALIGNED (MAIN_AREA_SIZE + FAULTY_AREA_SIZE + REG_INIT_AREA_SIZE_ALIGNED)

extern input_batch_t *inputs;
extern size_t n_inputs;

input_fragment_t *get_input_fragment(uint64_t input_id, uint64_t actor_id);
input_fragment_t *get_input_fragment_unsafe(uint64_t input_id, uint64_t actor_id);
ssize_t parse_input_buffer(const char *buf, size_t count, bool *finished);
bool input_parsing_completed(void);

int init_input_parser(void);
void free_input_parser(void);

#endif // _INPUT_PARSER_H_


================================================
FILE: rvzr/executor_km/include/macro_expansion.h
================================================
/// File: Header for test case macro loader
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#ifndef _RVZR_MACRO_LOADER_H_
#define _RVZR_MACRO_LOADER_H_

#include "hardware_desc.h"

#include "asm_snippets.h"
#include "test_case_parser.h"
#include <linux/types.h>

// =================================================================================================
// Lists of possible macros
// =================================================================================================
// IDs of symbol table entries. The value 0 marks an entry that is not a macro
// (the code loader skips entries with `id == 0` when it searches for macros);
// all other values identify the macro to be expanded.
// The numeric values are explicit, presumably because they are shared with the
// test case producer -- do not renumber without confirming
typedef enum {
    NONMACRO_FUNCTION = 0,
    MACRO_MEASUREMENT_START = 1,
    MACRO_MEASUREMENT_END = 2,
    MACRO_FAULT_HANDLER = 3,
    MACRO_SWITCH = 4,
    MACRO_SET_K2U_TARGET = 5,
    MACRO_SWITCH_K2U = 6,
    MACRO_SET_U2K_TARGET = 7,
    MACRO_SWITCH_U2K = 8,
    MACRO_SET_H2G_TARGET = 9,
    MACRO_SWITCH_H2G = 10,
    MACRO_SET_G2H_TARGET = 11,
    MACRO_SWITCH_G2H = 12,
    MACRO_LANDING_K2U = 13,
    MACRO_LANDING_U2K = 14,
    MACRO_LANDING_H2G = 15,
    MACRO_LANDING_G2H = 16,
    // expanded by the code loader as the default fault handler of the main section
    MACRO_FAULT_HANDLER_WITH_MEASUREMENT = 17,
    MACRO_SET_DATA_PERMISSIONS = 18,
} macro_name_e;

// Concrete macro implementations. The values are implicit (TYPE_UNDEFINED == 0).
// NOTE(review): presumably used as the index into macro_descriptors[], with the measurement
// macros resolved to a subtype according to the measurement mode -- confirm in the macro loader
typedef enum {
    TYPE_UNDEFINED,
    TYPE_PRIME,
    TYPE_FAST_PRIME,
    TYPE_PARTIAL_PRIME,
    TYPE_FAST_PARTIAL_PRIME,
    TYPE_PROBE,
    TYPE_FLUSH,
    TYPE_EVICT,
    TYPE_RELOAD,
    TYPE_TSC_START,
    TYPE_TSC_END,
    TYPE_FAULT_HANDLER,
    TYPE_FAULT_AND_PROBE,
    TYPE_FAULT_AND_RELOAD,
    TYPE_FAULT_AND_TSC_END,
    TYPE_SWITCH,
    TYPE_SET_K2U_TARGET,
    TYPE_SWITCH_K2U,
    TYPE_SET_U2K_TARGET,
    TYPE_SWITCH_U2K,
    TYPE_SET_H2G_TARGET,
    TYPE_SWITCH_H2G,
    TYPE_SET_G2H_TARGET,
    TYPE_SWITCH_G2H,
    TYPE_LANDING_K2U,
    TYPE_LANDING_U2K,
    TYPE_LANDING_H2G,
    TYPE_LANDING_G2H,
    TYPE_SET_DATA_PERMISSIONS,
} macro_subtype_e;

// =================================================================================================
// Macro descriptors
// =================================================================================================
// Arguments for a macro
// Up to four 16-bit arguments of a macro plus the ID of the owner of the macro.
// NOTE(review): the arguments are presumably unpacked from the 64-bit `args` field of
// tc_symbol_entry_t -- confirm in the macro loader
typedef struct {
    uint16_t arg1;
    uint16_t arg2;
    uint16_t arg3;
    uint16_t arg4;
    uint64_t owner;
} macro_args_t;

// Descriptor of a macro
typedef struct {
    // callback that receives the macro arguments and a destination buffer and returns a size
    // (presumably the number of bytes it wrote to `dest` -- confirm)
    size_t (*start)(macro_args_t args, uint8_t *dest);
    // function holding the macro body (presumably delimited by the MACRO_START / MACRO_END
    // tokens and copied rather than called -- confirm)
    void (*body)(void);
} macro_descr_t;

extern macro_descr_t macro_descriptors[];

// =================================================================================================
// Constants for parsing macro bodies
// =================================================================================================
// Code tokens
#define MACRO_START              0x0fff379000000000
#define MACRO_END                0x0fff2f9000000000
#define MACRO_START_TOKEN_LENGTH 8
#define MACRO_END_TOKEN_LENGTH   8

#if defined(ARCH_X86_64)
#define MACRO_PLACEHOLDER_SIZE 8
#elif defined(ARCH_ARM)
#define MACRO_PLACEHOLDER_SIZE 12
#endif

// =================================================================================================
// Public interface
// =================================================================================================
int expand_macro(tc_symbol_entry_t *macro, uint8_t *dest, uint8_t *macro_dest, size_t *macro_size);
void set_main_prologue_size(size_t size);
size_t get_main_prologue_size(void);

#endif // _RVZR_MACRO_LOADER_H_


================================================
FILE: rvzr/executor_km/include/main.h
================================================
/// File: Main Header
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#ifndef _RVZR_EXECUTOR_MAIN_H_
#define _RVZR_EXECUTOR_MAIN_H_

#include <asm/cpu.h>
#include <linux/types.h>
#include <linux/version.h>

#include "hardware_desc.h"

// Measurement techniques selectable via the `measurement_mode` configuration variable;
// the default is PRIME_PROBE (see MEASUREMENT_MODE_DEFAULT). The values are implicit,
// starting from PRIME_PROBE == 0
typedef enum {
    PRIME_PROBE,
    PARTIAL_PRIME_PROBE,
    FAST_PRIME_PROBE,
    FAST_PARTIAL_PRIME_PROBE,
    FLUSH_RELOAD,
    EVICT_RELOAD,
    TSC,
} measurement_mode_e;

#define EXECUTOR_DEBUG 0

// Executor Configuration Interface
extern bool quick_and_dirty_mode;
extern measurement_mode_e measurement_mode;
#define MEASUREMENT_MODE_DEFAULT PRIME_PROBE
extern long uarch_reset_rounds;
#define UARCH_RESET_ROUNDS_DEFAULT 1
extern bool enable_ssbp_patch;
#define SSBP_PATCH_DEFAULT true
extern bool enable_prefetchers;
#define PREFETCHER_DEFAULT false
extern char pre_run_flush;
#define PRE_RUN_FLUSH_DEFAULT 1
extern bool enable_hpa_gpa_collisions;
#define HPA_GPA_COLLISIONS_DEFAULT false
extern bool dbg_gpr_mode;
#define DBG_GPR_MODE_DEFAULT false

// Linux Kernel compatibility
#if LINUX_VERSION_CODE >= KERNEL_VERSION(5, 4, 0)
#include <linux/kallsyms.h>
extern int (*set_memory_x)(unsigned long, int);
extern int (*set_memory_nx)(unsigned long, int);
#else
#include <linux/set_memory.h>
#endif

extern cpuinfo_t *cpuinfo; // cached result of cpu_data for CPU 0

#endif // _RVZR_EXECUTOR_MAIN_H_


================================================
FILE: rvzr/executor_km/include/measurement.h
================================================
/// File: Header for the measurement manager
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#ifndef _MEASUREMENT_H_
#define _MEASUREMENT_H_

#include <linux/types.h>
#include <linux/version.h>

#define HTRACE_WIDTH 1
#define NUM_PFC      5

#define STATUS_UNINITIALIZED 0
#define STATUS_STARTED       1
#define STATUS_ENDED         2

// Status of a single measurement; packed, 8 bytes in total (1 + 3 + 4)
typedef struct measurement_status {
    uint8_t measurement_state; // presumably one of the STATUS_* values -- confirm
    uint8_t reserved[3];       // pads the structure so that smi_count starts at offset 4
    uint32_t smi_count;
} __attribute__((packed)) measurement_status_t;

// Result of a single measurement; packed, so the layout is exactly
// HTRACE_WIDTH + NUM_PFC 64-bit words followed by the status
typedef struct Measurement {
    uint64_t htrace[HTRACE_WIDTH];  // hardware trace
    uint64_t pfc_reading[NUM_PFC];  // presumably performance counter readings -- confirm
    measurement_status_t status;
} __attribute__((packed)) measurement_t;

extern measurement_t *measurements;

int trace_test_case(void);
int run_experiment(void);

void recover_orig_state(void);

int alloc_measurements(void);
int init_measurements(void);
void free_measurements(void);

#endif // _MEASUREMENT_H_


================================================
FILE: rvzr/executor_km/include/page_tables_common.h
================================================
/// File: Dispatch header that includes the correct page tables definitions for the architecture
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#ifndef _PAGE_TABLES_COMMON_H_
#define _PAGE_TABLES_COMMON_H_

#include "hardware_desc.h"
#include <linux/slab.h> // PAGE_SIZE
#include <linux/types.h>

#define ENTRIES_PER_PAGE (PAGE_SIZE / sizeof(uint64_t))

// =================================================================================================
// X86
// =================================================================================================
#if defined(ARCH_X86_64)

#define MODIFIABLE_PTE_BITS                                                                        \
    (_PAGE_PRESENT | _PAGE_RW | _PAGE_PWT | _PAGE_PCD | _PAGE_ACCESSED | _PAGE_DIRTY |             \
     _PAGE_PKEY_BIT0 | _PAGE_PKEY_BIT1 | _PAGE_PKEY_BIT2 | _PAGE_PKEY_BIT3 | _PAGE_NX |            \
     (1ULL << 51))

#define _E_PAGE_PRESENT  (1 << 0)
#define _E_PAGE_RW       (1 << 1)
#define _E_PAGE_X        (1 << 2)
#define _E_PAGE_ACCESSED (1 << 8)
#define _E_PAGE_DIRTY    (1 << 9)
#define _E_PAGE_USER     (1 << 10)

#if VENDOR_ID == VENDOR_INTEL_ // Intel
#define MODIFIABLE_EPTE_BITS                                                                       \
    (_E_PAGE_PRESENT | _E_PAGE_RW | _E_PAGE_X | _E_PAGE_ACCESSED | _E_PAGE_DIRTY | _E_PAGE_USER |  \
     (1ULL << 51))
#else
#define MODIFIABLE_EPTE_BITS MODIFIABLE_PTE_BITS
#endif

// -------------------------------------------------------------------------------------------------
// Normal page tables
// -------------------------------------------------------------------------------------------------
#define PML4_SHIFT     39
#define PDPT_SHIFT     30
#define PDT_SHIFT      21
#define PT_SHIFT       12
#define MAX_VADDR_BITS 48

#define PML4_INDEX(vaddr) (((uint64_t)(vaddr) >> PML4_SHIFT) & 0x1FF)
#define PDPT_INDEX(vaddr) (((uint64_t)(vaddr) >> PDPT_SHIFT) & 0x1FF)
#define PDT_INDEX(vaddr)  (((uint64_t)(vaddr) >> PDT_SHIFT) & 0x1FF)
#define PT_INDEX(vaddr)   (((uint64_t)(vaddr) >> PT_SHIFT) & 0x1FF)

// Table 4-15. Format of a PML4 Entry (PML4E) that References a Page-Directory-Pointer Table
// The bit-fields add up to exactly 64 bits; the width of `paddr` depends on PHYSICAL_WIDTH,
// and the remaining bits up to bit 51 are covered by `reserved_51_M`
typedef struct {
    uint64_t present : 1;
    uint64_t write_access : 1;
    uint64_t user_supervisor : 1;
    uint64_t page_write_through : 1;
    uint64_t page_cache_disable : 1;
    uint64_t accessed : 1;
    uint64_t ignored : 1;
    uint64_t reserved_zero : 1;
    uint64_t ignored_11_8 : 4;
    uint64_t paddr : (PHYSICAL_WIDTH - 12);
#if PHYSICAL_WIDTH < 52
    uint64_t reserved_51_M : (52 - PHYSICAL_WIDTH);
#endif
    uint64_t ignored_62_52 : 11;
    uint64_t execute_disable : 1;
} __attribute__((packed)) pml4e_t;

// Table 4-17. Format of a Page-Directory-Pointer-Table Entry (PDPTE) that
// References a Page Directory
// The field layout is identical to pml4e_t; the bit-fields add up to exactly 64 bits
typedef struct {
    uint64_t present : 1;
    uint64_t write_access : 1;
    uint64_t user_supervisor : 1;
    uint64_t page_write_through : 1;
    uint64_t page_cache_disable : 1;
    uint64_t accessed : 1;
    uint64_t ignored : 1;
    uint64_t reserved_zero : 1;
    uint64_t ignored_11_8 : 4;
    uint64_t paddr : (PHYSICAL_WIDTH - 12);
#if PHYSICAL_WIDTH < 52
    uint64_t reserved_51_M : (52 - PHYSICAL_WIDTH);
#endif
    uint64_t ignored_62_52 : 11;
    uint64_t execute_disable : 1;
} __attribute__((packed)) pdpte_t;

// Table 4-19. Format of a Page-Directory Entry that References a Page Table
// The field layout is identical to pml4e_t; the bit-fields add up to exactly 64 bits
typedef struct {
    uint64_t present : 1;
    uint64_t write_access : 1;
    uint64_t user_supervisor : 1;
    uint64_t page_write_through : 1;
    uint64_t page_cache_disable : 1;
    uint64_t accessed : 1;
    uint64_t ignored : 1;
    uint64_t reserved_zero : 1;
    uint64_t ignored_11_8 : 4;
    uint64_t paddr : (PHYSICAL_WIDTH - 12);
#if PHYSICAL_WIDTH < 52
    uint64_t reserved_51_M : (52 - PHYSICAL_WIDTH);
#endif
    uint64_t ignored_62_52 : 11;
    uint64_t execute_disable : 1;
} __attribute__((packed)) pdte_t;

// Table 4-20. Format of a Page-Table Entry that Maps a 4-KByte Page
// Unlike the upper-level entries, the leaf entry has the dirty, PAT and global bits
// as well as a 4-bit protection key; the bit-fields add up to exactly 64 bits
typedef struct {
    uint64_t present : 1;
    uint64_t write_access : 1;
    uint64_t user_supervisor : 1;
    uint64_t page_write_through : 1;
    uint64_t page_cache_disable : 1;
    uint64_t accessed : 1;
    uint64_t dirty : 1;
    uint64_t page_attribute_table : 1;
    uint64_t global_page : 1;
    uint64_t ignored_11_9 : 3;
    uint64_t paddr : (PHYSICAL_WIDTH - 12);
#if PHYSICAL_WIDTH < 52
    uint64_t reserved_51_M : (52 - PHYSICAL_WIDTH);
#endif
    uint64_t ignored_58_52 : 7;
    uint64_t protection_key : 4;
    uint64_t execute_disable : 1;
} __attribute__((packed)) pte_t_; // using pte_t_ as pte_t is already defined in linux/types.h

// -------------------------------------------------------------------------------------------------
// Extended page tables
// -------------------------------------------------------------------------------------------------

// Figure 29-1. Formats of EPTP and EPT Paging-Structure Entries
// Layout of the extended-page-table pointer (EPTP); the bit-fields add up to exactly 64 bits
typedef struct {
    uint64_t memory_type : 3;
    uint64_t page_walk_length : 3;
    uint64_t ad_enabled : 1;
    uint64_t superv_sdw_stack : 1;
    uint64_t reserved_11_08 : 4;
    uint64_t paddr : (PHYSICAL_WIDTH - 12);
#if PHYSICAL_WIDTH < 52
    uint64_t reserved_51_M : (52 - PHYSICAL_WIDTH);
#endif
    uint64_t reserved_63_52 : 12;
} __attribute__((packed)) eptp_t;

// Top-level entry of the extended (second-level) page tables:
// a dedicated EPT format on Intel (VENDOR_ID 1 is VENDOR_INTEL_), and
// the format of the normal page tables on all other vendors
#if VENDOR_ID == 1 // Intel
// Table 28-1. Format of an EPT PML4E
typedef struct {
    uint64_t read_access : 1;
    uint64_t write_access : 1;
    uint64_t execute_access : 1;
    uint64_t reserved_7_3 : 5;
    uint64_t accessed : 1;
    uint64_t ignored_9 : 1;
    uint64_t user_ex_access : 1;
    uint64_t ignored_11 : 1;
    uint64_t paddr : (PHYSICAL_WIDTH - 12);
#if PHYSICAL_WIDTH < 52
    uint64_t reserved_51_M : (52 - PHYSICAL_WIDTH);
#endif
    uint64_t ignored_63_52 : 12;
} __attribute__((packed)) epml4e_t;
#else
typedef pml4e_t epml4e_t;
#endif

// Second-level entry of the extended page tables: a dedicated EPT format on Intel
// (VENDOR_ID 1 is VENDOR_INTEL_), and the normal PDPTE format on all other vendors
#if VENDOR_ID == 1 // Intel
// Table 28-3. Format of an EPT Page-Directory-Pointer-Table Entry (EPT PDPTE)
typedef struct {
    uint64_t read_access : 1;
    uint64_t write_access : 1;
    uint64_t execute_access : 1;
    uint64_t reserved_6_3 : 4;
    uint64_t reserved_7 : 1;
    uint64_t accessed : 1;
    uint64_t ignored_9 : 1;
    uint64_t user_ex_access : 1;
    uint64_t ignored_11 : 1;
    uint64_t paddr : (PHYSICAL_WIDTH - 12);
#if PHYSICAL_WIDTH < 52
    uint64_t reserved_51_M : (52 - PHYSICAL_WIDTH);
#endif
    uint64_t ignored_63_52 : 12;
} __attribute__((packed)) epdpte_t;
#else
typedef pdpte_t epdpte_t;
#endif

#if VENDOR_ID == 1 // Intel
// Bit-field view of a 64-bit EPT page-directory entry (EPT PDE); field-for-field identical to
// epdpte_t. M below is PHYSICAL_WIDTH.
// NOTE: bit ranges assume allocation from the least-significant bit.
typedef struct {
    uint64_t read_access : 1;    // bit 0
    uint64_t write_access : 1;   // bit 1
    uint64_t execute_access : 1; // bit 2
    uint64_t reserved_6_3 : 4;   // bits 6:3
    uint64_t reserved_7 : 1;     // bit 7
    uint64_t accessed : 1;       // bit 8
    uint64_t ignored_9 : 1;      // bit 9
    uint64_t user_ex_access : 1; // bit 10
    uint64_t ignored_11 : 1;     // bit 11
    uint64_t paddr : (PHYSICAL_WIDTH - 12); // bits M-1:12
#if PHYSICAL_WIDTH < 52
    uint64_t reserved_51_M : (52 - PHYSICAL_WIDTH); // bits 51:M; omitted when M == 52
#endif
    uint64_t ignored_63_52 : 12; // bits 63:52
} __attribute__((packed)) epdte_t;
#else
// Other vendors: the EPT page-directory entry reuses the layout of the regular pdte_t
typedef pdte_t epdte_t;
#endif

#if VENDOR_ID == 1 // Intel
// Bit-field view of a 64-bit last-level EPT entry (EPT PTE); M below is PHYSICAL_WIDTH.
// The trailing underscore mirrors pte_t_, which this type aliases on non-Intel builds.
// NOTE: bit ranges assume allocation from the least-significant bit.
typedef struct {
    uint64_t read_access : 1;    // bit 0
    uint64_t write_access : 1;   // bit 1
    uint64_t execute_access : 1; // bit 2
    uint64_t ept_mem_type : 3;   // bits 5:3
    uint64_t ignore_pat : 1;     // bit 6
    uint64_t ignored_7 : 1;      // bit 7
    uint64_t accessed : 1;       // bit 8
    uint64_t dirty : 1;          // bit 9
    uint64_t user_ex_access : 1; // bit 10
    uint64_t ignored_11 : 1;     // bit 11
    uint64_t paddr : (PHYSICAL_WIDTH - 12); // bits M-1:12
#if PHYSICAL_WIDTH < 52
    uint64_t reserved_51_M : (52 - PHYSICAL_WIDTH); // bits 51:M; omitted when M == 52
#endif
    uint64_t ignored_56_52 : 5;    // bits 56:52
    uint64_t verif_guest_pag : 1;  // bit 57
    uint64_t pag_write_access : 1; // bit 58
    uint64_t ignored_59 : 1;       // bit 59
    uint64_t superv_sdw_stack : 1; // bit 60
    uint64_t subpg_write_perm : 1; // bit 61
    uint64_t ignored_62 : 1;       // bit 62
    uint64_t suppress_ve : 1;      // bit 63
} __attribute__((packed)) epte_t_;
#else
// Other vendors: the last-level EPT entry reuses the layout of the regular pte_t_
typedef pte_t_ epte_t_;
#endif

/// @brief Set the user_supervisor bit of a page-table entry
/// @param pte Entry to modify in place; must not be NULL (it is dereferenced unconditionally)
static inline void set_user_bit(pte_t_ *pte)
{
    pte->user_supervisor = 1;
}

// =================================================================================================
// ARM
// =================================================================================================
#elif defined(ARCH_ARM)

// NOTE: All definitions below assume 4KB pages
//
// NOTE: The formats are described in the ARMv8-A Architecture Reference Manual
//       see D8.3.1 VMSAv8-64 descriptor formats

#define MODIFIABLE_PTE_BITS (PTE_VALID | PTE_USER | PTE_RDONLY)

// Bit-field view of a 64-bit descriptor that carries the *_table attribute fields in its top
// bits. The widths add up to exactly 64.
// NOTE: bit ranges assume allocation from the least-significant bit.
typedef struct {
    uint64_t valid : 1;         // bit 0
    uint64_t type : 1;          // bit 1
    uint64_t ignored_2_7 : 6;   // bits 7:2
    uint64_t nlta_high : 2;     // bits 9:8
    uint64_t access_flag : 1;   // bit 10
    uint64_t ignored_11 : 1;    // bit 11
    uint64_t nlta_low : 38;     // bits 49:12
    uint64_t reserved_50 : 1;   // bit 50
    uint64_t ignored_51_58 : 8; // bits 58:51
    uint64_t pxn_table : 1;     // bit 59
    uint64_t uxn_table : 1;     // bit 60
    uint64_t ap_table : 2;      // bits 62:61
    uint64_t ns_table : 1;      // bit 63
} __attribute__((packed)) l1_descr_t;

// Bit-field view of a 64-bit descriptor with the same low 59 bits as l1_descr_t; the top five
// bits (where l1_descr_t has the *_table fields) are a single reserved field here.
// NOTE: bit ranges assume allocation from the least-significant bit.
typedef struct {
    uint64_t valid : 1;          // bit 0
    uint64_t type : 1;           // bit 1
    uint64_t ignored_2_7 : 6;    // bits 7:2
    uint64_t nlta_high : 2;      // bits 9:8
    uint64_t access_flag : 1;    // bit 10
    uint64_t ignored_11 : 1;     // bit 11
    uint64_t nlta_low : 38;      // bits 49:12
    uint64_t reserved_50 : 1;    // bit 50
    uint64_t ignored_51_58 : 8;  // bits 58:51
    uint64_t reserved_59_63 : 5; // bits 63:59
} __attribute__((packed)) l2_descr_t;

// Bit-field view of a 64-bit last-level descriptor; aliased as pte_t_ on ARM builds.
// The widths add up to exactly 64.
// NOTE: bit ranges assume allocation from the least-significant bit.
typedef struct {
    uint64_t valid : 1;                    // bit 0
    uint64_t type : 1;                     // bit 1
    uint64_t attr_index : 3;               // bits 4:2
    uint64_t non_secure : 1;               // bit 5
    uint64_t access_permissions : 2;       // bits 7:6
    uint64_t shareability : 2;             // bits 9:8
    uint64_t access_flag : 1;              // bit 10
    uint64_t not_global : 1;               // bit 11
    uint64_t paddr : 38;                   // bits 49:12
    uint64_t guarded : 1;                  // bit 50
    uint64_t dirty : 1;                    // bit 51
    uint64_t contiguous : 1;               // bit 52
    uint64_t privileged_execute_never : 1; // bit 53
    uint64_t execute_never : 1;            // bit 54
    uint64_t reserved_58_55 : 4;           // bits 58:55
    uint64_t ignored_63_59 : 5;            // bits 63:59
} __attribute__((packed)) l3_descr_t;

// ARM counterpart of the x86 set_user_bit(). Currently a stub: the body is empty, so the
// descriptor is left untouched. l3_descr_t has no user_supervisor field, so the commented-out
// line cannot be enabled as-is.
// NOTE(review): the equivalent is presumably a change to access_permissions - confirm.
static inline void set_user_bit(l3_descr_t *pte)
{
    // pte->user_supervisor = 1;  // TODO
}

typedef l3_descr_t pte_t_;

#endif // ARCH_X86_64

#endif // _PAGE_TABLES_COMMON_H_


================================================
FILE: rvzr/executor_km/include/page_tables_guest.h
================================================
/// File: Dispatch header that includes the guest page table definitions for the architecture
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#ifndef _GUEST_PAGE_TABLES_H_
#define _GUEST_PAGE_TABLES_H_

#include "hardware_desc.h"
#include "page_tables_common.h"
#include "sandbox_manager.h"

// =================================================================================================
// Memory layout
// =================================================================================================

// start of the guest's physical and virtual memory; both address spaces currently start at 0
#define GUEST_P_MEMORY_START 0
#define GUEST_V_MEMORY_START 0x0ULL
#define GUEST_MEMORY_SIZE    (512 * 4096) // max size that could be mapped by a single last-level PT

// =================================================================================================
// Extended page tables
// =================================================================================================
#if defined(ARCH_X86_64)

// Kernel Constant Compatibility
#ifndef VMX_BASIC_MEM_TYPE_WB
#define VMX_BASIC_MEM_TYPE_WB 6LLU
#endif

// Memory layout within the guest memory
// One table per paging level of an actor's guest page tables, stored back to back from the
// last level (l1, PT) up to the top level (l4, PML4); each table has ENTRIES_PER_PAGE entries.
typedef struct {
    pte_t_ l1[ENTRIES_PER_PAGE];  // PT
    pdte_t l2[ENTRIES_PER_PAGE];  // PDT
    pdpte_t l3[ENTRIES_PER_PAGE]; // PDPT
    pml4e_t l4[ENTRIES_PER_PAGE]; // PML4
} actor_page_table_t;

// Extended-page-table counterpart of actor_page_table_t: one table per EPT level, stored back
// to back from the last level (l1) up to the top level (l4), ENTRIES_PER_PAGE entries each.
typedef struct {
    epte_t_ l1[ENTRIES_PER_PAGE];  // EPT PT
    epdte_t l2[ENTRIES_PER_PAGE];  // EPT PDT
    epdpte_t l3[ENTRIES_PER_PAGE]; // EPT PDPT
    epml4e_t l4[ENTRIES_PER_PAGE]; // EPT PML4
} actor_ept_t;

// Storage for an actor's GDT: PAGE_SIZE raw bytes; the descriptor format is not modelled here.
typedef struct {
    uint8_t entries[PAGE_SIZE];
} __attribute__((packed)) actor_gdt_t;

// Guest memory layout; it is identical for both physical and virtual memory
// The struct is packed, so the regions follow each other with no padding in exactly this
// order; guest_memory_translations_t lists the same regions in the same order.
typedef struct {
    util_t util;                          // utility area (see sandbox_manager.h)
    actor_data_t data;                    // actor data area
    actor_code_t code;                    // actor code area
    uint8_t vmlaunch_page[PAGE_SIZE];     // one page; presumably holds the VM entry code - confirm
    actor_gdt_t gdt;                      // one page of GDT storage
    actor_page_table_t guest_page_tables; // guest page tables, l1..l4
} __attribute__((packed)) guest_memory_t;

// Translation from virtual to guest and host physical addresses
// One record groups the four addresses that (per the field names) refer to the same page.
typedef struct {
    uint64_t hpa; // host physical address
    uint64_t gpa; // guest physical address
    void *gva;    // guest virtual address
    void *hva;    // host virtual address
} __attribute__((packed)) hgpa_t;

// Specialized translation data structure to speed up virtual-to-physical translations
// Holds one hgpa_t per page of every region of guest_memory_t, in the same region order.
// The util/data/code counts are derived from the region sizes; the last three are hard-coded.
typedef struct {
    hgpa_t util[sizeof(util_t) / PAGE_SIZE];
    hgpa_t data[sizeof(actor_data_t) / PAGE_SIZE];
    hgpa_t code[sizeof(actor_code_t) / PAGE_SIZE];
    hgpa_t vmlaunch_page[1];
    hgpa_t gdt[1];
    // presumably one entry per level of actor_page_table_t (l1..l4), which holds only if each
    // level occupies exactly one page - TODO confirm against ENTRIES_PER_PAGE
    hgpa_t guest_page_tables[4];
} __attribute__((packed)) guest_memory_translations_t;

extern eptp_t *ept_ptr;

#elif defined(ARCH_ARM)

// nothing here yet

#endif // ARCH_ARM

// =================================================================================================
// Public interfaces
// =================================================================================================
int dbg_dump_guest_page_tables(int actor_id);
int dbg_dump_ept(int actor_id);

int map_sandbox_to_guest_memory(void);

void set_faulty_page_guest_permissions(void);
void restore_faulty_page_guest_permissions(void);

void set_faulty_page_ept_permissions(void);
void restore_faulty_page_ept_permissions(void);

int allocate_guest_page_tables(void);
void free_guest_page_tables(void);

#endif // _GUEST_PAGE_TABLES_H_


================================================
FILE: rvzr/executor_km/include/page_tables_host.h
================================================
/// File: Header for page table functions
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#ifndef _PAGE_TABLE_H_
#define _PAGE_TABLE_H_

#include "page_tables_common.h"
#include <linux/kernel.h>

// Per-region arrays of page-table entries (pte_t_ values) for the sandbox data, code and util
// areas.
// NOTE(review): presumably the saved original entries used by store_orig_host_permissions() /
//               restore_orig_host_permissions() - confirm against the implementation.
typedef struct {
    pte_t_ *data_ptes;
    pte_t_ *code_ptes;
    pte_t_ *util_ptes;
} sandbox_ptes_t;

// Per-region arrays of pointers to page-table entries (pte_t_ *) for the sandbox data, code and
// util areas; unlike sandbox_ptes_t these reference entries rather than holding their values.
// NOTE(review): presumably filled by cache_host_pteps() - confirm against the implementation.
typedef struct {
    pte_t_ **data_pteps;
    pte_t_ **code_pteps;
    pte_t_ **util_pteps;
} sandbox_pteps_t;

extern sandbox_pteps_t *sandbox_pteps;

pte_t *get_pte(uint64_t hva);

int cache_host_pteps(void);
int store_orig_host_permissions(void);
int restore_orig_host_permissions(void);

int set_user_pages(void);
void set_faulty_page_host_permissions(void);
void restore_faulty_page_host_permissions(void);

int init_page_table_manager(void);
void free_page_table_manager(void);

#endif // _PAGE_TABLE_H_


================================================
FILE: rvzr/executor_km/include/perf_counters.h
================================================
/// File: Header for perf_counters.c
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#ifndef _PERF_COUNTERS_H_
#define _PERF_COUNTERS_H_

int pfc_configure(void);

int init_perf_counters(void);
void free_perf_counters(void);

#endif // _PERF_COUNTERS_H_


================================================
FILE: rvzr/executor_km/include/sandbox_constants.h
================================================
/// File: Collection of constants that define the layout of the sandbox;
///       This file is intentionally separate from sandbox_manager.h so that
///       it can be included in assembly files as well.
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#ifndef _SANDBOX_CONSTANTS_H_
#define _SANDBOX_CONSTANTS_H_

#include "hardware_desc.h"

#define SIZE_UINT64 (8)

// layout of util_t
#define UTIL_VARS_MAX         4096
#define L1D_PRIMING_AREA_SIZE (L1D_SIZE_KB * 1024ULL)
#define STORED_RSP_SIZE       SIZE_UINT64
#define MEASUREMENT_SIZE      56ULL // see measurement.h
#define NESTED_FAULT_SIZE     SIZE_UINT64

// layout of actor_data_t
#define MACRO_STACK_SIZE   64
#define UNDERFLOW_PAD_SIZE (4096 - MACRO_STACK_SIZE)
#define MAIN_AREA_SIZE     4096
#define FAULTY_AREA_SIZE   4096
#define REG_INIT_AREA_SIZE 320 // 8 64-bit GPRs + 8 256-bit YMMs
#define OVERFLOW_PAD_SIZE  (4096 - REG_INIT_AREA_SIZE)

// Section sizes
#define MAX_EXPANDED_SECTION_SIZE (0x1000ULL * 2)
#define MAX_EXPANDED_MACROS_SIZE  (0x1000ULL)

// offsets w.r.t. the base of util_t (r15 will be initialized to point there)
// Each offset is the previous offset plus the size of the previous slot, following the field
// order of util_t / util_vars_t in sandbox_manager.h: l1d_priming_area, stored_rsp,
// latest_measurement, unused1, k2u_target_address, u2k_target_address.
// NESTED_FAULT_SIZE is used as the size of the unused1 slot.
// The k2u/u2k fields exist in util_vars_t only on ARCH_ARM builds; on x86 the same offsets
// fall inside its unused[] padding.
#define L1D_PRIMING_OFFSET (0)
#define UTIL_VARS_OFFSET   (L1D_PRIMING_OFFSET + L1D_PRIMING_AREA_SIZE)
#define STORED_RSP_OFFSET  (UTIL_VARS_OFFSET + 0)
#define MEASUREMENT_OFFSET (STORED_RSP_OFFSET + STORED_RSP_SIZE)
#define UNUSED1_OFFSET     (MEASUREMENT_OFFSET + MEASUREMENT_SIZE)
#define K2U_TARGET_OFFSET  (UNUSED1_OFFSET + NESTED_FAULT_SIZE)
#define U2K_TARGET_OFFSET  (K2U_TARGET_OFFSET + SIZE_UINT64)

// offsets of util_t w.r.t. the base of main_area of the main actor
#define UTIL_REL_TO_MAIN                                                                           \
    (L1D_PRIMING_AREA_SIZE + UTIL_VARS_MAX + UNDERFLOW_PAD_SIZE + MACRO_STACK_SIZE)

// offsets w.r.t. the base of main_area of the current actor (r14 will contain the base)
#define MACRO_STACK_TOP_OFFSET (UNDERFLOW_PAD_SIZE)
#define MAIN_AREA_OFFSET       (0)
#define FAULTY_AREA_OFFSET     (MAIN_AREA_SIZE)
#define REG_INIT_OFFSET        (FAULTY_AREA_OFFSET + FAULTY_AREA_SIZE)
#define OVERFLOW_PAD_OFFSET    (REG_INIT_OFFSET + REG_INIT_AREA_SIZE)
#define LOCAL_RSP_OFFSET       (FAULTY_AREA_OFFSET - 8)

// area page IDs
#define MAIN_PAGE_ID   ((MACRO_STACK_SIZE + UNDERFLOW_PAD_SIZE) / 4096)
#define FAULTY_PAGE_ID ((MACRO_STACK_SIZE + UNDERFLOW_PAD_SIZE + MAIN_AREA_SIZE) / 4096)

// number of pages for each component
#define N_UTIL_PAGES           (sizeof(util_t) / 4096)
#define N_DATA_PAGES_PER_ACTOR (sizeof(actor_data_t) / 4096)
#define N_CODE_PAGES_PER_ACTOR (sizeof(actor_code_t) / 4096)

#endif // _SANDBOX_CONSTANTS_H_


================================================
FILE: rvzr/executor_km/include/sandbox_manager.h
================================================
/// File: Header for sandbox management
///       See docs/sandbox.md for the description of the sandboxing mechanism.
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#ifndef _SANDBOX_MANAGER_H_
#define _SANDBOX_MANAGER_H_

#include <linux/types.h>

#include "sandbox_constants.h"

#include "hardware_desc.h" // L1D_ASSOCIATIVITY
#include "measurement.h"   // measurement_t

// =================================================================================================
// Sandbox data layout
// =================================================================================================
/// @brief Area with test-case global variables that are used to communicate with the executor
///        and store intermediate results
///
///        The trailing unused[] array pads the struct to UTIL_VARS_MAX bytes on both
///        architectures: its length is UTIL_VARS_MAX minus sizeof(measurement_t) minus the
///        number of uint64_t fields declared before it (2 on x86, 4 on ARM).
///        The struct is not packed, so this relies on the compiler inserting no padding.
typedef struct {
    uint64_t stored_rsp;              // stores the stack pointer before calling the test case
    measurement_t latest_measurement; // measurement results
    uint64_t unused1;                 // placeholder slot; keeps the following offsets stable
#ifdef ARCH_X86_64
    uint8_t unused[UTIL_VARS_MAX - sizeof(measurement_t) - (2 * sizeof(uint64_t))];
#elif defined(ARCH_ARM)
    uint64_t k2u_target_address; // target address for k2u switches
    uint64_t u2k_target_address; // target address for u2k switches
    uint8_t unused[UTIL_VARS_MAX - sizeof(measurement_t) - (4 * sizeof(uint64_t))];
#endif // ARCH_ARM
} util_vars_t;

/// @brief Utility data structure used by various primitives in the test case.
///        Must be allocated strictly before the main actor data as its code accesses
///        fields of util_t by using constant offsets from the base of its main_area.
///
///        Layout (packed): L1D_PRIMING_AREA_SIZE bytes of priming area, immediately followed
///        by the util_vars_t block; the *_OFFSET constants in sandbox_constants.h follow
///        this order.
typedef struct {
    uint8_t l1d_priming_area[L1D_PRIMING_AREA_SIZE];
    util_vars_t vars;
} __attribute__((packed)) util_t;

/// @brief Data structure representing the memory accessible by the actor's code
///
///        With the sizes from sandbox_constants.h the (packed) struct spans four 4096-byte
///        pages: macro_stack + underflow_pad (64 + 4032), main_area, faulty_area, and
///        reg_init_area + overflow_pad (320 + 3776).
typedef struct {
    uint8_t macro_stack[MACRO_STACK_SIZE];     // stack for storing registers when calling macros
    uint8_t underflow_pad[UNDERFLOW_PAD_SIZE]; // zero-initialized region for accidental underflows
    uint8_t main_area[MAIN_AREA_SIZE];         // first input page; does not cause faults
    uint8_t faulty_area[FAULTY_AREA_SIZE];     // second input page; causes a (configurable) fault
    uint8_t reg_init_area[REG_INIT_AREA_SIZE]; // region for initializing registers
    uint8_t overflow_pad[OVERFLOW_PAD_SIZE];   // zero-initialized region for accidental overflows
} __attribute__((packed)) actor_data_t;

// =================================================================================================
// Sandbox code layout
// =================================================================================================
/// @brief Code area of one actor: the section bytes followed directly by the macro bytes.
///        With the sizes from sandbox_constants.h this is 0x2000 + 0x1000 bytes.
typedef struct {
    uint8_t section[MAX_EXPANDED_SECTION_SIZE]; // MAX_EXPANDED_SECTION_SIZE bytes of section code
    uint8_t macros[MAX_EXPANDED_MACROS_SIZE];   // MAX_EXPANDED_MACROS_SIZE bytes of macro code
} __attribute__((packed)) actor_code_t;

// =================================================================================================
// sandbox_t
// =================================================================================================
/// @brief Handle to the sandbox memory: pointers to its data, code and util areas.
///        NOTE(review): data and code presumably point to per-actor arrays - confirm against
///        allocate_sandbox().
typedef struct {
    actor_data_t *data;
    actor_code_t *code;
    util_t *util;
} sandbox_t;

// =================================================================================================
// Sandbox manager interface
// =================================================================================================
extern sandbox_t *sandbox;

int get_sandbox_size_pages(void);

int set_sandbox_page_tables(void);
void restore_orig_sandbox_page_tables(void);

void set_faulty_page_permissions(void);
void restore_faulty_page_permissions(void);

int allocate_sandbox(void);
void reset_code_area(void);

int init_sandbox_manager(void);
void free_sandbox_manager(void);

#endif // _SANDBOX_MANAGER_H_


================================================
FILE: rvzr/executor_km/include/shortcuts.h
================================================
/// File: Header for common macros
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#ifndef KM_SHORTCUTS_H
#define KM_SHORTCUTS_H

#include "hardware_desc.h"
#include <asm/io.h>
#include <linux/kernel.h>
#include <linux/mm.h>
#include <linux/slab.h>    // kfree, kmalloc
#include <linux/vmalloc.h> // vfree, vmalloc

#ifdef ARCH_X86_64
#include <../arch/x86/include/asm/desc.h>
#endif

// =================================================================================================
// Strings and assembly
// =================================================================================================
// STRINGIFY turns its whole argument list into one string literal, without expanding macros
// that appear in the arguments.
#define STRINGIFY(...) #__VA_ARGS__

// str(s) stringifies s as written; xstr(s) routes through _str so that s is macro-expanded
// first and the *expansion* is stringified (e.g. a #define'd constant becomes its value).
#define xstr(s) _str(s)
#define _str(s) str(s)
#define str(s)  #s

// Emit the string literal ASM as a volatile inline-assembly statement: the text is bracketed by
// an `.intel_syntax noprefix` directive before it and an `.att_syntax noprefix` directive after
// it. ASM is pasted directly in front of the closing directive, so it should end with a newline
// (or statement separator). No operands or clobbers can be passed through this macro.
// clang-format off
#define asm_volatile_intel(ASM)                                                                    \
    asm volatile("\n.intel_syntax noprefix\n"                                                      \
                    ASM                                                                            \
                 ".att_syntax noprefix\n")
// clang-format on

// =================================================================================================
// MSR access
// =================================================================================================
#ifdef ARCH_X86_64
// wrmsr64(msr, value): write a 64-bit value to an MSR via the kernel's native_write_msr().
// rdmsr64(msr):        read an MSR via the kernel's native_read_msr().
//
// Kernel 6.16+ changed native_write_msr signature from (msr, low, high) to (msr, val)
#include <linux/version.h>
#if LINUX_VERSION_CODE >= KERNEL_VERSION(6, 16, 0)
#define wrmsr64(msr, value) native_write_msr(msr, value)
#else
// The value is widened to 64 bits before it is split into halves: shifting a narrower argument
// (e.g. a plain int constant) right by 32 would be undefined behaviour. Widening first also
// yields the same halves the single-argument path above produces for such arguments.
#define wrmsr64(msr, value)                                                                        \
    native_write_msr(msr, (uint32_t)(uint64_t)(value), (uint32_t)((uint64_t)(value) >> 32))
#endif
#define rdmsr64(msr) native_read_msr(msr)
#elif defined(ARCH_ARM)
// write_msr(NAME, VALUE) / read_msr(NAME, VAR): access the system register NAME with msr/mrs,
// followed by an isb. NAME must be a string literal (it is pasted into the assembly text);
// VAR must be an lvalue that receives the value read.
// NOTE: both expansions already end with a semicolon.
#define write_msr(NAME, VALUE) asm volatile("msr " NAME ", %0\n isb\n" ::"r"(VALUE));
#define read_msr(NAME, VAR)    asm volatile("mrs %0, " NAME "\n isb\n" : "=r"(VAR));
#endif

// =================================================================================================
// Bit manipulation
// =================================================================================================
#define BIT_(x) (1ULL << (x))

// =================================================================================================
// Logging and error handling
// =================================================================================================
// printk wrappers that prefix every message with "[rvzr_executor]" (or "[rvzr_executor:<src>]"
// for the *S variants). `msg` and `src` must be string literals because they are concatenated
// with the prefix at compile time; remaining arguments are forwarded as printk format arguments.
//
// PRINT_ERR / PRINT_ERRS log at KERN_ERR and expand to a single do { } while (0) statement.
#define PRINT_ERR(msg, ...)                                                                        \
    do {                                                                                           \
        printk(KERN_ERR "[rvzr_executor] " msg, ##__VA_ARGS__);                                    \
    } while (0)
#define PRINT_ERRS(src, msg, ...)                                                                  \
    do {                                                                                           \
        printk(KERN_ERR "[rvzr_executor:" src "] " msg, ##__VA_ARGS__);                            \
    } while (0)

// PRINT_WARN / PRINT_WARNS log at KERN_WARNING.
// NOTE: unlike the error variants, these expand to a bare printk call that already ends with
//       a semicolon, so `if (c) PRINT_WARN(...); else ...` does not compile.
#define PRINT_WARN(msg, ...) printk(KERN_WARNING "[rvzr_executor] " msg, ##__VA_ARGS__);
#define PRINT_WARNS(src, msg, ...)                                                                 \
    printk(KERN_WARNING "[rvzr_executor:" src "] " msg, ##__VA_ARGS__);

// Assertion helpers. When `condition` is false they log "Assertion failed: <condition text>"
// through PRINT_ERRS (tagged with `src`) and RETURN FROM THE CALLING FUNCTION; they do nothing
// when the condition holds. The condition text is produced with xstr(), so macros inside the
// condition appear expanded in the log.
// NOTE: each macro expands to a bare `if { ... }` block, so it must not be used as the
//       unbraced body of an `if` that has an `else`.

// For functions returning an int error code: returns -EIO on failure.
#define ASSERT(condition, src)                                                                     \
    if (!(condition)) {                                                                            \
        PRINT_ERRS(src, "Assertion failed: " xstr(condition) "\n");                                \
        return -EIO;                                                                               \
    }

// Same as ASSERT, with an additional printk-style message `msg` (string literal) and arguments.
#define ASSERT_MSG(condition, src, msg, ...)                                                       \
    if (!(condition)) {                                                                            \
        PRINT_ERRS(src, "Assertion failed: " xstr(condition) ";\n" msg, ##__VA_ARGS__);            \
        return -EIO;                                                                               \
    }

// For functions returning a pointer: returns NULL on failure.
#define ASSERT_ENULL(condition, src)                                                               \
    if (!(condition)) {                                                                            \
        PRINT_ERRS(src, "Assertion failed: " xstr(condition) "\n");                                \
        return NULL;                                                                               \
    }

// Pointer-returning counterpart of ASSERT_MSG: when `condition` is false, logs the stringified
// condition followed by the printk-style message `msg` (a string literal, with optional format
// arguments) through PRINT_ERRS and returns NULL from the calling function.
// `msg` is an explicit parameter because the expansion concatenates it into the format string.
#define ASSERT_MSG_ENULL(condition, src, msg, ...)                                                 \
    if (!(condition)) {                                                                            \
        PRINT_ERRS(src, "Assertion failed: " xstr(condition) ";" msg, ##__VA_ARGS__);              \
        return NULL;                                                                               \
    }

// If the caller's variable `err` (which must be in scope; it is not a macro parameter) is
// non-zero, log " Error [<msg>]" and return -EIO from the calling function. The original value
// of `err` is not propagated. `msg` must be a string literal.
#define CHECK_ERR(msg)                                                                             \
    if (err) {                                                                                     \
        PRINT_ERR(" Error [" msg "]\n");                                                           \
        return -EIO;                                                                               \
    }

// Log "Unimplemented" (tagged with `src`, a string literal) and return -ENOSYS from the calling
// function. Both statements live in one compound statement so that the macro behaves as a
// single unit when it is the unbraced body of an `if` or loop; as two bare statements only the
// log call would be guarded and the `return` would always execute.
// Call sites may keep (or omit) the trailing semicolon.
#define UNIMPLEMENTED(src)                                                                         \
    {                                                                                              \
        PRINT_ERRS(src, "Unimplemented\n");                                                        \
        return -ENOSYS;                                                                            \
    }

// =================================================================================================
// Memory management
// =================================================================================================
// NOLINTBEGIN(bugprone-macro-parentheses)

// kmalloc/kzalloc wrappers written as GNU statement expressions: they evaluate to the
// allocated pointer, or - when the allocation fails - log an error and return -ENOMEM FROM THE
// CALLING FUNCTION. They are therefore only usable inside functions returning an int-compatible
// error code, and anything the caller allocated earlier is not released by the macro.
// NOTE: the size expression `x` is evaluated in a scope that declares a local named `ptr`, so
//       it must not itself refer to a caller variable called `ptr`.
#define CHECKED_MALLOC(x)                                                                          \
    ({                                                                                             \
        void *ptr = kmalloc(x, GFP_KERNEL);                                                        \
        if (!ptr) {                                                                                \
            PRINT_ERR(" Error allocating memory\n");                                               \
            return -ENOMEM;                                                                        \
        }                                                                                          \
        ptr;                                                                                       \
    })
#define CHECKED_ZALLOC(x)                                                                          \
    ({                                                                                             \
        void *ptr = kzalloc(x, GFP_KERNEL);                                                        \
        if (!ptr) {                                                                                \
            PRINT_ERR(" Error zero-allocating memory\n");                                          \
            return -ENOMEM;                                                                        \
        }                                                                                          \
        ptr;                                                                                       \
    })
// kfree `x` if it is non-NULL and reset it to NULL; `x` must be an assignable lvalue and is
// evaluated more than once. Expands to a bare `if` block (no do/while wrapper).
#define SAFE_FREE(x)                                                                               \
    if (x) {                                                                                       \
        kfree(x);                                                                                  \
        x = NULL;                                                                                  \
    }

// vmalloc counterpart of CHECKED_MALLOC: evaluates to the allocated pointer, or logs an error
// and returns -ENOMEM from the calling function when vmalloc fails.
// NOTE: `x` must not refer to a caller variable named `ptr` (shadowed inside the macro).
#define CHECKED_VMALLOC(x)                                                                         \
    ({                                                                                             \
        void *ptr = vmalloc(x);                                                                    \
        if (!ptr) {                                                                                \
            PRINT_ERR(" Error allocating memory\n");                                               \
            return -ENOMEM;                                                                        \
        }                                                                                          \
        ptr;                                                                                       \
    })
// vfree `x` if it is non-NULL and reset it to NULL; `x` must be an assignable lvalue and is
// evaluated more than once. Expands to a bare `if` block (no do/while wrapper).
#define SAFE_VFREE(x)                                                                              \
    if (x) {                                                                                       \
        vfree(x);                                                                                  \
        x = NULL;                                                                                  \
    }

// Allocate enough pages to hold `size` bytes: the request is made with order get_order(size).
// Evaluates to the resulting `struct page *`, or logs an error and returns -ENOMEM from the
// calling function when alloc_pages fails.
// NOTE: `size` must not refer to a caller variable named `ptr` (shadowed inside the macro).
#define CHECKED_ALLOC_PAGES(size)                                                                  \
    ({                                                                                             \
        struct page *ptr = alloc_pages(GFP_KERNEL, get_order(size));                               \
        if (!ptr) {                                                                                \
            PRINT_ERR(" Error allocating pages\n");                                                \
            return -ENOMEM;                                                                        \
        }                                                                                          \
        ptr;                                                                                       \
    })

// Release pages obtained with CHECKED_ALLOC_PAGES and reset `x` to NULL. `size` must be the
// same byte size that was used for the allocation, because the order is recomputed from it.
// `x` must be an assignable lvalue; expands to a bare `if` block (no do/while wrapper).
#define SAFE_PAGES_FREE(x, size)                                                                   \
    if (x) {                                                                                       \
        __free_pages(x, get_order(size));                                                          \
        x = NULL;                                                                                  \
    }

// NOLINTEND(bugprone-macro-parentheses)

// =================================================================================================
// Call sequences
// =================================================================================================
// CALL_16_TIMES(macro, arg, id): expand `macro(arg, <id><d>)` once for every hexadecimal digit
// d in 0..f, where <id><d> is the token formed by pasting `id` and d together. The expansions
// are emitted back to back with no separator, so `macro` must supply its own.
#define CALL_16_TIMES(macro, arg, id)                                                              \
    macro(arg, id##0) macro(arg, id##1) macro(arg, id##2) macro(arg, id##3) macro(arg, id##4)      \
        macro(arg, id##5) macro(arg, id##6) macro(arg, id##7) macro(arg, id##8) macro(arg, id##9)  \
            macro(arg, id##a) macro(arg, id##b) macro(arg, id##c) macro(arg, id##d)                \
                macro(arg, id##e) macro(arg, id##f)
// CALL_256_TIMES(macro, arg): run CALL_16_TIMES for every leading digit 0..f, i.e. expand
// `macro(arg, XY)` for all 256 two-digit hexadecimal tokens 00..ff, in ascending order.
#define CALL_256_TIMES(macro, arg)                                                                 \
    CALL_16_TIMES(macro, arg, 0)                                                                   \
    CALL_16_TIMES(macro, arg, 1)                                                                   \
    CALL_16_TIMES(macro, arg, 2)                                                                   \
    CALL_16_TIMES(macro, arg, 3)                                                                   \
    CALL_16_TIMES(macro, arg, 4)                                                                   \
    CALL_16_TIMES(macro, arg, 5)                                                                   \
    CALL_16_TIMES(macro, arg, 6)                                                                   \
    CALL_16_TIMES(macro, arg, 7)                                                                   \
    CALL_16_TIMES(macro, arg, 8)                                                                   \
    CALL_16_TIMES(macro, arg, 9)                                                                   \
    CALL_16_TIMES(macro, arg, a)                                                                   \
    CALL_16_TIMES(macro, arg, b)                                                                   \
    CALL_16_TIMES(macro, arg, c)                                                                   \
    CALL_16_TIMES(macro, arg, d)                                                                   \
    CALL_16_TIMES(macro, arg, e)                                                                   \
    CALL_16_TIMES(macro, arg, f)

// =================================================================================================
// Address translation
// =================================================================================================

/// @brief Look up the physical address of the page backing a vmalloc'ed virtual address
/// @param hva Host virtual address, resolved with vmalloc_to_page()
/// @return page_to_phys() of the backing page, or 0 when vmalloc_to_page() finds no page.
///         The offset of hva within its page is not added to the result.
static inline uint64_t vmalloc_to_phys(void *hva)
{
    struct page *backing_page = vmalloc_to_page(hva);

    return backing_page ? page_to_phys(backing_page) : 0;
}

/// @brief Issue the architecture's TLB-invalidation instruction for one virtual address
/// @param hva Host virtual address whose translation should be invalidated
///
/// x86-64: executes `invlpg` on the address.
/// ARM:    executes `tlbi vale1is` between two `dsb` barriers; the operand is the address
///         shifted right by 12 and masked to its low 44 bits.
/// On any other architecture the function body is empty.
static inline void native_page_invalidate(uint64_t hva)
{
#ifdef ARCH_X86_64
    asm volatile("invlpg (%0)" ::"r"(hva) : "memory");
#elif defined(ARCH_ARM)
    // drop the in-page offset (12 bits) and keep 44 bits of the remaining page number
    const uint64_t tlbi_operand = (hva >> 12) & 0xfffffffffffULL;

    asm volatile("dsb ishst\n tlbi vale1is, %0\n dsb ish\n" ::"r"(tlbi_operand) : "memory");
#endif
}

#endif // KM_SHORTCUTS_H


================================================
FILE: rvzr/executor_km/include/special_registers.h
================================================
/// File: Header for msr.c
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#ifndef _MSR_H_
#define _MSR_H_

#include <linux/types.h>
#include "hardware_desc.h"

/// @brief Structure to hold the state of special registers (MSRs and other system registers)
///        that need to be preserved by the kernel module. This ensures that the host system
///        remains stable despite the potentially unsafe operations performed by the
///        executor and the sandboxed code.
///
///        The struct is packed: the x86-64 variant is ten 64-bit fields followed by the 16-bit
///        gdtr_limit (82 bytes, no tail padding); the ARM variant is four 64-bit fields.
///        If neither ARCH_X86_64 nor ARCH_ARM is defined the struct has no members.
typedef struct {
#if defined(ARCH_X86_64)
    uint64_t cr0;
    uint64_t cr4;
    uint64_t efer;
    uint64_t lstar;
    uint64_t spec_ctrl;
    uint64_t prefetcher_ctrl;
    uint64_t syscfg;
    uint64_t fs_base;
    uint64_t gs_base;
    uint64_t gdtr_base;
    uint16_t gdtr_limit; // 16-bit, unlike the other fields
#elif defined(ARCH_ARM)
    uint64_t spsr_el1;
    uint64_t sp_el0;
    uint64_t sp_el1;
    uint64_t elr_el1;
#endif
} __attribute__((packed)) special_registers_t;

extern special_registers_t *orig_special_registers_state;

int set_special_registers(void);
void restore_special_registers(void);

int init_special_register_manager(void);
void free_special_register_manager(void);


#endif // _MSR_H_


================================================
FILE: rvzr/executor_km/include/svm.h
================================================
/// File: Header for svm.c
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#ifndef _RVZR_EXECUTOR_SVM_H_
#define _RVZR_EXECUTOR_SVM_H_

#include <asm/svm.h>
#include <linux/types.h>

#include "svm_constants.h"

// =================================================================================================
// Virtual Machine Control Block (VMCB) definitions
#define VMCB_SIZE PAGE_SIZE

// Control area of the VMCB. The struct is packed, so every field sits at the byte offset
// obtained by summing the sizes of the fields before it; selected offsets are noted below.
// The trailing reserved_8 array pads the area to exactly 0x400 (1024) bytes.
typedef struct {
    uint32_t intercept_cr;         // 0x000
    uint32_t intercept_dr;         // 0x004
    uint32_t intercept_exceptions; // 0x008
    uint64_t intercept;            // 0x00C (not 8-byte aligned; relies on packing)
    uint32_t intercept_ext;        // 0x014
    uint8_t reserved_1[36];        // 0x018
    uint16_t pause_filter_thresh;  // 0x03C
    uint16_t pause_filter_count;   // 0x03E
    uint64_t iopm_base_pa;         // 0x040
    uint64_t msrpm_base_pa;        // 0x048
    uint64_t tsc_offset;           // 0x050
    uint32_t asid;                 // 0x058
    uint8_t tlb_ctl;               // 0x05C
    uint8_t reserved_2[3];
    uint32_t int_ctl;              // 0x060
    uint8_t int_vector;            // 0x064
    uint8_t reserved_3[3];
    uint8_t int_state;             // 0x068
    uint8_t reserved_4[7];
    uint64_t exit_code;            // 0x070
    uint64_t exit_info_1;          // 0x078
    uint64_t exit_info_2;          // 0x080
    uint64_t exit_int_info;        // 0x088
    uint64_t nested_ctl;           // 0x090
    uint64_t avic_vapic_bar;       // 0x098
    uint8_t reserved_5[8];         // 0x0A0
    uint32_t event_inj;            // 0x0A8
    uint32_t event_inj_err;        // 0x0AC
    uint64_t nested_cr3;           // 0x0B0
    uint64_t virt_ext;             // 0x0B8
    uint32_t clean;                // 0x0C0
    uint32_t reserved_6;           // 0x0C4
    uint64_t next_rip;             // 0x0C8
    uint8_t insn_len;              // 0x0D0
    uint8_t insn_bytes[15];        // 0x0D1
    uint64_t avic_backing_page;    // 0x0E0
    uint8_t reserved_7[8];         // 0x0E8
    uint64_t avic_logical_id;      // 0x0F0
    uint64_t avic_physical_id;     // 0x0F8
    uint8_t reserved_8[768];       // 0x100 .. 0x3FF
} __attribute__((__packed__)) vmcb_control_t;

// 16-byte (packed) segment-register record used for every segment slot of vmcb_save_t.
typedef struct {
    uint16_t selector; // offset 0
    uint16_t attrib;   // offset 2
    uint32_t limit;    // offset 4
    uint64_t base;     // offset 8
} __attribute__((__packed__)) seg_t;

// State-save area of the VMCB. The struct is packed; offsets below are relative to the start
// of this struct and follow from summing the preceding field sizes (seg_t is 16 bytes).
// Total size: 0x298 bytes.
typedef struct {
    seg_t es;   // 0x000
    seg_t cs;   // 0x010
    seg_t ss;   // 0x020
    seg_t ds;   // 0x030
    seg_t fs;   // 0x040
    seg_t gs;   // 0x050
    seg_t gdtr; // 0x060
    seg_t ldtr; // 0x070
    seg_t idtr; // 0x080
    seg_t tr;   // 0x090
    uint8_t reserved_1[43]; // 0x0A0
    uint8_t cpl;            // 0x0CB
    uint8_t reserved_2[4];  // 0x0CC
    uint64_t efer;          // 0x0D0
    uint64_t reserved_2a;   // 0x0D8
    uint64_t perf_ctl0;     // 0x0E0
    uint64_t perf_ctr0;
    uint64_t perf_ctl1;
    uint64_t perf_ctr1;
    uint64_t perf_ctl2;
    uint64_t perf_ctr2;
    uint64_t perf_ctl3;
    uint64_t perf_ctr3;
    uint64_t perf_ctl4;
    uint64_t perf_ctr4;
    uint64_t perf_ctl5;
    uint64_t perf_ctr5;     // 0x138
    uint64_t reserved_3;    // 0x140
    // reserved_2a through reserved_3 together cover the same 112 bytes (0x0D8..0x147) that the
    // former single declaration `uint8_t reserved_3[112]` covered.
    uint64_t cr4;    // 0x148
    uint64_t cr3;    // 0x150
    uint64_t cr0;    // 0x158
    uint64_t dr7;    // 0x160
    uint64_t dr6;    // 0x168
    uint64_t rflags; // 0x170
    uint64_t rip;    // 0x178
    uint8_t reserved_4[88]; // 0x180
    uint64_t rsp;           // 0x1D8
    uint8_t reserved_5[24]; // 0x1E0
    uint64_t rax;            // 0x1F8
    uint64_t star;           // 0x200
    uint64_t lstar;          // 0x208
    uint64_t cstar;          // 0x210
    uint64_t sfmask;         // 0x218
    uint64_t kernel_gs_base; // 0x220
    uint64_t sysenter_cs;    // 0x228
    uint64_t sysenter_esp;   // 0x230
    uint64_t sysenter_eip;   // 0x238
    uint64_t cr2;            // 0x240
    uint8_t reserved_6[32];  // 0x248
    uint64_t g_pat;          // 0x268
    uint64_t dbgctl;         // 0x270
    uint64_t br_from;        // 0x278
    uint64_t br_to;          // 0x280
    uint64_t last_excp_from; // 0x288
    uint64_t last_excp_to;   // 0x290
} __attribute__((__packed__)) vmcb_save_t;

// Complete VMCB image: the 0x400-byte control area immediately followed by the state-save
// area, so `save` starts at byte offset 0x400. The struct (0x698 bytes) is smaller than
// VMCB_SIZE; the remainder of the VMCB page is not described by this type.
typedef struct {
    vmcb_control_t control; // offset 0x000
    vmcb_save_t save;       // offset 0x400
} __attribute__((packed)) vmcb_t;


// =================================================================================================
// Module interface
// Byte offset of the save.rip field from the start of a vmcb_t
#define VMCB_RIP_OFFSET offsetof(vmcb_t, save.rip)

// Global SVM state, defined in the implementation file.
// NOTE(review): judging by the names, svm_is_on tracks whether SVM operation is enabled and
// vmcb_hpas / vmcb_hvas hold host-physical / host-virtual addresses of the VMCBs - confirm
// against the implementation.
extern bool svm_is_on;
extern uint64_t *vmcb_hpas;
extern uint64_t *vmcb_hvas;

// SVM lifecycle and VMCB state management.
// NOTE(review): the exact contracts (return codes, required call order) are defined by the
// implementation, which is not visible from this header.
int svm_check_cpu_compatibility(void);
int start_svm_operation(void);
void stop_svm_operation(void);
int store_orig_vmcb_state(void);
void restore_orig_vmcb_state(void);
int set_vmcb_state(void);
int print_svm_exit_info(void);

// Module-level constructor / destructor for the SVM component
int init_svm(void);
void free_svm(void);

#endif // _RVZR_EXECUTOR_SVM_H_


================================================
FILE: rvzr/executor_km/include/svm_constants.h
================================================
/// File: Definitions of constants used by AMD SVM (Secure Virtual Machine) technology
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#include <asm/msr-index.h>

#ifndef _RVZR_EXECUTOR_SVM_CONSTANTS_H_
#define _RVZR_EXECUTOR_SVM_CONSTANTS_H_

// =================================================================================================
// Default values for configuration registers and VMCB fields

// Upper bound on the number of guests; the value is hardcoded here, although it
// could be read from cpuid
#define SVM_MAX_NUM_GUESTS 64 // DO NOT INCREASE without knowing exactly what you are doing

// -------------------------------------------------------------------------------------------------
// Guest control registers
// Each register has a pair of masks: MUST_SET_* lists bits expected to be 1 and
// MUST_CLEAR_* lists bits expected to be 0.
// NOTE(review): how the masks are applied/enforced is decided by the code that uses them.
#define MUST_SET_BITS_CR0_SVM_GUEST                                                                \
    (X86_CR0_PE | X86_CR0_PG | X86_CR0_NE | X86_CR0_WP | X86_CR0_AM | X86_CR0_ET)
#define MUST_CLEAR_BITS_CR0_SVM_GUEST (X86_CR0_NW | X86_CR0_CD)

#define MUST_SET_BITS_CR4_SVM_GUEST                                                                \
    (X86_CR4_PSE | X86_CR4_PAE | X86_CR4_MCE | X86_CR4_PGE | X86_CR4_PCE | X86_CR4_OSFXSR |        \
     X86_CR4_OSXMMEXCPT)
#define MUST_CLEAR_BITS_CR4_SVM_GUEST (X86_CR4_VME)

#define MUST_SET_BITS_EFER_SVM_GUEST   (EFER_SCE | EFER_LME | EFER_LMA | EFER_NX | EFER_SVME)
#define MUST_CLEAR_BITS_EFER_SVM_GUEST (EFER_LMSLE)

// -------------------------------------------------------------------------------------------------
// Segment attributes
// The same three attribute bits (P, L, WRITE) are required for CS, DS and SS
#define MUST_SET_BITS_CS_SVM_GUEST                                                                 \
    (SVM_SELECTOR_P_MASK | SVM_SELECTOR_L_MASK | SVM_SELECTOR_WRITE_MASK)
#define MUST_SET_BITS_DS_SVM_GUEST                                                                 \
    (SVM_SELECTOR_P_MASK | SVM_SELECTOR_L_MASK | SVM_SELECTOR_WRITE_MASK)
#define MUST_SET_BITS_SS_SVM_GUEST                                                                 \
    (SVM_SELECTOR_P_MASK | SVM_SELECTOR_L_MASK | SVM_SELECTOR_WRITE_MASK)

// -------------------------------------------------------------------------------------------------
// VMCB control fields

// =================================================================================================
// Kernel compatibility: Constant definitions that are either missing in the kernel, or are
// inconsistent between versions

// We define VMCB bits here, as the definitions within the kernel are not stable between versions
// The values are bit indices, not masks.
// Control register intercepts: the read intercept of CRn is bit n,
// the write intercept of CRn is bit 16 + n
#define VMCB_INTERCEPT_CR0_READ  0
#define VMCB_INTERCEPT_CR3_READ  3
#define VMCB_INTERCEPT_CR4_READ  4
#define VMCB_INTERCEPT_CR8_READ  8
#define VMCB_INTERCEPT_CR0_WRITE (16 + 0)
#define VMCB_INTERCEPT_CR3_WRITE (16 + 3)
#define VMCB_INTERCEPT_CR4_WRITE (16 + 4)
#define VMCB_INTERCEPT_CR8_WRITE (16 + 8)

// Debug register intercepts follow the same scheme: DRn read is bit n, DRn write is bit 16 + n
#define VMCB_INTERCEPT_DR0_READ  0
#define VMCB_INTERCEPT_DR1_READ  1
#define VMCB_INTERCEPT_DR2_READ  2
#define VMCB_INTERCEPT_DR3_READ  3
#define VMCB_INTERCEPT_DR4_READ  4
#define VMCB_INTERCEPT_DR5_READ  5
#define VMCB_INTERCEPT_DR6_READ  6
#define VMCB_INTERCEPT_DR7_READ  7
#define VMCB_INTERCEPT_DR0_WRITE (16 + 0)
#define VMCB_INTERCEPT_DR1_WRITE (16 + 1)
#define VMCB_INTERCEPT_DR2_WRITE (16 + 2)
#define VMCB_INTERCEPT_DR3_WRITE (16 + 3)
#define VMCB_INTERCEPT_DR4_WRITE (16 + 4)
#define VMCB_INTERCEPT_DR5_WRITE (16 + 5)
#define VMCB_INTERCEPT_DR6_WRITE (16 + 6)
#define VMCB_INTERCEPT_DR7_WRITE (16 + 7)

// Instruction/event intercept bit indices.
// The enumerators are numbered implicitly from 0, so the ORDER IS SIGNIFICANT:
// VMCB_INTERCEPT_INTR = 0 ... VMCB_INTERCEPT_SHUTDOWN = 31, and the numbering continues with
// VMCB_INTERCEPT_VMRUN = 32 ... VMCB_INTERCEPT_EFER_WRITE = 47.
// Do not insert, remove, or reorder entries without re-checking every user of these values.
enum {
    VMCB_INTERCEPT_INTR, // = 0
    VMCB_INTERCEPT_NMI,
    VMCB_INTERCEPT_SMI,
    VMCB_INTERCEPT_INIT,
    VMCB_INTERCEPT_VINTR,
    VMCB_INTERCEPT_SELECTIVE_CR0,
    VMCB_INTERCEPT_STORE_IDTR,
    VMCB_INTERCEPT_STORE_GDTR,
    VMCB_INTERCEPT_STORE_LDTR,
    VMCB_INTERCEPT_STORE_TR,
    VMCB_INTERCEPT_LOAD_IDTR,
    VMCB_INTERCEPT_LOAD_GDTR,
    VMCB_INTERCEPT_LOAD_LDTR,
    VMCB_INTERCEPT_LOAD_TR,
    VMCB_INTERCEPT_RDTSC,
    VMCB_INTERCEPT_RDPMC,
    VMCB_INTERCEPT_PUSHF, // = 16
    VMCB_INTERCEPT_POPF,
    VMCB_INTERCEPT_CPUID,
    VMCB_INTERCEPT_RSM,
    VMCB_INTERCEPT_IRET,
    VMCB_INTERCEPT_INTn,
    VMCB_INTERCEPT_INVD,
    VMCB_INTERCEPT_PAUSE,
    VMCB_INTERCEPT_HLT,
    VMCB_INTERCEPT_INVLPG,
    VMCB_INTERCEPT_INVLPGA,
    VMCB_INTERCEPT_IOIO_PROT,
    VMCB_INTERCEPT_MSR_PROT,
    VMCB_INTERCEPT_TASK_SWITCH,
    VMCB_INTERCEPT_FERR_FREEZE,
    VMCB_INTERCEPT_SHUTDOWN, // = 31
    VMCB_INTERCEPT_VMRUN,    // = 32
    VMCB_INTERCEPT_VMMCALL,
    VMCB_INTERCEPT_VMLOAD,
    VMCB_INTERCEPT_VMSAVE,
    VMCB_INTERCEPT_STGI,
    VMCB_INTERCEPT_CLGI,
    VMCB_INTERCEPT_SKINIT,
    VMCB_INTERCEPT_RDTSCP,
    VMCB_INTERCEPT_ICEBP,
    VMCB_INTERCEPT_WBINVD,
    VMCB_INTERCEPT_MONITOR,
    VMCB_INTERCEPT_MWAIT,
    VMCB_INTERCEPT_MWAIT_COND,
    VMCB_INTERCEPT_XSETBV,
    VMCB_INTERCEPT_RDPRU,
    VMCB_INTERCEPT_EFER_WRITE, // = 47
};

// A second, independent group of intercept bit indices, again numbered implicitly from 0
// (VMCB_INTERCEPT_ALL_INVLPGB = 0 ... VMCB_INTERCEPT_HLT_IF_NOT_VINTR = 6).
// NOTE(review): these values overlap numerically with the enum above, so they presumably index
// a different intercept word of the VMCB - confirm at the use sites.
enum {
    VMCB_INTERCEPT_ALL_INVLPGB,
    VMCB_INTERCEPT_INVALID_INVLPGB,
    VMCB_INTERCEPT_INVPCID,
    VMCB_INTERCEPT_MCOMMIT,
    VMCB_INTERCEPT_TLBSYNC,
    VMCB_INTERCEPT_BUS_LOCK,
    VMCB_INTERCEPT_HLT_IF_NOT_VINTR,
};

#endif // _RVZR_EXECUTOR_SVM_CONSTANTS_H_


================================================
FILE: rvzr/executor_km/include/test_case_parser.h
================================================
/// File: Header for the test case parser and manager
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#ifndef _TEST_CASE_PARSER_H_
#define _TEST_CASE_PARSER_H_

#include "actor.h"

// Limits of the test case format
#define MAX_SECTIONS            MAX_ACTORS // at most one section per actor
#define MAX_SYMBOLS             128
#define MAX_SECTION_SIZE        4096 // NOTE: must be exactly 1 page to detect sysfs buffering
#define MAX_LOADED_SECTION_SIZE (4096 * 2)
// The test case header consists of two 64-bit values
#define TC_HEADER_SIZE          (2 * sizeof(uint64_t))

// Fixed-width (64-bit) types of the fields used in the test case tables below
typedef uint64_t section_size_t;
typedef uint64_t section_metadata_reserved_t;
typedef uint64_t section_id_t;
typedef uint64_t symbol_offset_t;
typedef uint64_t symbol_id_t;
typedef uint64_t symbol_args_t;

/// Metadata entry describing one section of the test case
typedef struct {
    actor_id_t owner;                     // ID of the actor the section belongs to
    section_size_t size;                  // presumably the section size in bytes - TODO confirm
    section_metadata_reserved_t reserved; // reserved field
} tc_section_metadata_entry_t;

/// One section of the test case: a fixed-size buffer of MAX_SECTION_SIZE bytes
typedef struct {
    char code[MAX_SECTION_SIZE];
} tc_section_t;

/// Entry of the test case symbol table
typedef struct {
    actor_id_t owner;       // ID of the actor the symbol belongs to
    symbol_offset_t offset; // presumably the offset within the owner's section - TODO confirm
    symbol_id_t id;         // symbol identifier
    symbol_args_t args;     // 64-bit argument word attached to the symbol
} tc_symbol_entry_t;

/// Boolean flags summarizing properties of the loaded test case
/// NOTE(review): the flags are presumably filled in by the test case parser - confirm
typedef struct {
    bool includes_vm_actors;
    bool includes_user_actors;
    bool has_explicit_fault_handler;
} tc_features_t;

/// In-memory representation of a test case: feature flags plus four tables
/// (actors, symbols, section metadata, sections), each with an accompanying size field
typedef struct {
    tc_features_t features;
    // Sizes of the four tables below
    // NOTE(review): presumably in bytes rather than in entries - confirm against the parser
    size_t actor_table_size;
    size_t symbol_table_size;
    size_t metadata_size;
    size_t sections_size;
    // The tables themselves
    actor_metadata_t *actor_table;
    tc_symbol_entry_t *symbol_table;
    tc_section_metadata_entry_t *metadata;
    tc_section_t *sections;
} test_case_t;

// The test case object shared with the rest of the module (defined in the implementation file)
extern test_case_t *test_case;

// Parser interface.
// NOTE(review): the signature mirrors parse_input_buffer() in input_parser.c (buffer, byte
// count, out-flag signalling completion); confirm the exact contract in the implementation.
ssize_t parse_test_case_buffer(const char *buf, size_t count, bool *finished);
bool tc_parsing_completed(void);
int init_test_case_parser(void);
void free_test_case_parser(void);

#endif // _TEST_CASE_PARSER_H_


================================================
FILE: rvzr/executor_km/include/vmx.h
================================================
/// File: Header for vmx.c
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#ifndef _RVZR_EXECUTOR_VMX_H_
#define _RVZR_EXECUTOR_VMX_H_

#include <asm/vmx.h>
#include <linux/types.h>

// =================================================================================================
// Kernel compatibility
// Each group below maps one of two alternative kernel names for the same constant onto a single
// local name, and fails the build if neither name is available.

// FEATURE_VMX_ENABLED_OUTSIDE_SMX: FEAT_CTL_* name or FEATURE_CONTROL_* name
#ifdef FEAT_CTL_VMX_ENABLED_OUTSIDE_SMX
#define FEATURE_VMX_ENABLED_OUTSIDE_SMX FEAT_CTL_VMX_ENABLED_OUTSIDE_SMX
#elif defined(FEATURE_CONTROL_VMXON_ENABLED_OUTSIDE_SMX)
#define FEATURE_VMX_ENABLED_OUTSIDE_SMX FEATURE_CONTROL_VMXON_ENABLED_OUTSIDE_SMX
#else
#error "FEATURE_VMX_ENABLED_OUTSIDE_SMX not defined"
#endif

// FEATURE_CTL_LOCKED: FEAT_CTL_LOCKED or FEATURE_CONTROL_LOCKED
#ifdef FEAT_CTL_LOCKED
#define FEATURE_CTL_LOCKED FEAT_CTL_LOCKED
#elif defined(FEATURE_CONTROL_LOCKED)
#define FEATURE_CTL_LOCKED FEATURE_CONTROL_LOCKED
#else
#error "FEATURE_CTL_LOCKED not defined"
#endif

// MSR_FEATURE_CONTROL: MSR_IA32_FEAT_CTL or MSR_IA32_FEATURE_CONTROL
#ifdef MSR_IA32_FEAT_CTL
#define MSR_FEATURE_CONTROL MSR_IA32_FEAT_CTL
#elif defined(MSR_IA32_FEATURE_CONTROL)
#define MSR_FEATURE_CONTROL MSR_IA32_FEATURE_CONTROL
#else
#error "MSR_FEATURE_CONTROL not defined"
#endif

// Fall back to SECONDARY_EXEC_ENABLE_XSAVES when SECONDARY_EXEC_XSAVES is not provided
#ifndef SECONDARY_EXEC_XSAVES
#define SECONDARY_EXEC_XSAVES SECONDARY_EXEC_ENABLE_XSAVES
#endif

// =================================================================================================
// Host VMX data structures
#define VMXON_SIZE 4096 // 4KB, as defined in SDM "Enabling and Entering VMX Operation"
#define VMCS_SIZE  4096 // 4KB, as defined in SDM "Format of the VMCS Region"

/// VMXON region: a 4-byte header followed by opaque data, VMXON_SIZE bytes in total.
/// The revision identifier occupies bits 30:0 of the first dword and bit 31 is the separate
/// top bit, so the identifier field must be 31 bits wide (a 30-bit field would both truncate
/// the identifier and place `reserved_31` at bit 30 instead of bit 31).
typedef struct {
    uint32_t revision_id : 31; // bits 30:0
    uint32_t reserved_31 : 1;  // bit 31
    uint8_t data[VMXON_SIZE - 4];
} __attribute__((packed)) vmxon_region_t;

/// VMCS region: an 8-byte header (revision identifier + abort indicator) followed by opaque
/// data, VMCS_SIZE bytes in total.
/// The revision identifier occupies bits 30:0 of the first dword and bit 31 is the separate
/// top bit, so the identifier field must be 31 bits wide (a 30-bit field would both truncate
/// the identifier and place `reserved_31` at bit 30 instead of bit 31).
typedef struct {
    uint32_t revision_id : 31; // bits 30:0
    uint32_t reserved_31 : 1;  // bit 31
    uint32_t abort_indicator;  // second dword of the region
    uint8_t data[VMCS_SIZE - 8];
} __attribute__((packed)) vmcs_t;

// =================================================================================================
// Module interface
// Global VMX state, defined in the implementation file.
// NOTE(review): judging by the names, vmx_is_on tracks whether VMX operation is enabled and
// vmcs_hpas holds host-physical addresses of the VMCSs - confirm against vmx.c.
extern bool vmx_is_on;
extern uint64_t *vmcs_hpas;

// VMX lifecycle and VMCS state management.
// NOTE(review): the exact contracts (return codes, required call order) are defined by vmx.c,
// which is not visible from this header.
int vmx_check_cpu_compatibility(void);
int start_vmx_operation(void);
void stop_vmx_operation(void);
int store_orig_vmcs_state(void);
void restore_orig_vmcs_state(void);
int set_vmcs_state(void);
int print_vmx_exit_info(void);

// Module-level constructor / destructor for the VMX component
int init_vmx(void);
void free_vmx(void);

#endif // _RVZR_EXECUTOR_VMX_H_


================================================
FILE: rvzr/executor_km/include/vmx_config.h
================================================
/// File: Configuration constants for VMX
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#ifndef _VMX_CONFIG_H_
#define _VMX_CONFIG_H_

#include <asm/vmx.h>

// Upper bound on the number of guests; the value is hardcoded here, although it
// could be read from cpuid
#define VMX_MAX_NUM_GUESTS 64 // DO NOT INCREASE without knowing exactly what you are doing

// Constants missing in (some versions of) Linux
// The first two are guarded with #ifndef because some kernels already provide them
#ifndef CPU_BASED_ACTIVATE_TERTIARY_CONTROLS
#define CPU_BASED_ACTIVATE_TERTIARY_CONTROLS (1ULL << 17)
#endif
#ifndef SECONDARY_EXEC_RDTSCP
#define SECONDARY_EXEC_RDTSCP (1ULL << 3)
#endif
// The remaining constants are defined unconditionally
// NOTE(review): a kernel that starts defining any of these names would cause a redefinition
#define SECONDARY_EXEC_EPT_VIOLATION_CAUSES_VE (1ULL << 18)
#define SECONDARY_EXEC_PASID_TRANSLATION       (1ULL << 21)
#define SECONDARY_EXEC_SUBPAGE_WRITE_PERM      (1ULL << 23)
#define SECONDARY_EXEC_ENABLE_PCONFIG          (1ULL << 27)
#define SECONDARY_EXEC_ENABLE_ENCLV_EXITING    (1ULL << 28)

// NOTE(review): VM_EXIT_UINV carries a VM_EXIT_ prefix but is used in MUST_CLEAR_ENTRY_CTRL
// (a VM-entry mask) further down in this file - confirm the intended control word
#define VM_EXIT_UINV               (1ULL << 19)
#define VM_ENTRY_CET               (1ULL << 20)
#define VM_ENTRY_LOAD_IA32_LBR_CTL (1ULL << 21)
#define VM_ENTRY_LOAD_IA32_PKRS    (1ULL << 22)

// ----------------------------------------------------------------------------------------------
// Guest control registers
// Each register has a pair of masks: MUST_SET_* lists bits expected to be 1 and
// MUST_CLEAR_* lists bits expected to be 0.
// NOTE(review): how the masks are applied/enforced is decided by the code that uses them.
#define MUST_SET_BITS_CR0_VMX_GUEST                                                                    \
    (X86_CR0_PE | X86_CR0_PG | X86_CR0_NE | X86_CR0_WP | X86_CR0_AM | X86_CR0_ET)
#define MUST_CLEAR_BITS_CR0_VMX_GUEST (X86_CR0_NW | X86_CR0_CD)

#define MUST_SET_BITS_CR4_VMX_GUEST                                                                    \
    (X86_CR4_PSE | X86_CR4_PAE | X86_CR4_MCE | X86_CR4_PGE | X86_CR4_PCE | X86_CR4_OSFXSR |        \
     X86_CR4_OSXMMEXCPT | X86_CR4_VMXE | X86_CR4_PCIDE)
#define MUST_CLEAR_BITS_CR4_VMX_GUEST                                                                  \
    (X86_CR4_VME | X86_CR4_PVI | X86_CR4_TSD | X86_CR4_UMIP | X86_CR4_SMXE | X86_CR4_FSGSBASE |    \
     X86_CR4_OSXSAVE)

// ----------------------------------------------------------------------------------------------
// VMCS control fields
// For every control word there is a MUST_SET_* mask (bits expected to be 1) and
// a MUST_CLEAR_* mask (bits expected to be 0). Table numbers refer to the Intel SDM.

// Table 25-5. Definitions of Pin-Based VM-Execution Controls
// IMPORTANT: never combine setting of PIN_BASED_EXT_INTR_MASK and VM_EXIT_ACK_INTR_ON_EXIT
//            (i.e., at least one must be disabled); otherwise, interrupts lead to system crash
#define MUST_SET_PIN_BASED_VM_EXEC_CONTROL                                                         \
    (PIN_BASED_NMI_EXITING | PIN_BASED_VIRTUAL_NMIS | PIN_BASED_VMX_PREEMPTION_TIMER)
#define MUST_CLEAR_PIN_BASED_VM_EXEC_CONTROL (PIN_BASED_EXT_INTR_MASK | PIN_BASED_POSTED_INTR)

// Table 25-6. Definitions of Primary Processor-Based VM-Execution Controls
// DO NOT add CPU_BASED_RDPMC_EXITING because we may need it if guest primes or probes
// (accordingly, CPU_BASED_RDPMC_EXITING is part of the MUST_CLEAR mask below)
#define MUST_SET_PRIMARY_VM_EXEC_CONTROL                                                           \
    (CPU_BASED_INTR_WINDOW_EXITING | CPU_BASED_HLT_EXITING | CPU_BASED_INVLPG_EXITING |            \
     CPU_BASED_MWAIT_EXITING | CPU_BASED_CR3_LOAD_EXITING | CPU_BASED_CR3_STORE_EXITING |          \
     CPU_BASED_CR8_LOAD_EXITING | CPU_BASED_CR8_STORE_EXITING | CPU_BASED_MOV_DR_EXITING |         \
     CPU_BASED_UNCOND_IO_EXITING | CPU_BASED_MONITOR_EXITING | CPU_BASED_PAUSE_EXITING |           \
     CPU_BASED_ACTIVATE_SECONDARY_CONTROLS | CPU_BASED_NMI_WINDOW_EXITING)
#define MUST_CLEAR_PRIMARY_VM_EXEC_CONTROL                                                         \
    (CPU_BASED_USE_TSC_OFFSETTING | CPU_BASED_RDPMC_EXITING | CPU_BASED_RDTSC_EXITING |            \
     CPU_BASED_ACTIVATE_TERTIARY_CONTROLS | CPU_BASED_TPR_SHADOW | CPU_BASED_USE_IO_BITMAPS |      \
     CPU_BASED_MONITOR_TRAP_FLAG | CPU_BASED_USE_MSR_BITMAPS)

// Table 25-7. Definitions of Secondary Processor-Based VM-Execution Controls
#define MUST_SET_SECONDARY_VM_EXEC_CONTROL                                                         \
    (SECONDARY_EXEC_ENABLE_EPT | SECONDARY_EXEC_DESC | SECONDARY_EXEC_WBINVD_EXITING |             \
     SECONDARY_EXEC_ENABLE_INVPCID | SECONDARY_EXEC_RDRAND_EXITING |                               \
     SECONDARY_EXEC_RDSEED_EXITING)
#define MUST_CLEAR_SECONDARY_VM_EXEC_CONTROL                                                       \
    (SECONDARY_EXEC_VIRTUALIZE_APIC_ACCESSES | SECONDARY_EXEC_RDTSCP |                             \
     SECONDARY_EXEC_VIRTUALIZE_X2APIC_MODE | SECONDARY_EXEC_ENABLE_VPID |                          \
     SECONDARY_EXEC_UNRESTRICTED_GUEST | SECONDARY_EXEC_APIC_REGISTER_VIRT |                       \
     SECONDARY_EXEC_VIRTUAL_INTR_DELIVERY | SECONDARY_EXEC_ENABLE_VMFUNC |                         \
     SECONDARY_EXEC_ENCLS_EXITING | SECONDARY_EXEC_ENABLE_PML |                                    \
     SECONDARY_EXEC_EPT_VIOLATION_CAUSES_VE | SECONDARY_EXEC_PT_CONCEAL_VMX |                      \
     SECONDARY_EXEC_XSAVES | SECONDARY_EXEC_PASID_TRANSLATION |                                    \
     SECONDARY_EXEC_MODE_BASED_EPT_EXEC | SECONDARY_EXEC_SUBPAGE_WRITE_PERM |                      \
     SECONDARY_EXEC_PT_USE_GPA | SECONDARY_EXEC_TSC_SCALING |                                      \
     SECONDARY_EXEC_ENABLE_USR_WAIT_PAUSE | SECONDARY_EXEC_ENABLE_PCONFIG |                        \
     SECONDARY_EXEC_ENABLE_ENCLV_EXITING | SECONDARY_EXEC_SHADOW_VMCS)

// When VMBUILD is defined, the MUST_SET mask for the secondary controls is redefined
// without SECONDARY_EXEC_ENABLE_INVPCID; all other bits are the same as above
#ifdef VMBUILD
#undef MUST_SET_SECONDARY_VM_EXEC_CONTROL
#define MUST_SET_SECONDARY_VM_EXEC_CONTROL                                                         \
    (SECONDARY_EXEC_ENABLE_EPT | SECONDARY_EXEC_DESC | SECONDARY_EXEC_WBINVD_EXITING |             \
     SECONDARY_EXEC_RDRAND_EXITING | SECONDARY_EXEC_RDSEED_EXITING)
#endif

// Misc.
// All 32 bits set
#define DEFAULT_EXCEPTION_BITMAP 0xFFFFFFFF // all exceptions are redirected to host

// Exit/entry controls
// As above: MUST_SET_* lists bits expected to be 1, MUST_CLEAR_* lists bits expected to be 0
#define MUST_SET_EXIT_CTRL (VM_EXIT_SAVE_DEBUG_CONTROLS | VM_EXIT_HOST_ADDR_SPACE_SIZE)
// VM_EXIT_ACK_INTR_ON_EXIT is kept clear; see the IMPORTANT note on the pin-based controls
#define MUST_CLEAR_EXIT_CTRL                                                                       \
    (VM_EXIT_LOAD_IA32_PERF_GLOBAL_CTRL | VM_EXIT_SAVE_IA32_PAT | VM_EXIT_LOAD_IA32_PAT |          \
     VM_EXIT_SAVE_IA32_EFER | VM_EXIT_LOAD_IA32_EFER | VM_EXIT_SAVE_VMX_PREEMPTION_TIMER |         \
     VM_EXIT_CLEAR_BNDCFGS | VM_EXIT_PT_CONCEAL_PIP | VM_EXIT_CLEAR_IA32_RTIT_CTL |                \
     VM_EXIT_ACK_INTR_ON_EXIT)

#define MUST_SET_ENTRY_CTRL (VM_ENTRY_LOAD_DEBUG_CONTROLS | VM_ENTRY_IA32E_MODE)
// NOTE(review): the mask below mixes in VM_EXIT_UINV (bit 19), which has a VM_EXIT_ prefix -
// confirm that bit 19 of the VM-entry controls is what is meant
#define MUST_CLEAR_ENTRY_CTRL                                                                      \
    (VM_ENTRY_SMM | VM_ENTRY_DEACT_DUAL_MONITOR | VM_ENTRY_LOAD_IA32_PERF_GLOBAL_CTRL |            \
     VM_ENTRY_LOAD_IA32_PAT | VM_ENTRY_LOAD_IA32_EFER | VM_ENTRY_LOAD_BNDCFGS |                    \
     VM_ENTRY_PT_CONCEAL_PIP | VM_ENTRY_LOAD_IA32_RTIT_CTL | VM_EXIT_UINV | VM_ENTRY_CET |         \
     VM_ENTRY_LOAD_IA32_LBR_CTL | VM_ENTRY_LOAD_IA32_PKRS)

#endif // _VMX_CONFIG_H_


================================================
FILE: rvzr/executor_km/input_parser.c
================================================
/// File:
///   - Parsing inputs
///   - Management of input-related data structures
///   - Accessors to the input data
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#include <linux/slab.h> // PAGE_SIZE

#include "actor.h"
#include "input_parser.h"
#include "sandbox_manager.h"
#include "shortcuts.h"

// The batch of inputs currently loaded (or being loaded), and the number of inputs in it
input_batch_t *inputs = NULL; // global
size_t n_inputs = 0;          // global

// =================================================================================================
// State machine for input acquisition
// =================================================================================================
// True between the reception of a batch header and the reception of the last data byte
static bool is_receiving_inputs = false;
// Number of bytes of the current batch consumed so far (header + metadata + data)
static uint64_t cursor = 0;
// Dimensions used for the most recent (re-)allocation of the buffers below;
// a batch that exceeds either of them triggers a re-allocation
static size_t highest_n_actors = 0;
static size_t highest_n_inputs = 0;
// Backing buffers, reused across batches; inputs->metadata and inputs->data point to them
static input_fragment_metadata_entry_t *allocated_metadata;
static input_fragment_t *allocated_data;

/// Initialize the state machine for a new batch of inputs
///
/// Reads the fixed-size batch header (two uint64_t values: the number of actors, then the number
/// of inputs), validates it, and only then replaces the current batch and (re-)allocates the
/// buffers that will receive the metadata and the input fragments.
///
/// @param buf Buffer holding the beginning of the batch; the caller must guarantee that it
///            contains at least the 16-byte header
/// @return Number of consumed bytes (the size of the header) on success; a non-positive value on
///         failure (that is what parse_input_buffer checks for; the concrete value comes from
///         the ASSERT*/CHECKED_* macros)
static int start_batch_input_parsing(const char *buf)
{
    int ret = 0;
    const uint64_t *header = (const uint64_t *)buf;

    // Restart parsing
    cursor = 0;

    // Validate the header BEFORE touching the current batch, so that a malformed header
    // does not leave `inputs` pointing to a freshly allocated, uninitialized object

    // Get the number of actors
    // (here, we just check that it matches the previous value from test_case.c)
    uint64_t new_n_actors = header[0];
    ASSERT_MSG(new_n_actors == n_actors, "start_batch_input_parsing",
               "Mismatch in n_actors;"
               " Either inputs were loaded befor the test case,\n"
               "or the declared n_actors does not match "
               "(n_actors = %lu, new_n_actors = %llu)\n",
               n_actors, new_n_actors);
    ret += 8;

    // Get the number of inputs
    // Note: the bound is checked on the full 64-bit value; narrowing it to int first would let
    //       values such as 0xFFFFFFFF or 0x100000001 slip through the check
    uint64_t new_n_inputs = header[1];
    ASSERT(new_n_inputs != 0, "start_batch_input_parsing");
    ASSERT_MSG(new_n_inputs <= (uint64_t)MAX_INPUTS, "start_batch_input_parsing",
               "n_inputs (%llu) > MAX_INPUTS (%u)\n", new_n_inputs, MAX_INPUTS);
    ret += 8;

    // Create a new batch
    SAFE_FREE(inputs);
    inputs = CHECKED_MALLOC(sizeof(input_batch_t));

    // Store object sizes
    //       Note: do not multiply by the number of inputs per actor for metadata,
    //       because we keep the same metadata for each run
    inputs->metadata_size = new_n_actors * sizeof(input_fragment_metadata_entry_t);
    inputs->data_size = new_n_actors * new_n_inputs * sizeof(input_fragment_t);

    // If the number of actors or the number of inputs has increased, we need to re-allocate
    if (new_n_actors > highest_n_actors || new_n_inputs > highest_n_inputs || !allocated_metadata ||
        !allocated_data) {
        SAFE_FREE(allocated_metadata);
        SAFE_VFREE(allocated_data);
        allocated_metadata = CHECKED_MALLOC(inputs->metadata_size);
        allocated_data = CHECKED_VMALLOC(inputs->data_size);
        highest_n_actors = new_n_actors;
        highest_n_inputs = new_n_inputs;
    }

    // Update globals
    inputs->metadata = allocated_metadata;
    inputs->data = allocated_data;
    n_inputs = new_n_inputs;
    // note: n_actors is not updated here; test_case.c is responsible for that

    ASSERT(ret < PAGE_SIZE, "start_batch_input_parsing");
    return ret;
}

/// Parse the inputs sent via sysfs in RDBF format
/// (see docs/devel/binary-formats.md for the format description)
///
/// The function is a state machine driven by the module-level `cursor`: each call consumes
/// bytes belonging to exactly one part of the batch (header, metadata, or data), so the caller
/// is expected to call it repeatedly until all bytes are consumed.
///
/// @param buf Buffer with the next chunk of the batch
/// @param count Number of valid bytes in buf
/// @param[out] finished Set to true when the last byte of the batch has been received;
///             left untouched otherwise
/// @return Number of bytes consumed from buf, or -1 on error
ssize_t parse_input_buffer(const char *buf, size_t count, bool *finished)
{
    ssize_t consumed_bytes = 0;
    ssize_t byte_id = 0;

    if (!is_receiving_inputs) // Starting a new batch
    {
        // Consume the fixed-size part of the batch
        // We assume that this part is small enough to fit into the minimum buffer size,
        // thus it does not require multiple calls to this function.
        // The assumption is enforced here: the header is read unconditionally, so a shorter
        // buffer would be read past its end
        if (count < BATCH_HEADER_SIZE) {
            PRINT_ERRS("parse_input_buffer", "buffer (%zu bytes) is too small for the header\n",
                       count);
            return -1;
        }

        consumed_bytes = start_batch_input_parsing(buf);
        if (consumed_bytes <= 0)
            return -1;

        // advance the cursor only after a successful parse of the header
        cursor += consumed_bytes;
        is_receiving_inputs = true;
    } else if (cursor < BATCH_HEADER_SIZE + inputs->metadata_size) // Parsing metadata
    {
        size_t metadata_cursor = cursor - BATCH_HEADER_SIZE;
        size_t end = inputs->metadata_size;
        for (; metadata_cursor < end && byte_id < count;) {
            ((char *)inputs->metadata)[metadata_cursor] = buf[byte_id];
            byte_id++;
            metadata_cursor++;
        }
        cursor = metadata_cursor + BATCH_HEADER_SIZE;
        consumed_bytes = byte_id;
    } else // Parsing data
    {
        // FIXME: this implementation is not optimal performance-wise,
        // because it will copy the unused data between fragment_size and FRAGMENT_SIZE_ALIGNED
        // See Flavien's implementation for a better one.
        size_t data_cursor = cursor - inputs->metadata_size - BATCH_HEADER_SIZE;
        size_t end = inputs->data_size;
        for (; data_cursor < end && byte_id < count;) {
            ((char *)inputs->data)[data_cursor] = buf[byte_id];
            byte_id++;
            data_cursor++;
        }
        cursor = data_cursor + inputs->metadata_size + BATCH_HEADER_SIZE;
        consumed_bytes = byte_id;
    }

    // Check whether we are done
    size_t data_end = BATCH_HEADER_SIZE + inputs->metadata_size + inputs->data_size;
    if (cursor >= data_end) {
        is_receiving_inputs = false;
        *finished = true;
    }
    // printk(KERN_ERR "parse_input_buffer: consumed_bytes = %lu; count = %lu; cursor = %llu; end =
    // "
    //                 "%lu; finished = %d\n",
    //        consumed_bytes, count, cursor, data_end, *finished);
    return consumed_bytes;
}

// =================================================================================================
// Misc. functions
// =================================================================================================

/// @brief Get the input fragment from the dynamic array, with bounds checking
///        The fragments are addressed input-major, i.e., all fragments of input 0 (one per
///        actor) come first, followed by all fragments of input 1, and so on. This is the same
///        addressing as in get_input_fragment_unsafe; the two accessors must always agree.
/// @param input_id Index of the input within the batch; must be below n_inputs
/// @param actor_id Index of the actor; must be below n_actors
/// @return The input fragment for input_id of actor_id, or NULL if either index is out of range
input_fragment_t *get_input_fragment(uint64_t input_id, uint64_t actor_id)
{
    ASSERT_ENULL(inputs != NULL, "get_input_fragment");
    if (actor_id >= n_actors) {
        PRINT_ERRS("get_input_fragment", "actor_id (%llu) >= n_actors (%lu)\n", actor_id, n_actors);
        return NULL;
    }
    if (input_id >= n_inputs) {
        PRINT_ERRS("get_input_fragment", "input_id (%llu) >= n_inputs (%lu)\n", input_id, n_inputs);
        return NULL;
    }

    // input-major indexing; the previous actor-major formula (actor_id * n_inputs + input_id)
    // returned a different fragment than the unsafe accessor whenever n_actors > 1
    return &inputs->data[(input_id * n_actors) + actor_id];
}

/// @brief Unchecked variant of get_input_fragment: performs no NULL check on the batch and
///        no range checks on the indices
/// @param input_id Index of the input within the batch
/// @param actor_id Index of the actor
/// @return Pointer to the fragment at position (input_id * n_actors + actor_id) of the batch data
input_fragment_t *get_input_fragment_unsafe(uint64_t input_id, uint64_t actor_id)
{
    // fragments are stored input-major: one fragment per actor for each input
    const uint64_t fragment_idx = (input_id * n_actors) + actor_id;
    return inputs->data + fragment_idx;
}

/// Tell whether the parser is idle, i.e., it is not in the middle of receiving a batch
/// (negation of is_receiving_inputs)
bool input_parsing_completed(void)
{
    if (is_receiving_inputs)
        return false;
    return true;
}

// =================================================================================================
int init_input_parser(void)
{
    is_receiving_inputs = false;
    cursor = 0;
    n_inputs = 0;
    inputs = CHECKED_MALLOC(sizeof(input_batch_t));
    allocated_data = CHECKED_VMALLOC(sizeof(input_fragment_t));
    allocated_metadata = CHECKED_MALLOC(sizeof(input_fragment_metadata_entry_t));
    inputs->data_size = 0;
    inputs->metadata_size = 0;
    inputs->data = allocated_data;
    inputs->metadata = allocated_metadata;
    return 0;
}

/// Destructor of the input parser: releases the batch descriptor and both backing buffers
void free_input_parser(void)
{
    // backing buffers first (the data buffer comes from the vmalloc-based allocator) ...
    SAFE_VFREE(allocated_data);
    SAFE_FREE(allocated_metadata);

    // ... then the batch descriptor that referenced them
    SAFE_FREE(inputs);
}


================================================
FILE: rvzr/executor_km/macro_expansion.c
================================================
/// File: Expansion of macros in the test case; used primarily by code_loader.c
///       This file contains architecture-independent code for expanding macros in the test case.
///       For concrete architecture-specific implementations of macros, see <arch>/macros.c.
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#include "hardware_desc.h"

#include "asm_snippets.h"
#include "fault_handler.h"
#include "macro_expansion.h"
#include "main.h"
#include "sandbox_manager.h"
#include "shortcuts.h"
#include "test_case_parser.h"

// Max sizes for sanity checks
// NOTE(review): presumably byte limits applied while scanning macro templates for their
// start/end tokens - confirm at the use sites
#define MAX_MACRO_START_OFFSET 0x100
#define MAX_MACRO_LENGTH       0x800

// Size of the hardcoded prologue that precedes the code of the main section
static size_t main_prologue_size = 0;

// =================================================================================================
// Helper functions
// =================================================================================================
/// @brief Setter/getter for the module variable main_prologue_size
///        This interface is necessary because the main section does not start from offset zero;
///        instead, it starts with a hardcoded prologue. To take this offset into account,
///        Code Loader passes the size of the prologue to the Macros Loader, and then
///        arch-specific macros can query this size to calculate the correct function address.
/// @param size Size of the prologue of the main section
void set_main_prologue_size(size_t size)
{
    main_prologue_size = size;
}

/// @brief Getter counterpart of set_main_prologue_size
/// @return The most recently stored prologue size (0 if it was never set)
size_t get_main_prologue_size(void)
{
    return main_prologue_size;
}

/// @brief Determine the macro subtype from the macro ID and current configuration
/// @param macro_id ID of the macro
/// @return Pointer to the macro descriptor
static macro_descr_t *get_macro_subtype_from_id(uint64_t macro_id)
{
    // determine macro subtype
    macro_subtype_e macro_subtype = TYPE_UNDEFINED;
    switch (macro_id) {
    case MACRO_MEASUREMENT_START:
        switch (measurement_mode) {
        case PRIME_PROBE:
            macro_subtype = TYPE_PRIME;
            break;
        case FAST_PRIME_PROBE:
            macro_subtype = TYPE_FAST_PRIME;
            break;
        case PARTIAL_PRIME_PROBE:
            macro_subtype = TYPE_PARTIAL_PRIME;
            break;
        case FAST_PARTIAL_PRIME_PROBE:
            macro_subtype = TYPE_FAST_PARTIAL_PRIME;
            break;
        case FLUSH_RELOAD:
            macro_subtype = TYPE_FLUSH;
            break;
        case EVICT_RELOAD:
            macro_subtype = TYPE_EVICT;
            break;
        case TSC:
            macro_subtype = TYPE_TSC_START;
            break;
        default:
            PRINT_ERRS("get_macro_subtype_from_id", "misconfigured measurement_mode\n");
            return NULL;
        }
        break;
    case MACRO_FAULT_HANDLER_WITH_MEASUREMENT:
        switch (measurement_mode) {
        case PRIME_PROBE:
        case FAST_PRIME_PROBE:
        case PARTIAL_PRIME_PROBE:
        case FAST_PARTIAL_PRIME_PROBE:
            macro_subtype = TYPE_FAULT_AND_PROBE;
            break;
        case FLUSH_RELOAD:
        case EVICT_RELOAD:
            macro_subtype = TYPE_FAULT_AND_RELOAD;
            break;
        case TSC:
            macro_subtype = TYPE_FAULT_AND_TSC_END;
            break;
        default:
            PRINT_ERRS("get_macro_subtype_from_id", "misconfigured measurement_mode\n");
            return NULL;
        }
        break;
    case MACRO_MEASUREMENT_END:
        switch (measurement_mode) {
        case PRIME_PROBE:
        case FAST_PRIME_PROBE:
        case PARTIAL_PRIME_PROBE:
        case FAST_PARTIAL_PRIME_PROBE:
            macro_subtype = TYPE_PROBE;
            break;
        case FLUSH_RELOAD:
        case EVICT_RELOAD:
            macro_subtype = TYPE_RELOAD;
            break;
        case TSC:
            macro_subtype = TYPE_TSC_END;
            break;
        default:
            PRINT_ERRS("get_macro_subtype_from_id", "misconfigured measurement_mode\n");
            return NULL;
        }
        break;
    case MACRO_SWITCH_K2U:
        macro_subtype = TYPE_SWITCH_K2U;
        break;
    case MACRO_SWITCH_U2K:
        macro_subtype = TYPE_SWITCH_U2K;
        break;
    case MACRO_SWITCH_H2G:
        macro_subtype = TYPE_SWITCH_H2G;
        break;
    case MACRO_SWITCH_G2H:
        macro_subtype = TYPE_SWITCH_G2H;
        break;
    case MACRO_SET_H2G_TARGET:
        macro_subtype = TYPE_SET_H2G_TARGET;
        break;
    case MACRO_SET_G2H_TARGET:
        macro_subtype = TYPE_SET_G2H_TARGET;
        break;
    case MACRO_FAULT_HANDLER:
        macro_subtype = TYPE_FAULT_HANDLER;
        break;
    case MACRO_SWITCH:
        macro_subtype = TYPE_SWITCH;
        break;
    case MACRO_SET_K2U_TARGET:
        macro_subtype = TYPE_SET_K2U_TARGET;
        break;
    case MACRO_SET_U2K_TARGET:
        macro_subtype = TYPE_SET_U2K_TARGET;
        break;
    case MACRO_LANDING_K2U:
        macro_subtype = TYPE_LANDING_K2U;
        break;
    case MACRO_LANDING_U2K:
        macro_subtype = TYPE_LANDING_U2K;
        break;
    case MACRO_LANDING_H2G:
        macro_subtype = TYPE_LANDING_H2G;
        break;
    case MACRO_LANDING_G2H:
        macro_subtype = TYPE_LANDING_G2H;
        break;
    case MACRO_SET_DATA_PERMISSIONS:
        macro_subtype = TYPE_SET_DATA_PERMISSIONS;
        break;
    default:
        PRINT_ERRS("get_macro_subtype_from_id", "macro_id %llu is not valid\n", macro_id);
        return NULL;
    }

    macro_descr_t *descr = &macro_descriptors[macro_subtype];
    if (descr->start == NULL && descr->body == NULL) {
        PRINT_ERRS("get_macro_subtype_from_id", "macro_id %llu is not implemented\n", macro_id);
        return NULL;
    }
    return descr;
}

/// @brief Test whether the 8 bytes at ptr spell out the MACRO_START token
///        (least significant byte of the token at ptr[0])
/// @param ptr Pointer to at least 8 readable bytes
/// @return True if the bytes match the token marking the start of a macro, false otherwise
static inline bool is_macro_start(uint8_t *ptr)
{
    int byte_idx;

    // compare from the most significant byte (ptr[7]) down to ptr[0];
    // bail out on the first mismatch
    for (byte_idx = 7; byte_idx >= 0; byte_idx--) {
        if (ptr[byte_idx] != ((MACRO_START >> (8 * byte_idx)) & 0xFF))
            return false;
    }
    return true;
}

/// @brief Test whether the 8 bytes at ptr spell out the MACRO_END token
///        (least significant byte of the token at ptr[0])
/// @param ptr Pointer to at least 8 readable bytes
/// @return True if the bytes match the token marking the end of a macro, false otherwise
static inline bool is_macro_end(uint8_t *ptr)
{
    int byte_idx;

    // compare from the most significant byte (ptr[7]) down to ptr[0];
    // bail out on the first mismatch
    for (byte_idx = 7; byte_idx >= 0; byte_idx--) {
        if (ptr[byte_idx] != ((MACRO_END >> (8 * byte_idx)) & 0xFF))
            return false;
    }
    return true;
}

/// @brief Replace the NOP at the given location with a relative jump to the expanded macro
///        and add a fence after the jump to prevent straight-line speculation
///        The function writes raw machine code into dest: 8 bytes on x86-64 (5-byte jmp +
///        3-byte lfence) and 12 bytes on ARM (b + isb + dsb, 4 bytes each). If neither
///        ARCH_X86_64 nor ARCH_ARM is defined, nothing is written and 0 is returned.
/// @param dest Destination buffer; must have room for the emitted instructions
/// @param target Target address for the jump, as a byte offset relative to dest
/// @return Size of the added code, in bytes
static inline uint64_t insert_relative_jmp_n_fence(uint8_t *dest, int32_t target)
{
    uint64_t cursor = 0;

#if defined(ARCH_X86_64)
    // the displacement of a near jmp is relative to the END of the jmp instruction,
    // hence the correction by the instruction size
    const int jmp_opcode_size = 5;
    target -= jmp_opcode_size;

    // jmp *target
    dest[cursor++] = 0xe9; // start of the jump opcode
    // 32-bit displacement, stored through a (possibly unaligned) type-punned pointer
    *((uint32_t *)&dest[cursor]) = target;
    cursor += 4;

    // lfence
    dest[cursor++] = 0x0f;
    dest[cursor++] = 0xae;
    dest[cursor++] = 0xe8;
#elif defined(ARCH_ARM)
    // offsets in ARM are in dwords
    target = target / 4;

    // the target for a jump is a 26-bit signed offset from the current PC
    int target_sign = target < 0 ? 1 : 0;
    ASSERT(target < 0x02000000 && target >= -0x02000000, "insert_relative_jmp_n_fence");
    // keep the low 26 bits; bit 25 carries the sign
    target = (target & 0x3FFFFFF) | (target_sign << 25);

    // b *target
    *((uint32_t *)&dest[cursor]) = 0x14000000; // start of the jump opcode
    *((uint32_t *)&dest[cursor]) |= target;
    cursor += 4;

    // isb
    *((uint32_t *)&dest[cursor]) = 0xd5033fdf;
    cursor += 4;

    // dsb SY
    *((uint32_t *)&dest[cursor]) = 0xd5033f9f;
    cursor += 4;

#endif

    return cursor;
}

// =================================================================================================
// Macro expansion logic
// =================================================================================================

/// @brief Generate the argument-dependent part of a macro by calling the descriptor's
///        start callback
/// @param[in] descr Macro descriptor; descr->start must be non-NULL
/// @param[in] args Four 16-bit macro arguments packed into one 64-bit value
///            (arg1 in the lowest 16 bits, arg4 in the highest)
/// @param[in] owner ID of the actor owning the macro
/// @param[out] dest Buffer that receives the generated code
/// @return Size of the added code, in bytes
static uint64_t inject_macro_configurable_part(macro_descr_t *descr, uint64_t args, uint64_t owner,
                                               uint8_t *dest)
{
    // Unpack the 16-bit fields of the compressed argument word
    macro_args_t unpacked = {
        .arg1 = (args >> 0) & 0xFFFF,
        .arg2 = (args >> 16) & 0xFFFF,
        .arg3 = (args >> 32) & 0xFFFF,
        .arg4 = (args >> 48) & 0xFFFF,
        .owner = owner,
    };

    // Let the descriptor emit the code; its return value is the emitted size
    const size_t emitted = descr->start(unpacked, dest);
    return emitted;
}

/// @brief Copy the static part of a macro, i.e. the bytes enclosed between the MACRO_START
///        and MACRO_END tokens inside descr->body, into the destination buffer
/// @param[in] descr Macro descriptor; descr->body must be non-NULL
/// @param[out] dest Buffer that receives the copied bytes
/// @return Number of bytes copied (0 if the two tokens are adjacent)
static uint64_t inject_macro_static_part(macro_descr_t *descr, uint8_t *dest)
{
    uint8_t *macro_wrapper_start = (uint8_t *)descr->body;
    uint8_t *macro_start;
    uint8_t *macro_end;

    // Scan forward from the wrapper start until the start token is found,
    // then step over the token itself
    for (macro_start = macro_wrapper_start; !is_macro_start(macro_start);) {
        macro_start++;
        ASSERT(macro_start - macro_wrapper_start < MAX_MACRO_START_OFFSET, "get_macro_ptr");
    }
    macro_start += MACRO_START_TOKEN_LENGTH;

    // Scan forward from the first payload byte until the end token is found
    for (macro_end = macro_start; !is_macro_end(macro_end);) {
        macro_end++;
        ASSERT(macro_end - macro_start < MAX_MACRO_LENGTH, "get_macro_ptr");
    }

    // Copy whatever lies between the two tokens; nothing to do for an empty payload
    size_t size = macro_end - macro_start;
    if (size != 0)
        memcpy(dest, macro_start, size);
    return size;
}

/// @brief Expand a macro into the macro area (macro_dest) and patch the code area (code_dest)
///        with a relative jump to the expanded macro; the expanded macro ends with a jump
///        back to the code that follows the patched jump
/// @param[in] macro Symbol table entry of the macro to expand (id, args and owner are used)
/// @param[out] code_dest Location in the code area that receives the jump + fence
/// @param[out] macro_dest Destination buffer for the expanded macro
/// @param[out] macro_size Size of the expanded macro, in bytes
/// @return 0 on success; invalid input is reported through ASSERT
///         (NOTE(review): presumably ASSERT makes the function return an error -- confirm)
int expand_macro(tc_symbol_entry_t *macro, uint8_t *code_dest, uint8_t *macro_dest,
                 size_t *macro_size)
{
    uint64_t code_cursor = 0;
    uint64_t macro_cursor = 0;

    // Get the macro type
    symbol_id_t type_id = macro->id;
    ASSERT(type_id != 0, "expand_macro");

    // Get the macro descriptor
    macro_descr_t *descr = get_macro_subtype_from_id(type_id);
    ASSERT(descr != NULL, "expand_macro");

    // Code area: Replace the NOP with a relative jump to the expanded macro + fence
    int32_t target = (int32_t)(&macro_dest[macro_cursor] - code_dest);
    code_cursor += insert_relative_jmp_n_fence(&code_dest[code_cursor], target);

    // Macro area: Inject the configurable part of the macro
    // (the cursors are unsigned, so there is no negative size to check for afterwards)
    if (descr->start != NULL) {
        macro_cursor += inject_macro_configurable_part(descr, macro->args, macro->owner,
                                                       &macro_dest[macro_cursor]);
    }

    // Macro area: Inject the static part of the macro
    if (descr->body != NULL) {
        macro_cursor += inject_macro_static_part(descr, &macro_dest[macro_cursor]);
    }

    // Macro area: Insert a relative jump back to the code that follows the patched jump
    target = (int32_t)(&code_dest[code_cursor] - &macro_dest[macro_cursor]);
    macro_cursor += insert_relative_jmp_n_fence(&macro_dest[macro_cursor], target);

    *macro_size = macro_cursor;
    return 0;
}


================================================
FILE: rvzr/executor_km/main.c
================================================
/// File: Kernel module interface
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

// clang-format off
#include <linux/kernel.h>
#include <linux/init.h>
#include <linux/module.h>
#include <linux/sysfs.h>
#include <linux/version.h>
#include <linux/kobject.h>
#include <asm/processor.h>
// clang-format on

#include "hardware_desc.h"

#include "actor.h"
#include "code_loader.h"
#include "data_loader.h"
#include "hardware_desc.h"
#include "input_parser.h"
#include "macro_expansion.h"
#include "main.h"
#include "measurement.h"
#include "sandbox_manager.h"
#include "shortcuts.h"
#include "test_case_parser.h"

#include "fault_handler.h"
#include "page_tables_common.h"
#include "page_tables_guest.h"
#include "page_tables_host.h"
#include "perf_counters.h"
#include "special_registers.h"

// ISA-specific includes
#if defined(ARCH_X86_64)
#include "svm.h"
#include "vmx.h"
#elif defined(ARCH_ARM)
#include <asm/cpufeature.h>
#endif

// =================================================================================================
// Kernel compatibility handling

// Version-dependent includes
#if LINUX_VERSION_CODE >= KERNEL_VERSION(5, 6, 6)
#ifdef ARCH_X86_64
#include <../arch/x86/include/asm/io.h>
#endif
#endif

// On these kernels kallsyms_lookup_name is located through a kprobe placed on the symbol
// (see _get_required_kernel_functions)
#if LINUX_VERSION_CODE >= KERNEL_VERSION(5, 7, 0)
#define KPROBE_LOOKUP 1
#include <linux/kprobes.h>
static struct kprobe kp = {.symbol_name = "kallsyms_lookup_name"};
#endif

#if LINUX_VERSION_CODE <= KERNEL_VERSION(4, 12, 0)
#include <asm/cacheflush.h>
#endif

// On these kernels set_memory_x, set_memory_nx and init_mm are defined locally and filled in
// at module load via kallsyms_lookup_name (see _get_required_kernel_functions);
// note that init_mm is a by-value copy taken at that moment
#if LINUX_VERSION_CODE >= KERNEL_VERSION(5, 4, 0)
#include <linux/kallsyms.h>
int (*set_memory_x)(unsigned long, int) = 0;
int (*set_memory_nx)(unsigned long, int) = 0;
struct mm_struct init_mm = {0};
#else
#include <linux/set_memory.h>
#endif

// Version-dependent definitions
// bin_attr_t is the type of the bin_attribute argument in the binary sysfs read callback
// (see test_case_bin_read); it is const-qualified on newer kernels
#if LINUX_VERSION_CODE >= KERNEL_VERSION(6, 14, 0)
#define bin_attr_t const struct bin_attribute
#else
#define bin_attr_t struct bin_attribute
#endif

// =================================================================================================
// Global Variables
// Set through the enable_quick_and_dirty_mode sysfs file; reset by measurement_mode_store
bool quick_and_dirty_mode = false;

// Configuration values; each one is set through the sysfs store handler noted next to it
long uarch_reset_rounds = UARCH_RESET_ROUNDS_DEFAULT;           // warmups
bool enable_ssbp_patch = SSBP_PATCH_DEFAULT;                    // enable_ssbp_patch
bool enable_prefetchers = PREFETCHER_DEFAULT;                   // enable_prefetcher
char pre_run_flush = PRE_RUN_FLUSH_DEFAULT;                     // enable_pre_run_flush
bool enable_hpa_gpa_collisions = HPA_GPA_COLLISIONS_DEFAULT;    // enable_hpa_gpa_collisions
measurement_mode_e measurement_mode = MEASUREMENT_MODE_DEFAULT; // measurement_mode
bool dbg_gpr_mode = DBG_GPR_MODE_DEFAULT;                       // enable_dbg_gpr_mode

// CPU description; assigned once in executor_init from get_cpuinfo()
cpuinfo_t *cpuinfo = NULL;

// =================================================================================================
// Local declarations and definitions
#define SYSFS_DIRNAME "rvzr_executor"
// kobject backing the sysfs directory; created in executor_init, released in executor_exit
static struct kobject *kobj_interface;

unsigned inputs_top = 0;
bool inputs_ready = false; // set by inputs_store once the input parser reports completion
bool tc_ready = false;     // set by test_case_store once the test case is parsed and loaded

// Raised in trace_show before tracing and cleared once tracing returned successfully;
// executor_exit refuses to tear the module down while it is set
bool unfinished_call = false;

// =================================================================================================
// SysFS interface to the module

/* warning! need write-all permission so overriding check */
/* (the override turns the compile-time permission check into a pass-through, which lets the
   0666 modes below compile) */
#undef VERIFY_OCTAL_PERMISSIONS
#define VERIFY_OCTAL_PERMISSIONS(perms) (perms)

/// Reading hardware traces and performance counters
/// (read-only: no store handler is registered)
static ssize_t trace_show(struct kobject *kobj, struct kobj_attribute *attr, char *buf);
static struct kobj_attribute trace_attribute = __ATTR(trace, 0664, trace_show, NULL);

/// Loading a test case
/// (write-only: no show handler is registered)
static ssize_t test_case_store(struct kobject *kobj, struct kobj_attribute *attr, const char *buf,
                               size_t count);
static struct kobj_attribute test_case_attribute = __ATTR(test_case, 0666, NULL, test_case_store);

/// Binary read-back of the loaded test case
/// NOTE(review): __BIN_ATTR_RO presumably binds test_case_bin_read by name -- confirm
static ssize_t test_case_bin_read(struct file *file, struct kobject *kobj, bin_attr_t *bin_attr,
                                  char *to, loff_t pos, size_t count);
static struct bin_attribute test_case_bin_attribute = __BIN_ATTR_RO(test_case_bin, 0);

/// Loading inputs
///
static ssize_t inputs_store(struct kobject *kobj, struct kobj_attribute *attr, const char *buf,
                            size_t count);
static ssize_t inputs_show(struct kobject *kobj, struct kobj_attribute *attr, char *buf);
static struct kobj_attribute inputs_attribute = __ATTR(inputs, 0666, inputs_show, inputs_store);

/// Setting the number of warm up rounds
///
static ssize_t warmups_show(struct kobject *kobj, struct kobj_attribute *attr, char *buf);
static ssize_t warmups_store(struct kobject *kobj, struct kobj_attribute *attr, const char *buf,
                             size_t count);
static struct kobj_attribute warmups_attribute = __ATTR(warmups, 0666, warmups_show, warmups_store);

/// Getting the data base address
///
static ssize_t print_data_base_show(struct kobject *kobj, struct kobj_attribute *attr, char *buf);
static struct kobj_attribute print_data_base_attribute =
    __ATTR(print_data_base, 0664, print_data_base_show, NULL);

/// Getting the base address of the memory region where the test case is loaded
///
static ssize_t print_code_base_show(struct kobject *kobj, struct kobj_attribute *attr, char *buf);
static struct kobj_attribute print_code_base_attribute =
    __ATTR(print_code_base, 0664, print_code_base_show, NULL);

/// Control SSBP patch
///
static ssize_t enable_ssbp_patch_store(struct kobject *kobj, struct kobj_attribute *attr,
                                       const char *buf, size_t count);
static struct kobj_attribute enable_ssbp_patch_attribute =
    __ATTR(enable_ssbp_patch, 0666, NULL, enable_ssbp_patch_store);

/// Control prefetchers
///
static ssize_t enable_prefetcher_store(struct kobject *kobj, struct kobj_attribute *attr,
                                       const char *buf, size_t count);
static struct kobj_attribute enable_prefetcher_attribute =
    __ATTR(enable_prefetcher, 0666, NULL, enable_prefetcher_store);

/// Control flushing
///
static ssize_t enable_pre_run_flush_store(struct kobject *kobj, struct kobj_attribute *attr,
                                          const char *buf, size_t count);
static struct kobj_attribute enable_pre_run_flush_attribute =
    __ATTR(enable_pre_run_flush, 0666, NULL, enable_pre_run_flush_store);

// Control virtual memory mapping
static ssize_t enable_hpa_gpa_collisions_store(struct kobject *kobj, struct kobj_attribute *attr,
                                               const char *buf, size_t count);
static struct kobj_attribute enable_hpa_gpa_collisions_attribute =
    __ATTR(enable_hpa_gpa_collisions, 0666, NULL, enable_hpa_gpa_collisions_store);

/// Measurement template selector
///
static ssize_t measurement_mode_store(struct kobject *kobj, struct kobj_attribute *attr,
                                      const char *buf, size_t count);
static struct kobj_attribute measurement_mode_attribute =
    __ATTR(measurement_mode, 0666, NULL, measurement_mode_store);

/// Q&D mode selector
///
static ssize_t enable_quick_and_dirty_mode(struct kobject *kobj, struct kobj_attribute *attr,
                                           const char *buf, size_t count);
static struct kobj_attribute enable_quick_and_dirty_mode_attribute =
    __ATTR(enable_quick_and_dirty_mode, 0666, NULL, enable_quick_and_dirty_mode);

/// Setting which faults should be handled within the test case
///
static ssize_t handled_faults_show(struct kobject *kobj, struct kobj_attribute *attr, char *buf);
static ssize_t handled_faults_store(struct kobject *kobj, struct kobj_attribute *attr,
                                    const char *buf, size_t count);
static struct kobj_attribute handled_faults_attribute =
    __ATTR(handled_faults, 0666, handled_faults_show, handled_faults_store);

/// Debug GPR mode selector
///
static ssize_t enable_dbg_gpr_mode(struct kobject *kobj, struct kobj_attribute *attr,
                                   const char *buf, size_t count);
static struct kobj_attribute enable_dbg_gpr_mode_attribute =
    __ATTR(enable_dbg_gpr_mode, 0666, NULL, enable_dbg_gpr_mode);

/// Debugging interface
/// (the dump attribute is exposed under the file name dbg_dump_mode)
static ssize_t dbg_dump_show(struct kobject *kobj, struct kobj_attribute *attr, char *buf);
static struct kobj_attribute dbg_dump_attribute = __ATTR(dbg_dump_mode, 0666, dbg_dump_show, NULL);

static ssize_t dbg_guest_page_tables_show(struct kobject *kobj, struct kobj_attribute *attr,
                                          char *buf);
static struct kobj_attribute dbg_guest_page_tables_attribute =
    __ATTR(dbg_guest_page_tables, 0666, dbg_guest_page_tables_show, NULL);

// Text attributes; executor_init creates one sysfs file per entry, in this order,
// and stops at the terminating NULL
static struct attribute *sysfs_attributes[] = {
    &trace_attribute.attr,
    &test_case_attribute.attr,
    &inputs_attribute.attr,
    &warmups_attribute.attr,
    &print_data_base_attribute.attr,
    &print_code_base_attribute.attr,
    &enable_ssbp_patch_attribute.attr,
    &enable_prefetcher_attribute.attr,
    &enable_pre_run_flush_attribute.attr,
    &measurement_mode_attribute.attr,
    &enable_quick_and_dirty_mode_attribute.attr,
    &enable_dbg_gpr_mode_attribute.attr,
    &handled_faults_attribute.attr,
    &dbg_dump_attribute.attr,
    &dbg_guest_page_tables_attribute.attr,
    &enable_hpa_gpa_collisions_attribute.attr,
    NULL, /* need to NULL terminate the list of attributes */
};

// Binary attributes; executor_init creates one binary sysfs file per entry
static struct bin_attribute *bin_sysfs_attributes[] = {
    &test_case_bin_attribute, //
    NULL,                     /* need to NULL terminate the list of attributes */
};

// =================================================================================================
// Implementation of the sysfs attributes

int next_measurement_id = -1;
static ssize_t trace_show(struct kobject *kobj, struct kobj_attribute *attr, char *buf)
{
    int count = 0;
    int retval = 0;

    ASSERT(measurements, "trace_show");
    ASSERT(input_parsing_completed(), "trace_show");
    ASSERT(tc_parsing_completed(), "trace_show");

    // start a new measurement?
    unfinished_call = true;
    if (next_measurement_id < 0) {
        int err = trace_test_case();
        if (err)
            return -EIO;

        // start printing the results
        next_measurement_id = n_inputs - 1;
    }
    unfinished_call = false;

    // print the results, but make sure we can continue later if we run out of space in buf
    for (; next_measurement_id >= 0; next_measurement_id--) {
        // check if the output buffer still has space
        if (count >= (4096 - 128))
            return count; // we will continue in the next call of this function

        measurement_t m = measurements[next_measurement_id];
        retval =
            sprintf(&buf[count], "%llu,%llu,%llu,%llu,%llu,%llu\n", m.htrace[0], m.pfc_reading[0],
                    m.pfc_reading[1], m.pfc_reading[2], m.pfc_reading[3], m.pfc_reading[4]);
        if (!retval)
            return -1;
        count += retval;
    }
    count += sprintf(&buf[count], "done\n");
    return count;
}

/// @brief Check if the parsed test case is compatible with the current CPU
/// @param void
/// @return 0 if the test case is compatible, an error value otherwise.
///         On x86-64: test cases with user actors require SMAP and SMEP to be disabled in CR4
///         (unless built with FORCE_SMAP_OFF); test cases with VM actors are checked by the
///         vendor-specific (VMX or SVM) compatibility routine. Other architectures: always 0.
static int check_test_case_compat(void)
{
    int err = 0;

#ifdef ARCH_X86_64
    if (test_case->features.includes_user_actors) {
#ifndef FORCE_SMAP_OFF
        // ensure that SMAP and SMEP are disabled
        uint64_t cr4 = __read_cr4();
        ASSERT(!(cr4 & (X86_CR4_SMAP | X86_CR4_SMEP)), "test_case_store");
#endif
    }
    if (test_case->features.includes_vm_actors) {
        if (cpuinfo->x86_vendor == X86_VENDOR_INTEL) {
            err = vmx_check_cpu_compatibility();
        } else if (cpuinfo->x86_vendor == X86_VENDOR_AMD) {
            err = svm_check_cpu_compatibility();
        }
        CHECK_ERR("vm_check_cpu_compatibility");
    }
#endif

    return err;
}

/// @brief Sysfs store handler for the test_case file: passes the written chunk to the test
///        case parser and, once the parser reports a complete test case, checks its
///        compatibility with the CPU, allocates the sandbox and loads the code
/// @param kobj Unused
/// @param attr Unused
/// @param[in] buf Chunk of the test case written by the user
/// @param[in] count Size of the chunk, in bytes
/// @return Number of bytes consumed by the parser; failures of the later steps are
///         handled by CHECK_ERR
static ssize_t test_case_store(struct kobject *kobj, struct kobj_attribute *attr, const char *buf,
                               size_t count)
{
    int err = 0;
    bool finished = false;
    ssize_t consumed_bytes;

    // any write invalidates the previously loaded test case
    tc_ready = false;

    consumed_bytes = parse_test_case_buffer(buf, count, &finished);
    if (!finished)
        return consumed_bytes; // more chunks are expected

    // the test case is complete: make sure this CPU can execute it
    err = check_test_case_compat();
    CHECK_ERR("check_test_case_compat");

    // set up the sandbox and place the code into it
    err = allocate_sandbox();
    CHECK_ERR("allocate_sandbox");

    err = load_sandbox_code();
    CHECK_ERR("load_sandbox_code");

    // the next read of the trace file starts a fresh measurement
    next_measurement_id = -1;
    tc_ready = true;
    return consumed_bytes;
}

/// @brief Binary sysfs read handler: copies a chunk of the loaded test case, starting at
///        offset pos, into the output buffer
/// @param file Unused
/// @param kobj Unused
/// @param bin_attr Unused
/// @param[out] to Output buffer; at most count bytes are written to it
/// @param[in] pos Read offset from loaded_test_case_entry, in bytes
/// @param[in] count Maximum number of bytes requested by the reader
/// @return Number of bytes copied; 0 when pos is at or past the end of the readable area
///         (n_actors * sizeof(actor_code_t) bytes)
static ssize_t test_case_bin_read(struct file *file, struct kobject *kobj, bin_attr_t *bin_attr,
                                  char *to, loff_t pos, size_t count)
{
    loff_t max_pos = n_actors * sizeof(actor_code_t);
    if (pos < 0 || pos >= max_pos)
        return 0;

    // Never copy more than the reader asked for: the output buffer is only guaranteed
    // to hold count bytes
    size_t available = (size_t)(max_pos - pos);
    if (count > available)
        count = available;
    if (count > PAGE_SIZE)
        count = PAGE_SIZE;

    memcpy(to, &loaded_test_case_entry[pos], count);
    return count;
}

/// @brief Sysfs store handler for the inputs file: passes the written chunk to the input
///        parser and records whether the parser reported a complete set of inputs
/// @param kobj Unused
/// @param attr Unused
/// @param[in] buf Chunk of input data written by the user
/// @param[in] count Size of the chunk, in bytes
/// @return Number of bytes consumed by the parser
static ssize_t inputs_store(struct kobject *kobj, struct kobj_attribute *attr, const char *buf,
                            size_t count)
{
    bool parsing_done = false;
    ssize_t consumed_bytes = parse_input_buffer(buf, count, &parsing_done);

    // inputs are ready only after the chunk that completes the parsing
    inputs_ready = parsing_done;
    return consumed_bytes;
}

/// @brief Sysfs show handler for the inputs file: prints the inputs_ready flag (0 or 1)
/// @param kobj Unused
/// @param attr Unused
/// @param[out] buf Sysfs output buffer
/// @return Number of bytes written to buf
static ssize_t inputs_show(struct kobject *kobj, struct kobj_attribute *attr, char *buf)
{
    // FIXME: not implemented yet. See Flavien's branch for a reference implementation
    const int ready = inputs_ready;

    return sprintf(buf, "%d\n", ready);
}

/// @brief Sysfs show handler for the warmups file: prints uarch_reset_rounds
/// @param kobj Unused
/// @param attr Unused
/// @param[out] buf Sysfs output buffer
/// @return Number of bytes written to buf
static ssize_t warmups_show(struct kobject *kobj, struct kobj_attribute *attr, char *buf)
{
    const long rounds = uarch_reset_rounds;

    return sprintf(buf, "%ld\n", rounds);
}

static ssize_t warmups_store(struct kobject *kobj, struct kobj_attribute *attr, const char *buf,
                             size_t count)
{
    sscanf(buf, "%ld", &uarch_reset_rounds);
    return count;
}

/// @brief Sysfs show handler: prints the address of sandbox->data[0] in hexadecimal
/// @param kobj Unused
/// @param attr Unused
/// @param[out] buf Sysfs output buffer
/// @return Number of bytes written to buf
static ssize_t print_data_base_show(struct kobject *kobj, struct kobj_attribute *attr, char *buf)
{
    const long long unsigned data_base = (long long unsigned)&sandbox->data[0];

    return sprintf(buf, "%llx\n", data_base);
}

/// @brief Sysfs show handler: prints the address held in loaded_test_case_entry in hexadecimal
/// @param kobj Unused
/// @param attr Unused
/// @param[out] buf Sysfs output buffer
/// @return Number of bytes written to buf
static ssize_t print_code_base_show(struct kobject *kobj, struct kobj_attribute *attr, char *buf)
{
    const long long unsigned code_base = (long long unsigned)loaded_test_case_entry;

    return sprintf(buf, "%llx\n", code_base);
}

static ssize_t enable_ssbp_patch_store(struct kobject *kobj, struct kobj_attribute *attr,
                                       const char *buf, size_t count)
{
    unsigned value = 0;
    sscanf(buf, "%u", &value);
    enable_ssbp_patch = (value == 0) ? false : true;
    return count;
}

static ssize_t enable_prefetcher_store(struct kobject *kobj, struct kobj_attribute *attr,
                                       const char *buf, size_t count)
{
    unsigned value = 0;
    sscanf(buf, "%u", &value);
    enable_prefetchers = (value == 0) ? false : true;
    return count;
}

static ssize_t enable_pre_run_flush_store(struct kobject *kobj, struct kobj_attribute *attr,
                                          const char *buf, size_t count)
{
    unsigned value = 0;
    sscanf(buf, "%u", &value);
    pre_run_flush = (value == 0) ? 0 : 1;
    return count;
}

static ssize_t enable_hpa_gpa_collisions_store(struct kobject *kobj, struct kobj_attribute *attr,
                                               const char *buf, size_t count)
{
    unsigned value = 0;
    sscanf(buf, "%u", &value);
    enable_hpa_gpa_collisions = (value == 0) ? false : true;
    return count;
}

static ssize_t measurement_mode_store(struct kobject *kobj, struct kobj_attribute *attr,
                                      const char *buf, size_t count)
{
    switch (buf[0]) {
    case 'P':
        if (buf[1] == '+')
            measurement_mode = PRIME_PROBE;
        else
            measurement_mode = PARTIAL_PRIME_PROBE;
        break;
    case 'F':
        measurement_mode = FLUSH_RELOAD;
        break;
    case 'E':
        measurement_mode = EVICT_RELOAD;
        break;
    case 'T':
        measurement_mode = TSC;
        break;
    default:
        PRINT_ERRS("measurement_mode_store", "Invalid measurement mode\n");
        return -1;
    }

    quick_and_dirty_mode = false; // updating the measurement mode resets the Q&D mode
    return count;
}

static ssize_t enable_quick_and_dirty_mode(struct kobject *kobj, struct kobj_attribute *attr,
                                           const char *buf, size_t count)
{

    unsigned value = 0;
    sscanf(buf, "%u", &value);
    if (value == 1 && quick_and_dirty_mode == false) {
        quick_and_dirty_mode = true;
        switch (measurement_mode) {
        case PRIME_PROBE:
            measurement_mode = FAST_PRIME_PROBE;
            break;
        case PARTIAL_PRIME_PROBE:
            measurement_mode = FAST_PARTIAL_PRIME_PROBE;
            break;
        default:
            break;
        }
    } else if (value == 0 && quick_and_dirty_mode == true) {
        quick_and_dirty_mode = false;
        switch (measurement_mode) {
        case FAST_PRIME_PROBE:
            measurement_mode = PRIME_PROBE;
            break;
        case FAST_PARTIAL_PRIME_PROBE:
            measurement_mode = PARTIAL_PRIME_PROBE;
            break;
        default:
            break;
        }
    }
    return count;
}

static ssize_t enable_dbg_gpr_mode(struct kobject *kobj, struct kobj_attribute *attr,
                                   const char *buf, size_t count)
{
    unsigned value = 0;
    sscanf(buf, "%u", &value);
    dbg_gpr_mode = (value == 0) ? false : true;
    return count;
}

/// @brief Sysfs show handler: prints handled_faults as a 0x-prefixed hexadecimal number
/// @param kobj Unused
/// @param attr Unused
/// @param[out] buf Sysfs output buffer
/// @return Number of bytes written to buf
static ssize_t handled_faults_show(struct kobject *kobj, struct kobj_attribute *attr, char *buf)
{
    const unsigned long long mask = (unsigned long long)handled_faults;

    return sprintf(buf, "0x%llx\n", mask);
}

/// @brief Sysfs store handler: sets handled_faults to the written value combined (OR) with
///        HANDLED_FAULTS_DEFAULT
/// @param kobj Unused
/// @param attr Unused
/// @param[in] buf Unsigned decimal number written by the user
///            (note that handled_faults_show prints the value in hexadecimal)
/// @param[in] count Size of the written data, in bytes
/// @return count on success; -EINVAL if buf does not start with a number
static ssize_t handled_faults_store(struct kobject *kobj, struct kobj_attribute *attr,
                                    const char *buf, size_t count)
{
    unsigned long long value;

    // the conversion specifier must match the unsigned destination
    if (sscanf(buf, "%llu", &value) != 1)
        return -EINVAL;

    handled_faults = value | HANDLED_FAULTS_DEFAULT;
    return count;
}

/// Dump all global variables
///
static ssize_t dbg_dump_show(struct kobject *kobj, struct kobj_attribute *attr, char *buf)
{
    int len = 0;
    len += sprintf(&buf[len], "n_actors: %lu\n", n_actors);
    len += sprintf(&buf[len], "test_case: 0x%llx\n", (uint64_t)test_case);
    len += sprintf(&buf[len], "loaded_test_case_entry: 0x%llx\n", (uint64_t)loaded_test_case_entry);
    len += sprintf(&buf[len], "measurements: 0x%llx\n", (uint64_t)measurements);
    len += sprintf(&buf[len], "n_inputs: %lu\n", n_inputs);
    len += sprintf(&buf[len], "inputs: %llx\n", (uint64_t)inputs);
    if (inputs) {
        len += sprintf(&buf[len], "inputs->metadata: %llx\n", (uint64_t)inputs->metadata);
        len += sprintf(&buf[len], "inputs->data: %llx\n", (uint64_t)inputs->data);
    }
    len += sprintf(&buf[len], "sandbox: %llx\n", (uint64_t)sandbox);
    len += sprintf(&buf[len], "fault_handler: %llx\n", (uint64_t)fault_handler);
    len += sprintf(&buf[len], "handled_faults: %u\n", handled_faults);
    len += sprintf(&buf[len], "quick_and_dirty_mode: %d\n", quick_and_dirty_mode);
    len += sprintf(&buf[len], "uarch_reset_rounds: %ld\n", uarch_reset_rounds);
    len += sprintf(&buf[len], "enable_ssbp_patch: %d\n", enable_ssbp_patch);
    len += sprintf(&buf[len], "enable_prefetchers: %d\n", enable_prefetchers);
    len += sprintf(&buf[len], "pre_run_flush: %d\n", pre_run_flush);
    return len;
}

/// Dump the guest page tables and the EPT of actor 1 into the kernel log;
/// with fewer than two actors, only a notice is printed into buf
static ssize_t dbg_guest_page_tables_show(struct kobject *kobj, struct kobj_attribute *attr,
                                          char *buf)
{
    int err;

    if (n_actors < 2)
        return sprintf(buf, "No actors to print tables for\n");

    // the EPT is dumped only if the guest page tables were dumped successfully
    err = dbg_dump_guest_page_tables(1);
    if (!err)
        err = dbg_dump_ept(1);
    if (err)
        return err;

    return sprintf(buf, "done (see dmesg)\n");
}

// =================================================================================================
// Initialization and Memory Management
// =================================================================================================

/// @brief Get symbols for missing kernel functions: on kernels >= 5.4, resolves set_memory_x,
///        set_memory_nx and init_mm through kallsyms_lookup_name (which itself is located
///        with a kprobe when KPROBE_LOOKUP is defined). Symbols that cannot be resolved are
///        reported in the kernel log and left at their initial (zero) value.
/// @param void
/// @return void
static inline void _get_required_kernel_functions(void)
{
#if LINUX_VERSION_CODE >= KERNEL_VERSION(5, 4, 0)
#ifdef KPROBE_LOOKUP
    typedef unsigned long (*kallsyms_lookup_name_t)(const char *name);
    kallsyms_lookup_name_t kallsyms_lookup_name;

    // a failed registration leaves no usable address; calling through it would crash
    int kp_err = register_kprobe(&kp);
    if (kp_err < 0) {
        printk(KERN_ERR "rvzr_executor: Failed to locate kallsyms_lookup_name (err=%d)\n",
               kp_err);
        return;
    }
    kallsyms_lookup_name = (kallsyms_lookup_name_t)kp.addr;
    unregister_kprobe(&kp);
    if (!kallsyms_lookup_name) {
        printk(KERN_ERR "rvzr_executor: kallsyms_lookup_name has no address\n");
        return;
    }
#endif // KPROBE_LOOKUP
    set_memory_x = (void *)kallsyms_lookup_name("set_memory_x");
    set_memory_nx = (void *)kallsyms_lookup_name("set_memory_nx");
    if (!set_memory_x || !set_memory_nx)
        printk(KERN_ERR "rvzr_executor: Failed to resolve set_memory_x/set_memory_nx\n");

    // copy init_mm only if the symbol was found
    struct mm_struct *init_mm_ptr = (struct mm_struct *)kallsyms_lookup_name("init_mm");
    if (init_mm_ptr)
        init_mm = *init_mm_ptr;
    else
        printk(KERN_ERR "rvzr_executor: Failed to resolve init_mm\n");
#endif // LINUX_VERSION_CODE >= KERNEL_VERSION(5, 4, 0)
}

/// @brief Get a description of the CPU
///        - x86-64: the description of CPU 0 kept by the kernel
///        - ARM: a newly allocated structure filled from the fields of MIDR_EL1
/// @param void
/// @return Pointer to the CPU description; NULL if the allocation failed (ARM only)
static inline cpuinfo_t *get_cpuinfo(void)
{
#if defined(ARCH_X86_64)
    return &cpu_data(0);
#elif defined(ARCH_ARM)
    uint64_t midr_el1 = 0;
    cpuinfo_t *info = kmalloc(sizeof(cpuinfo_t), GFP_KERNEL);

    if (info == NULL)
        return NULL;

    // read the identification register and split it into its fields
    asm volatile("MRS %0, MIDR_EL1" : "=r"(midr_el1));
    info->implementer = (midr_el1 >> 24) & 0xFF;
    info->variant = (midr_el1 >> 20) & 0xF;
    info->architecture = (midr_el1 >> 16) & 0xF;
    info->part = (midr_el1 >> 4) & 0xFFF;
    info->revision = midr_el1 & 0xF;

    return info;
#endif
}

/// @brief Check if the CPU supports the required features
///        x86-64: the vendor must be Intel or AMD, AVX and MMX must be available, and the
///        width of physical addresses must equal PHYSICAL_WIDTH. ARM: no checks so far.
/// @param void
/// @return 0 on success, -1 on failure
static int check_cpu_compat(void)
{
#if defined(ARCH_X86_64)
    // Check CPU vendor
    if (cpuinfo->x86_vendor != X86_VENDOR_INTEL && cpuinfo->x86_vendor != X86_VENDOR_AMD) {
        printk(KERN_ERR "ERROR: rvzr_executor: This CPU vendor is not supported\n");
        return -1;
    }

    // Check that the CPU supports the required features
    if (!cpu_has(cpuinfo, X86_FEATURE_AVX) || !cpu_has(cpuinfo, X86_FEATURE_MMX)) {
        printk(KERN_ERR "ERROR: rvzr_executor: Executor KM requires AVX and MMX\n");
        return -1;
    }

    // Check memory configuration
    unsigned int phys_addr_width = cpuinfo->x86_phys_bits;
    if (phys_addr_width != PHYSICAL_WIDTH) {
        printk(KERN_ERR "rvzr_executor: ERROR: The width of physical addresses is %u instead of "
                        "expected %d\n",
               phys_addr_width, PHYSICAL_WIDTH);
        return -1;
    }
#elif defined(ARCH_ARM)
    // Nothing so far
#endif
    return 0;
}

/// @brief Module entry point: collects the CPU description, checks CPU compatibility,
///        resolves the required kernel symbols, initializes all submodules and creates the
///        sysfs interface
/// @param void
/// @return 0 on success; -ENOMEM if the CPU description or the sysfs directory could not be
///         created; -1 if the CPU is not compatible; otherwise the error of the failing step
static int __init executor_init(void)
{
    int err = 0;
    struct attribute **attr_it;
    struct bin_attribute **bin_attr_it;

    // The CPU description is kept in a global variable for future references
    cpuinfo = get_cpuinfo();
    if (cpuinfo == NULL) {
        printk(KERN_ERR "rvzr_executor: Failed to get CPU information\n");
        return -ENOMEM;
    }

    // Refuse to load on CPUs without the required features
    if (check_cpu_compat() != 0)
        return -1;

    // Resolve the kernel symbols that are not available directly
    _get_required_kernel_functions();

    // Initialize the submodules; the results are accumulated and checked once at the end
    err |= init_measurements();
    err |= init_sandbox_manager();
    err |= init_code_loader();
    err |= init_data_loader();
    err |= init_input_parser();
    err |= init_test_case_parser();
    err |= init_fault_handler();
    err |= init_page_table_manager();
    err |= init_perf_counters();
    err |= init_special_register_manager();

#if VENDOR_ID == VENDOR_INTEL_
    err |= init_vmx();
#elif VENDOR_ID == VENDOR_AMD_
    err |= init_svm();
#endif
    CHECK_ERR("executor_init");

    // Create the sysfs directory of the module
    kobj_interface = kobject_create_and_add(SYSFS_DIRNAME, kernel_kobj->parent);
    if (!kobj_interface) {
        printk(KERN_ERR "rvzr_executor: Failed to create a sysfs directory for x86-executor\n");
        return -ENOMEM;
    }

    // Create one file per text attribute; stop at the first failure
    for (attr_it = sysfs_attributes; !err && *attr_it != NULL; attr_it++)
        err = sysfs_create_file(kobj_interface, *attr_it);
    if (err != 0) {
        printk(KERN_ERR "rvzr_executor: Failed to create a sysfs group\n");
        kobject_put(kobj_interface);
        return err;
    }

    // Create binary attributes (used for passing large amounts of data)
    for (bin_attr_it = bin_sysfs_attributes; !err && *bin_attr_it != NULL; bin_attr_it++)
        err = sysfs_create_bin_file(kobj_interface, *bin_attr_it);
    if (err != 0) {
        printk(KERN_ERR "rvzr_executor: Failed to create a binary sysfs files\n");
        kobject_put(kobj_interface);
        return err;
    }

    return 0;
}

/// @brief Module exit point: drops the sysfs interface and frees the state of all submodules.
///        Nothing is released if a sysfs call was interrupted (unfinished_call is set).
/// @param void
/// @return void
static void __exit executor_exit(void)
{
    if (unfinished_call) {
        PRINT_ERR("CRITICAL ERROR: executor crashed while handling a sysfs call\n"
                  "Removing the module is no longer safe as it may lead to system blocking\n"
                  "Reboot to remove the module\n");
        return;
    }

    // Drop the sysfs directory first, before freeing the state that its handlers access
    if (kobj_interface)
        kobject_put(kobj_interface);

    free_measurements();
    free_sandbox_manager();
    free_code_loader();
    free_data_loader();
    free_input_parser();
    free_test_case_parser();
    free_fault_handler();
    free_page_table_manager();
    free_perf_counters();
    free_special_register_manager();

#if VENDOR_ID == VENDOR_INTEL_
    free_vmx();
#elif VENDOR_ID == VENDOR_AMD_
    free_svm();
#endif

    // on ARM the CPU description is heap-allocated by get_cpuinfo
#if defined(ARCH_ARM)
    if (cpuinfo)
        kfree(cpuinfo);
#endif
}

// Register the module entry and exit points and the module metadata
module_init(executor_init);
module_exit(executor_exit);
MODULE_LICENSE("Dual MIT/GPL");
MODULE_AUTHOR("Oleksii Oleksenko");


================================================
FILE: rvzr/executor_km/measurement.c
================================================
/// File:
///  - Test case execution
///  - Ensuring an isolated environment
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#include "hardware_desc.h"
#include <asm/processor.h>

#include "code_loader.h"
#include "data_loader.h"
#include "input_parser.h"
#include "main.h"
#include "measurement.h"
#include "sandbox_manager.h"
#include "shortcuts.h"
#include "test_case_parser.h"

#include "fault_handler.h"
#include "page_tables_guest.h"
#include "page_tables_host.h"
#include "perf_counters.h"
#include "special_registers.h"

#ifdef ARCH_X86_64
#include <asm/msr-index.h>
#include <asm/msr.h>
#include <asm/spec-ctrl.h>

#include "svm.h"
#include "vmx.h"
#elif defined(ARCH_ARM)

#endif

// Array of measurement results, one entry per input; allocated by init_measurements() and
// alloc_measurements(), filled by run_experiment(), released by free_measurements()
measurement_t *measurements = NULL; // global

// Entry point called by trace_test_case() to start the measurement loop
int run_experiment_outer(void); // inline asm label defined in <arch>/fault_handler.c

// =================================================================================================
// Local shortcut functions
// =================================================================================================

/// @brief Flushes the microarchitectural state
/// @details Intel builds execute VERW, request an L1D flush through MSR_IA32_FLUSH_CMD (skipped
///          when VMBUILD is defined), and then execute WBINVD followed by LFENCE.
///          AMD builds execute only WBINVD followed by LFENCE.
///          For any other VENDOR_ID the function body is empty.
/// @param void
/// @return always 0; no failure path is implemented at the moment
static inline int uarch_flush(void)
{
#if VENDOR_ID == VENDOR_INTEL_ // Intel
    // VERW needs a memory operand that holds a segment selector; the kernel data segment is used
    // NOTE(review): presumably executed for its CPU-buffer-clearing side effect - confirm
    static const u16 ds = __KERNEL_DS;
    asm volatile("verw %[ds]" : : [ds] "m"(ds) : "cc");
#ifndef VMBUILD
    // the L1D flush command MSR is not written in VM builds
    wrmsr64(MSR_IA32_FLUSH_CMD, L1D_FLUSH);
#endif
    // write back and invalidate the caches, then serialize
    asm volatile("wbinvd\n" : : :);
    asm volatile("lfence\n" : : :);
#elif VENDOR_ID == VENDOR_AMD_ // AMD
    // write back and invalidate the caches, then serialize
    asm volatile("wbinvd\n" : : :);
    asm volatile("lfence\n" : : :);
    // TBD
#endif
    return 0;
}

/// @brief Check if entry page of the test case is valid (present and executable)
/// @param void
/// @return 0 if the entry page is valid, -1 otherwise
static int check_test_case_entry(void)
{
    pte_t *tc_pte = get_pte((uint64_t)loaded_test_case_entry);
    if (!tc_pte || !pte_present(*tc_pte)) {
        return -1;
    }
#ifdef ARCH_X86_64
    if (!pte_exec(*tc_pte)) {
        return -1;
    }
#endif

    return 0;
}

/// @brief Decide whether a measurement can be trusted
/// @details A measurement is valid only if its state machine reached STATUS_ENDED and no SMI
///          was counted while it was running. Every rejection is reported with a warning.
/// @param status The status record of the measurement to inspect
/// @return 0 if the measurement is valid, -1 if it is corrupted
static int check_measurement_status(measurement_status_t *status)
{
    // 1. the measurement must have run from start to end
    switch (status->measurement_state) {
    case STATUS_ENDED:
        break;
    case STATUS_UNINITIALIZED:
        PRINT_WARNS("run_experiment",
                    "Corrupted measurement: measurement_start macro was not executed, state=%d",
                    status->measurement_state);
        return -1;
    case STATUS_STARTED:
        PRINT_WARNS("run_experiment",
                    "Corrupted measurement: measurement_end macro was not executed, state=%d",
                    status->measurement_state);
        return -1;
    default:
        PRINT_WARNS("run_experiment", "Corrupted measurement: unknown state, state=%d",
                    status->measurement_state);
        return -1;
    }

    // 2. no SMI may have interrupted the measurement
    if (status->smi_count != 0) {
        PRINT_WARNS("run_experiment", "Corrupted measurement: SMI detected, count=%d",
                    status->smi_count);
        return -1;
    }

    return 0;
}

/// @brief Check if the executor is ready to start measurements, and perform the necessary
///        setup of the CPU to ensure that the test case can be executed. Note that this function
///        only partially configures the CPU, and more will be done in set_execution_environment
/// @details On success the function has, in this order: configured the performance counters,
///          called kernel_fpu_begin() (x86-64 only), called get_cpu(), and saved + disabled
///          local interrupts. post_run() undoes these steps.
///          All checks that can fail are located before the first of these state changes.
/// @param irq_flags Output parameter; receives the interrupt flags saved by raw_local_irq_save
/// @return 0 on success; non-zero if a precondition check or pfc_configure fails
///         (NOTE(review): the exact error values come from the ASSERT/CHECK_ERR macros, which
///         are assumed to return from this function on failure - confirm in shortcuts.h)
static int pre_run(unsigned long *irq_flags)
{
    int err = 0;

    // check that all main data structures were allocated
    ASSERT(loaded_test_case_entry, "trace_test_case");
    ASSERT(check_test_case_entry() == 0, "trace_test_case");
    ASSERT(inputs, "trace_test_case");
    ASSERT(inputs->metadata, "trace_test_case");
    ASSERT(inputs->data, "trace_test_case");

    // Configure performance counters
    err |= pfc_configure();
    CHECK_ERR("trace_test_case:pfc_configure");

    // Enable FPU - just in case, we might use it within the test case
#ifdef ARCH_X86_64
    kernel_fpu_begin();
#endif

    // Prevent preemption
    get_cpu();

    // Disable local interrupts; the previous state is handed back to the caller
    unsigned long flags;
    raw_local_irq_save(flags);
    *irq_flags = flags;

    return err;
}

/// @brief Cleanup after the test case execution by undoing the changes made in pre_run
/// @details The steps mirror pre_run in reverse order: restore the interrupt state, call
///          put_cpu(), and call kernel_fpu_end() (x86-64 only). AMD builds additionally execute
///          STGI first.
/// @param irq_flags The flags to restore the interrupt state (as stored by pre_run)
/// @return void
static inline void post_run(unsigned long *irq_flags)
{
#if VENDOR_ID == VENDOR_AMD_
    asm volatile("stgi\n"); // enable interrupts in case they were disabled
#endif
    // restore the interrupt state saved in pre_run
    unsigned long flags = *irq_flags;
    raw_local_irq_restore(flags);

    // counterpart of get_cpu() in pre_run
    put_cpu();

    // counterpart of kernel_fpu_begin() in pre_run
#ifdef ARCH_X86_64
    kernel_fpu_end();
#endif
}

// =================================================================================================
// CPU state management
// =================================================================================================
/// @brief Save the current CPU configuration and switch the CPU into the configuration
///        required by the test case
/// @details The special registers are always reconfigured. On x86-64, if the test case contains
///          VM actors, virtualization is additionally started (VMX on Intel CPUs, SVM on AMD
///          CPUs), the original VMCS/VMCB state is stored, and the test-case state is installed.
/// @param void
/// @return 0 on success; the error code of the first failing step otherwise
static int set_execution_environment(void)
{
    int err = set_special_registers();
    CHECK_ERR("set_execution_environment:set_special_registers");

#ifdef ARCH_X86_64
    // virtualization is needed only by test cases with VM actors
    if (!test_case->features.includes_vm_actors)
        return 0;

    switch (cpuinfo->x86_vendor) {
    case X86_VENDOR_INTEL:
        err = start_vmx_operation();
        CHECK_ERR("set_execution_environment:start_vmx_operation");

        err = store_orig_vmcs_state();
        CHECK_ERR("set_execution_environment:store_orig_vmcs_state");

        err = set_vmcs_state();
        CHECK_ERR("set_execution_environment:set_vmcs_state");
        break;

    case X86_VENDOR_AMD:
        err = start_svm_operation();
        CHECK_ERR("set_execution_environment:start_svm_operation");

        err = store_orig_vmcb_state();
        CHECK_ERR("set_execution_environment:store_orig_vmcb_state");

        err = set_vmcb_state();
        CHECK_ERR("set_execution_environment:set_vmcb_state");
        break;

    default:
        // other vendors: nothing to configure
        break;
    }
#endif
    return 0;
}

/// @brief Restores the CPU state to the state before the test case execution. This function is
/// written in a fail-safe manner, so that it can be called in fault handlers.
/// @details Undoes set_execution_environment() and set_sandbox_page_tables(): first the
///          virtualization state (x86-64 with VM actors only), then the faulty page permissions,
///          the special registers, and finally the original sandbox page table entries.
///          Return values of the individual restore steps are not checked here.
/// @param void
/// @return void
void recover_orig_state(void)
{
    // restore VMX state
#ifdef ARCH_X86_64
    if (test_case->features.includes_vm_actors) {
        if (cpuinfo->x86_vendor == X86_VENDOR_INTEL) {
            // if (vmx_is_on)
            //     print_vmx_exit_info(); // uncomment to debug VMX exits
            restore_orig_vmcs_state();
            stop_vmx_operation();
        } else if (cpuinfo->x86_vendor == X86_VENDOR_AMD) {
            // if (svm_is_on)
            //     print_svm_exit_info(); // uncomment to debug SVM exits
            restore_orig_vmcb_state();
            stop_svm_operation();
        }
    }
#endif

    // restore the sandbox and register state (counterparts of the setup done in run_experiment)
    restore_faulty_page_permissions();
    restore_special_registers();
    restore_orig_sandbox_page_tables();
}

// =================================================================================================
// Measurement loop: trace_test_case -> run_experiment_outer -> run_experiment
// =================================================================================================

/// @brief Run a complete measurement experiment: setup the execution environment and execute
///        the loaded test case for each input, storing the resulting hardware traces and PFC
///        readings in the global `measurements` array
/// @details The loop starts with `uarch_reset_rounds` warm-up iterations (negative index) that
///          all execute input 0, followed by one iteration per input. A corrupted measurement
///          stops the experiment early without being reported as an error: its htrace simply
///          lacks the validity bit (bit 63). On error, measurements[0].htrace[0] is set to 0.
///          recover_orig_state() is called on every exit path.
/// @param void
/// @return 0 on success or on early termination caused by a corrupted measurement; the non-zero
///         error code of the failing step (setup or test case execution) otherwise
int run_experiment(void)
{
    int err = 0;

    // save the original sandbox PTEs and apply the page table configuration of the test case
    err = set_sandbox_page_tables();
    if (err)
        goto cleanup;

    // configure the CPU (and anything else necessary) to prepare for the test case execution
    err = set_execution_environment();
    if (err)
        goto cleanup;

    // Zero-initialize the region of memory used by Prime+Probe
    if (!quick_and_dirty_mode)
        memset(&sandbox->util->l1d_priming_area[0], 0, L1D_PRIMING_AREA_SIZE * sizeof(char));

    // Try to reset the uarch state
    // (we do it here because from this point on the execution is expected to be deterministic
    // and depend solely on the test case and the input to it)
    if (pre_run_flush == 1 && !quick_and_dirty_mode)
        uarch_flush();

    long rounds = (long)n_inputs;
    for (long i = -uarch_reset_rounds; i < rounds; i++) {
        // warm-up runs (i < 0; there are uarch_reset_rounds of them) all use input 0
        long i_ = (i < 0) ? 0 : i;

        // Prepare sandbox
        load_sandbox_data(i_);
        set_faulty_page_permissions();

        // Catch all exceptions
        set_inner_fault_handlers();

        // Execute
        char *main_data = &sandbox->data[0].main_area[0];
        err = ((int (*)(char *))loaded_test_case_entry)(main_data);

        // Restore the original fault handlers and sandbox state
        unset_inner_fault_handlers();
        restore_faulty_page_permissions();
        if (err) // Note: this check HAS to be after IDT/PT reset to avoid corrupting system state
            goto cleanup;

        // Store the measurement
        // (warm-up runs also write to slot 0; the slot is overwritten by the run with i == 0)
        measurement_t result = sandbox->util->vars.latest_measurement;
        measurements[i_].htrace[0] = result.htrace[0];
        memcpy(measurements[i_].pfc_reading, result.pfc_reading, sizeof(uint64_t) * NUM_PFC);

        // Post-process the measurement
        // (only in normal, non-debug non-warmup runs)
        if (i >= 0 && !dbg_gpr_mode) {
            // Check for measurement corruption
            if (check_measurement_status(&result.status) != 0)
                // Note: we intentionally do not set the `err` variable upon corruption, because
                // corruptions are expected to happen every once in a while because of SMIs,
                // and thus we want to handle them gracefully
                goto cleanup;

            // If the measurement is valid, set the upper bit of htrace
            // to distinguish correct htraces from corrupted ones
            measurements[i_].htrace[0] |= 1ULL << 63;
        }
    }

cleanup:
    if (err)
        measurements[0].htrace[0] = 0; // communicate the error up to executor.py
    // always undo the environment changes, also on the error paths
    recover_orig_state();
    CHECK_ERR("run_experiment:cleanup");
    return err;
}

/// @brief The outermost wrapper for the test case execution. Makes sure the `measurements`
///        array is large enough, prepares the CPU via pre_run (performance counters, FPU,
///        preemption, interrupts), calls run_experiment_outer, and undoes the preparation
///        via post_run
/// @details run_experiment_outer is skipped when there are no inputs (`n_inputs` == 0).
///          post_run is called whenever pre_run succeeded, also if the experiment failed.
/// @param void
/// @return 0 on success; a non-zero error code if the allocation, pre_run, or the experiment
///         fails
int trace_test_case(void)
{
    int err = 0;
    unsigned long irq_flags = 0;

    // grow the result buffer if the number of inputs increased
    err = alloc_measurements();
    CHECK_ERR("alloc_measurements");

    // nothing needs to be undone if pre_run fails: its checks precede its state changes
    err = pre_run(&irq_flags);
    CHECK_ERR("trace_test_case:pre_run");

    if (n_inputs) {
        err |= run_experiment_outer();
    }

    // undo pre_run first; the experiment error (if any) is reported afterwards
    post_run(&irq_flags);
    CHECK_ERR("trace_test_case:cleanup");

    return err;
}

// =================================================================================================
// Constructor and destructor + initialization
// =================================================================================================
/// @brief Make sure that the global `measurements` array has room for `n_inputs` entries
/// @details The array only grows: if the current capacity is sufficient, nothing happens.
///          Otherwise the old array is freed and a new, zero-initialized one is allocated
///          (old contents are not preserved).
///          The recorded capacity is updated only after the new array exists, so that a failed
///          allocation is retried by the next call instead of being mistaken for a success.
/// @param void
/// @return 0 on success; a non-zero error code if the allocation fails
///         (NOTE(review): relies on CHECKED_VMALLOC returning from this function on failure,
///         as the original code did - confirm in shortcuts.h)
int alloc_measurements(void)
{
    // capacity (in entries) of the array allocated by this function; 0 if there is none
    static int old_n_inputs = 0;
    if (n_inputs <= old_n_inputs)
        return 0;

    // The old array is released before the new one is requested. Until the allocation below
    // succeeds there is no array at all, so the recorded capacity must drop to zero.
    SAFE_VFREE(measurements);
    old_n_inputs = 0;

    measurements = CHECKED_VMALLOC(n_inputs * sizeof(measurement_t));
    memset(measurements, 0, n_inputs * sizeof(measurement_t));

    // the new array is in place; remember its capacity
    old_n_inputs = n_inputs;
    return 0;
}

/// @brief Constructor of the measurement module: allocates an initial `measurements` array
///        with room for a single entry
/// @details The entry is zero-initialized, consistently with alloc_measurements(), so that the
///          array never exposes stale memory contents before the first experiment.
/// @param void
/// @return 0 on success; a non-zero error code if the allocation fails
///         (NOTE(review): relies on CHECKED_VMALLOC returning from this function on failure -
///         confirm in shortcuts.h)
int init_measurements(void)
{
    measurements = CHECKED_VMALLOC(sizeof(measurement_t));
    memset(measurements, 0, sizeof(measurement_t));
    return 0;
}

/// @brief Destructor for the measurement module; frees the global `measurements` array
/// @param void
/// @return void
void free_measurements(void)
{
    SAFE_VFREE(measurements);
}


================================================
FILE: rvzr/executor_km/page_tables_host.c
================================================
/// File:
///  - Page Table management
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#include <linux/kernel.h>
#include <linux/mm.h>

#include "actor.h"
#include "hardware_desc.h"
#include "sandbox_manager.h"
#include "shortcuts.h"

#include "page_tables_common.h"
#include "page_tables_host.h"

// Cached pointers to the host PTEs of all sandbox pages (filled by cache_host_pteps)
sandbox_pteps_t *sandbox_pteps;

// Copies of the sandbox PTEs taken by store_orig_host_permissions
static sandbox_ptes_t *orig_ptes;
// Per-actor copy of the faulty-page PTE taken by set_faulty_page_host_permissions
static pte_t_ *faulty_ptes = NULL;

extern struct mm_struct init_mm;

/// @brief Walk the kernel page tables and return the last-level PTE of a host virtual address
/// @details The walk goes through all levels (PGD, P4D, PUD, PMD, PTE) and stops with an error
///          message as soon as a level is empty or (for PUD/PMD) marked as bad.
/// @param hva Host virtual address; must be either a vmalloc address or an address for which
///            virt_addr_valid() holds
/// @return Pointer to the PTE that maps `hva`; NULL if the address is not supported or is not
///         mapped (NOTE(review): ASSERT_ENULL is assumed to return NULL when the PTE is not
///         present - confirm in shortcuts.h)
pte_t *get_pte(uint64_t hva)
{
    // Only vmalloc addresses and valid linear-map (kmalloc) addresses are supported
    if (!is_vmalloc_addr((void *)hva) && !virt_addr_valid((void *)hva)) {
        PRINT_ERR("get_pte: address not in vmalloc or kmalloc area\n");
        return NULL;
    }

    // Do a page walk
    pgd_t *pgdp = pgd_offset_k(hva);
    pgd_t pgd = READ_ONCE(*pgdp);
    if (pgd_none(pgd)) {
        PRINT_ERR("get_pte: pgd_none\n");
        return NULL;
    }

    p4d_t *p4dp = p4d_offset(pgdp, hva);
    p4d_t p4d = READ_ONCE(*p4dp);
    if (p4d_none(p4d)) {
        PRINT_ERR("get_pte: p4d_none\n");
        return NULL;
    }

    pud_t *pudp = pud_offset(p4dp, hva);
    pud_t pud = READ_ONCE(*pudp);
    if (pud_none(pud)) {
        PRINT_ERR("get_pte: pud_none\n");
        return NULL;
    }
    if (pud_bad(pud)) {
        PRINT_ERR("get_pte: pud_bad\n");
        return NULL;
    }

    pmd_t *pmdp = pmd_offset(pudp, hva);
    pmd_t pmd = READ_ONCE(*pmdp);
    if (pmd_none(pmd)) {
        PRINT_ERR("get_pte: pmd_none\n");
        return NULL;
    }
    if (pmd_bad(pmd)) {
        PRINT_ERR("get_pte: pmd_bad\n");
        return NULL;
    }

    // the last level: the entry must describe a present page
    pte_t *pte = pte_offset_kernel(pmdp, hva);
    ASSERT_ENULL(pte_present(*pte), "get_pte");

    return pte;
}

// =================================================================================================
// Manipulation of Host Page Tables
// =================================================================================================
/// @brief Cache the PTE pointers for all sandbox pages.
/// @details Resolves, via get_pte(), the host PTE of every util page and of every data and code
///          page of every actor, and stores the pointers in `sandbox_pteps`. The data/code
///          pointer arrays are reallocated when `n_actors` is larger than in the previous call.
///          The arrays are indexed as `actor_id * N_<DATA|CODE>_PAGES_PER_ACTOR + page`.
/// @param void
/// @return 0 on success; non-zero if a precondition fails, an allocation fails, or a PTE cannot
///         be resolved (NOTE(review): exact values come from the ASSERT/CHECKED_ZALLOC macros,
///         which are assumed to return from this function on failure - confirm)
int cache_host_pteps(void)
{
    ASSERT(sandbox_pteps != NULL, "cache_host_pteps");
    ASSERT(sandbox != NULL, "cache_host_pteps");

    // number of actors seen by the previous call; the initial arrays hold a single actor
    static int old_n_actors = 1;
    if (n_actors > old_n_actors) {
        // more actors than in the previous call: replace the per-actor pointer arrays
        SAFE_FREE(sandbox_pteps->data_pteps);
        SAFE_FREE(sandbox_pteps->code_pteps);
        sandbox_pteps->data_pteps =
            CHECKED_ZALLOC(N_DATA_PAGES_PER_ACTOR * n_actors * sizeof(pte_t_ *));
        sandbox_pteps->code_pteps =
            CHECKED_ZALLOC(N_CODE_PAGES_PER_ACTOR * n_actors * sizeof(pte_t_ *));
    }
    old_n_actors = n_actors;

    // cache the PTE pointers for the util pages
    for (int i = 0; i < N_UTIL_PAGES; i++) {
        uint64_t va = (uint64_t)sandbox->util + i * PAGE_SIZE;
        pte_t *ptep = get_pte(va);
        ASSERT(ptep != NULL, "cache_host_pteps");
        sandbox_pteps->util_pteps[i] = (pte_t_ *)&ptep->pte;
    }

    // cache the PTE pointers for the code and data pages of the sandbox
    for (int actor_id = 0; actor_id < n_actors; actor_id++) {
        // cache the PTE pointers for the data pages of the actor
        for (int i = 0; i < N_DATA_PAGES_PER_ACTOR; i++) {
            uint64_t va = ((uint64_t)&sandbox->data[actor_id]) + i * PAGE_SIZE;
            pte_t *ptep = get_pte(va);
            ASSERT(ptep != NULL, "cache_host_pteps");
            sandbox_pteps->data_pteps[actor_id * N_DATA_PAGES_PER_ACTOR + i] = (pte_t_ *)&ptep->pte;
        }
        // cache the PTE pointers for the code pages of the actor
        for (int i = 0; i < N_CODE_PAGES_PER_ACTOR; i++) {
            uint64_t va = ((uint64_t)&sandbox->code[actor_id]) + i * PAGE_SIZE;
            pte_t *ptep = get_pte(va);
            ASSERT(ptep != NULL, "cache_host_pteps");
            sandbox_pteps->code_pteps[actor_id * N_CODE_PAGES_PER_ACTOR + i] = (pte_t_ *)&ptep->pte;
        }
    }
    return 0;
}

/// @brief Preserve the original PTEs for all sandbox pages.
/// @details Copies the current value of every cached sandbox PTE (util, data, code) into
///          `orig_ptes`, from where restore_orig_host_permissions() can write it back.
///          When `n_actors` is larger than in the previous call, the per-actor arrays of
///          `orig_ptes` and the `faulty_ptes` array are reallocated first.
///          Requires the PTE pointers to be cached already (see cache_host_pteps).
/// @param void
/// @return 0 on success; non-zero if the PTE pointers are not cached or an allocation fails
///         (NOTE(review): exact values come from the ASSERT/CHECKED_ZALLOC macros, which are
///         assumed to return from this function on failure - confirm)
int store_orig_host_permissions(void)
{
    ASSERT(sandbox_pteps->util_pteps[0] != NULL, "store_orig_host_permissions");
    ASSERT(sandbox_pteps->data_pteps[0] != NULL, "store_orig_host_permissions");
    ASSERT(sandbox_pteps->code_pteps[0] != NULL, "store_orig_host_permissions");

    // number of actors seen by the previous call; the initial arrays hold a single actor
    static int old_n_actors = 1;
    if (n_actors > old_n_actors) {
        // more actors than in the previous call: replace the per-actor arrays
        SAFE_FREE(orig_ptes->data_ptes);
        SAFE_FREE(orig_ptes->code_ptes);
        orig_ptes->data_ptes = CHECKED_ZALLOC(N_DATA_PAGES_PER_ACTOR * n_actors * sizeof(pte_t_));
        orig_ptes->code_ptes = CHECKED_ZALLOC(N_CODE_PAGES_PER_ACTOR * n_actors * sizeof(pte_t_));

        // one saved faulty-page PTE per actor
        SAFE_FREE(faulty_ptes);
        faulty_ptes = CHECKED_ZALLOC(sizeof(pte_t_) * n_actors);
    }
    old_n_actors = n_actors;

    // save the original PTEs for the util pages
    for (int i = 0; i < N_UTIL_PAGES; i++) {
        orig_ptes->util_ptes[i] = *sandbox_pteps->util_pteps[i];
    }

    // save the original PTEs for the code and data pages of the sandbox
    for (int actor_id = 0; actor_id < n_actors; actor_id++) {
        // save the original PTEs for the data pages of the actor
        for (int i = 0; i < N_DATA_PAGES_PER_ACTOR; i++) {
            int page_id = actor_id * N_DATA_PAGES_PER_ACTOR + i;
            orig_ptes->data_ptes[page_id] = *sandbox_pteps->data_pteps[page_id];
        }
        // save the original PTEs for the code pages of the actor
        for (int i = 0; i < N_CODE_PAGES_PER_ACTOR; i++) {
            int page_id = actor_id * N_CODE_PAGES_PER_ACTOR + i;
            orig_ptes->code_ptes[page_id] = *sandbox_pteps->code_pteps[page_id];
        }
    }
    return 0;
}

/// @brief Write a saved PTE value back into the page table, if the live entry differs from it
/// @param ptep Pointer to the live page table entry
/// @param old_pte The saved value that the entry should have
/// @param vaddr Virtual address mapped by the entry; its translation is invalidated after
///              the entry is rewritten
static void restore_pte(pte_t_ *ptep, pte_t_ old_pte, uint64_t vaddr)
{
    // compare the two entries as raw 64-bit values
    const uint64_t saved_raw = *(uint64_t *)&old_pte;
    const uint64_t live_raw = *(uint64_t *)ptep;

    // the entry was not modified; leave it (and the cached translation) alone
    if (live_raw == saved_raw)
        return;

    *ptep = old_pte;
    native_page_invalidate(vaddr);
}

/// @brief Restore the original PTEs for all sandbox pages.
/// @param void
/// @return
int restore_orig_host_permissions(void)
{
    ASSERT(sandbox_pteps->util_pteps[0] != NULL, "restore_orig_host_permissions");
    ASSERT(sandbox_pteps->data_pteps[0] != NULL, "restore_orig_host_permissions");
    ASSERT(sandbox_pteps->code_pteps[0] != NULL, "restore_orig_host_permissions");

    // restore the original PTEs for the util pages
    for (int i = 0; i < N_UTIL_PAGES; i++) {
        restore_pte(sandbox_pteps->util_pteps[i], orig_ptes->util_ptes[i],
                    (uint64_t)sandbox->util + i * PAGE_SIZE);
    }

    // restore the original PTEs for the code and data pages of the sandbox
    for (int actor_id = 0; actor_id < n_actors; actor_id++) {
        // restore the original PTEs for the data pages of the actor
        for (int i = 0; i < N_DATA_PAGES_PER_ACTOR; i++) {
            int page_id = actor_id * N_DATA_PAGES_PER_ACTOR + i;
            restore_pte(sandbox_pteps->data_pteps[page_id], orig_ptes->data_ptes[page_id],
                        (uint64_t)&sandbox->data[actor_id] + i * PAGE_SIZE);
        }
        // restore the original PTEs for the code pages of the actor
        for (int i = 0; i < N_CODE_PAGES_PER_ACTOR; i++) {
            int page_id = actor_id * N_CODE_PAGES_PER_ACTOR + i;
            restore_pte(sandbox_pteps->code_pteps[page_id], orig_ptes->code_ptes[page_id],
                        (uint64_t)&sandbox->code[actor_id] + i * PAGE_SIZE);
        }
    }
    return 0;
}

/// @brief Configures the page table entries for those sandbox pages that are mapped into
/// user-type actors
/// @details The util pages are always made user-accessible. Data and code pages are made
///          user-accessible only for actors whose privilege level is PL_USER. The translation
///          of every modified page is invalidated.
///          Requires the PTE pointers to be cached already (see cache_host_pteps).
/// @param void
/// @return 0 on success; non-zero if the PTE pointers are not cached
int set_user_pages(void)
{
    // the source label must name this function, so that a failure is reported correctly
    ASSERT(sandbox_pteps->util_pteps[0] != NULL, "set_user_pages");
    ASSERT(sandbox_pteps->data_pteps[0] != NULL, "set_user_pages");
    ASSERT(sandbox_pteps->code_pteps[0] != NULL, "set_user_pages");

    // enable user access to util pages so that the actors can store measurement results
    for (int i = 0; i < N_UTIL_PAGES; i++) {
        set_user_bit(sandbox_pteps->util_pteps[i]);
        native_page_invalidate((uint64_t)sandbox->util + i * PAGE_SIZE);
    }

    // enable user access to code and data pages of the sandbox that belong to user actors
    for (int actor_id = 0; actor_id < n_actors; actor_id++) {
        // skip non-user actors
        actor_metadata_t *actor = &actors[actor_id];
        if (actor->pl != PL_USER) {
            continue;
        }

        // configure PTEs for each area of the actor sandbox
        for (int i = 0; i < N_DATA_PAGES_PER_ACTOR; i++) {
            int page_id = actor_id * N_DATA_PAGES_PER_ACTOR + i;
            set_user_bit(sandbox_pteps->data_pteps[page_id]);
            native_page_invalidate((uint64_t)&sandbox->data[actor_id] + i * PAGE_SIZE);
        }
        for (int i = 0; i < N_CODE_PAGES_PER_ACTOR; i++) {
            int page_id = actor_id * N_CODE_PAGES_PER_ACTOR + i;
            set_user_bit(sandbox_pteps->code_pteps[page_id]);
            native_page_invalidate((uint64_t)&sandbox->code[actor_id] + i * PAGE_SIZE);
        }
    }

    return 0;
}

/// @brief Fast modification of the faulty page host PTE; sets the permissions according to
/// actor_t->data_permissions
/// @param void
void set_faulty_page_host_permissions(void)
{
    for (int actor_id = 0; actor_id < n_actors; actor_id++) {
        uint64_t pte_mask = actors[actor_id].data_permissions;
        uint64_t mask_set = pte_mask & MODIFIABLE_PTE_BITS;
        uint64_t mask_clear = pte_mask | ~MODIFIABLE_PTE_BITS;

        int page_id = actor_id * N_DATA_PAGES_PER_ACTOR + FAULTY_PAGE_ID;
        pte_t_ *ptep = sandbox_pteps->data_pteps[page_id];
        faulty_ptes[actor_id] = *ptep;
        uint64_t org_value = *(uint64_t *)ptep;
        uint64_t pte = (org_value | mask_set) & mask_clear;
        // PRINT_ERR("set_faulty_page_host_permissions: actor %d, pte 0x%llx -> 0x%llx", actor_id,
        //   org_value, pte);

        if (pte != org_value) {
            *(uint64_t *)ptep = pte;
            native_page_invalidate((uint64_t)&sandbox->data[actor_id] + FAULTY_PAGE_ID * PAGE_SIZE);
        }
    }
}

/// @brief Fast recovery of original permissions of the faulty page host PTE
/// @param void
void restore_faulty_page_host_permissions(void)
{
    for (int actor_id = 0; actor_id < n_actors; actor_id++) {
        int page_id = actor_id * N_DATA_PAGES_PER_ACTOR + FAULTY_PAGE_ID;
        *sandbox_pteps->data_pteps[page_id] = faulty_ptes[actor_id];
        native_page_invalidate((uint64_t)&sandbox->data[actor_id] + FAULTY_PAGE_ID * PAGE_SIZE);
    }
}

// =================================================================================================
/// @brief Constructor of the page table manager: allocates the bookkeeping structures for a
///        sandbox with a single actor
/// @details Allocates `orig_ptes` (saved PTE values), `sandbox_pteps` (cached PTE pointers) and
///          `faulty_ptes` (saved faulty-page PTEs). The per-actor arrays are grown later by
///          cache_host_pteps() and store_orig_host_permissions() when more actors are used.
///          The element types match the ones used by those functions (pte_t_ and pte_t_ *).
/// @param void
/// @return 0 on success; a non-zero error code if an allocation fails
///         (NOTE(review): relies on CHECKED_ZALLOC returning from this function on failure -
///         confirm in shortcuts.h)
int init_page_table_manager(void)
{
    // saved PTE values
    orig_ptes = CHECKED_ZALLOC(sizeof(sandbox_ptes_t));
    orig_ptes->data_ptes = CHECKED_ZALLOC(N_DATA_PAGES_PER_ACTOR * sizeof(pte_t_));
    orig_ptes->code_ptes = CHECKED_ZALLOC(N_CODE_PAGES_PER_ACTOR * sizeof(pte_t_));
    orig_ptes->util_ptes = CHECKED_ZALLOC(N_UTIL_PAGES * sizeof(pte_t_));

    // cached pointers to the live PTEs
    sandbox_pteps = CHECKED_ZALLOC(sizeof(sandbox_pteps_t));
    sandbox_pteps->data_pteps = CHECKED_ZALLOC(N_DATA_PAGES_PER_ACTOR * sizeof(pte_t_ *));
    sandbox_pteps->code_pteps = CHECKED_ZALLOC(N_CODE_PAGES_PER_ACTOR * sizeof(pte_t_ *));
    sandbox_pteps->util_pteps = CHECKED_ZALLOC(N_UTIL_PAGES * sizeof(pte_t_ *));

    // one saved faulty-page PTE per actor
    faulty_ptes = CHECKED_ZALLOC(sizeof(pte_t_));
    return 0;
}

/// @brief Destructor of the page table manager: frees everything allocated by
///        init_page_table_manager() and by the later reallocations
/// @details Safe to call after a partially failed initialization: a container that was never
///          allocated is skipped instead of being dereferenced.
/// @param void
/// @return void
void free_page_table_manager(void)
{
    // cached PTE pointers
    if (sandbox_pteps) {
        SAFE_FREE(sandbox_pteps->data_pteps);
        SAFE_FREE(sandbox_pteps->code_pteps);
        SAFE_FREE(sandbox_pteps->util_pteps);
        SAFE_FREE(sandbox_pteps);
    }

    // saved PTE values
    if (orig_ptes) {
        SAFE_FREE(orig_ptes->data_ptes);
        SAFE_FREE(orig_ptes->code_ptes);
        SAFE_FREE(orig_ptes->util_ptes);
        SAFE_FREE(orig_ptes);
    }

    SAFE_FREE(faulty_ptes);
}


================================================
FILE: rvzr/executor_km/readme.md
================================================
# Install

See https://microsoft.github.io/side-channel-fuzzer/quick-start/ or `README.md` in the project root.

# Using the executor

Use the Revizor CLI (`revizor.py`).
This executor is not meant to be used standalone.

At your own peril, you could try using it directly, through the `/sys/rvzr_executor/` pseudo file system.
You can find an example of how to use it in `rvzr/tests/x86_tests/kernel_module.bats`.
But I promise you, there will come a point when your machine will crash or hang.
Better not.


================================================
FILE: rvzr/executor_km/sandbox_manager.c
================================================
/// File: Sandbox memory management
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#include "hardware_desc.h"

#include "actor.h"
#include "code_loader.h" // loaded_test_case_entry
#include "main.h"        // set_memory_x, set_memory_nx
#include "sandbox_manager.h"
#include "shortcuts.h"
#include "test_case_parser.h"

#include "page_tables_guest.h"
#include "page_tables_host.h"

// Descriptor of the sandbox; its pointers are set by init_sandbox_pointers()
sandbox_t *sandbox = NULL; // global

// Util+Data allocation state (alloc_pages + vmap)
static struct {
    void *vaddr_unaligned;    // vmap'd virtual address (unaligned)
    void *vaddr_aligned;      // aligned to 2-page boundary
    struct page **page_array; // array of page pointers for vmap
    int num_pages;            // number of pages allocated
} util_data = {NULL, NULL, NULL, 0};

// Code area of the sandbox (vmalloc'ed by allocate_code)
static void *code = NULL;
// Number of pages of `code` that were made executable; used to revert them in safe_free_code
static size_t old_x_size = 0;

/// @brief Release the Util+Data area: remove its virtual mapping and free its physical pages
/// @details Does nothing for the parts that are not allocated, so it can be called at any time.
static void safe_free_util_data(void)
{
    // 1. remove the virtual mapping
    if (util_data.vaddr_unaligned != NULL) {
        vunmap(util_data.vaddr_unaligned);
        util_data.vaddr_aligned = NULL;
        util_data.vaddr_unaligned = NULL;
    }

    // 2. free the physical pages and the page pointer array
    if (util_data.page_array == NULL)
        return;

    // the pages come from one higher-order allocation that starts at page_array[0]
    struct page *first_page = util_data.page_array[0];
    __free_pages(first_page, get_order(util_data.num_pages * PAGE_SIZE));

    kfree(util_data.page_array);
    util_data.page_array = NULL;
}

/// @brief Release the Code area (vmalloc), after making its pages non-executable again
/// @details Does nothing if the Code area is not allocated. Also clears the test case entry
///          point, which points into the freed area.
static void safe_free_code(void)
{
    if (!code)
        return;

    // revert the set_memory_x() done at allocation time before the memory is returned
    set_memory_nx((unsigned long)code, old_x_size);
    SAFE_VFREE(code);
    loaded_test_case_entry = NULL;
}

/// @brief Initialize sandbox pointers after allocation
/// @return 0 on success, -ENOMEM on failure
static int init_sandbox_pointers(void)
{
    if (!sandbox) {
        sandbox = CHECKED_MALLOC(sizeof(sandbox_t));
    }
    sandbox->data = (actor_data_t *)((unsigned long)util_data.vaddr_aligned + sizeof(util_t));
    sandbox->code = (actor_code_t *)code;
    sandbox->util = (util_t *)util_data.vaddr_aligned;
    loaded_test_case_entry = code;
    return 0;
}

/// @brief Allocate memory for the Util and Data areas of the sandbox
/// @details
/// Requirements:
/// 1. Physical contiguity - Prime+Probe needs contiguous physical pages for PIPT caches
/// 2. 4KB page tables - the executor manipulates individual PTEs (impossible with huge pages)
/// 3. 8KB alignment - the memory must start on a 2-page boundary
///
/// Approach: alloc_pages() + vmap()
/// - kmalloc does not fit: physically contiguous BUT the direct mapping uses huge pages
/// - vmalloc does not fit: 4KB PTEs BUT not physically contiguous
/// - alloc_pages + vmap: physically contiguous AND mapped through new 4KB page tables
///
/// Any previous Util+Data allocation is released first. The result is stored in `util_data`.
///
/// @param n_actors Number of actors
/// @return 0 on success, -ENOMEM on failure
static int allocate_util_and_data(size_t n_actors)
{
    // start from scratch: drop the previous allocation, if any
    safe_free_util_data();

    // util area + one data area per actor + a spare 4KB page that leaves room for 8KB alignment
    size_t alloc_size = sizeof(util_t) + n_actors * sizeof(actor_data_t) + 0x1000;
    int order = get_order(alloc_size);
    util_data.num_pages = DIV_ROUND_UP(alloc_size, PAGE_SIZE);

    // one zeroed, physically contiguous block of pages
    struct page *first_page = alloc_pages(GFP_KERNEL | __GFP_ZERO, order);
    if (first_page == NULL) {
        PRINT_ERR("Error allocating util_and_data pages\n");
        return -ENOMEM;
    }

    // vmap() expects an array with one page pointer per mapped page
    util_data.page_array = kmalloc(util_data.num_pages * sizeof(struct page *), GFP_KERNEL);
    if (util_data.page_array == NULL) {
        __free_pages(first_page, order);
        PRINT_ERR("Error allocating page array\n");
        return -ENOMEM;
    }
    for (int idx = 0; idx < util_data.num_pages; idx++)
        util_data.page_array[idx] = &first_page[idx];

    // map the pages into the kernel virtual address space
    void *mapping = vmap(util_data.page_array, util_data.num_pages, VM_MAP, PAGE_KERNEL);
    util_data.vaddr_unaligned = mapping;
    if (mapping == NULL) {
        kfree(util_data.page_array);
        __free_pages(first_page, order);
        util_data.page_array = NULL;
        PRINT_ERR("Error mapping util_and_data pages\n");
        return -ENOMEM;
    }

    // the usable area starts at the first 2-page (8KB) boundary inside the mapping
    util_data.vaddr_aligned = (void *)ALIGN((unsigned long)mapping, 0x2000);

    return 0;
}

/// @brief Allocate memory for the Code area of the sandbox
/// @details
/// The area is vmalloc'ed (physical contiguity is not required here), which gives it 4KB page
/// table entries that can be manipulated individually. After allocation the area is filled by
/// reset_code_area() and made executable with set_memory_x().
/// Any previous Code allocation is released first.
/// NOTE(review): reset_code_area() sizes its fill by the global `n_actors`, not by this
/// function's parameter - callers presumably keep the two equal; confirm.
/// @param n_actors Number of actors (each gets its own code area)
/// @return 0 on success, error code on failure
static int allocate_code(size_t n_actors)
{
    const size_t code_size = n_actors * sizeof(actor_code_t);

    // drop the previous allocation, if any
    safe_free_code();

    code = CHECKED_VMALLOC(code_size);
    reset_code_area();

    // remember how many pages become executable; safe_free_code() needs it to revert them
    old_x_size = DIV_ROUND_UP(code_size, PAGE_SIZE);
    set_memory_x((unsigned long)code, old_x_size);

    return 0;
}

/// @brief Wipe the code area: overwrite the code of all actors with NOP instructions and place
///        a single return instruction at the very beginning (the main section)
/// @param void
/// @return void
void reset_code_area(void)
{
#if defined(ARCH_X86_64)
    // x86-64: one-byte NOPs everywhere, then a RET as the first instruction
    uint8_t *code_bytes = (uint8_t *)code;
    memset(code_bytes, 0x90, sizeof(actor_code_t) * n_actors);
    code_bytes[0] = '\xC3';
#elif defined(ARCH_ARM)
    // ARM: 4-byte NOPs everywhere, then a RET as the first instruction
    uint32_t *code_words = (uint32_t *)code;
    for (int i = 0; i < n_actors * sizeof(actor_code_t) / 4; i += 1)
        code_words[i] = 0xd503201f;
    code_words[0] = 0xd65f03c0;
#endif
}

/// @brief Prepare the sandbox memory for the current test case
/// @details If the test case has more actors than the sandbox can currently hold, the Util,
///          Data, and Code areas are reallocated. Afterwards the Util and Data areas are
///          zeroed, the host PTE pointers are cached, and - if the test case contains VM
///          actors - the guest page tables are allocated and the sandbox is mapped into guest
///          memory.
///          The allocators free the old areas before requesting new ones. The recorded
///          capacity is therefore dropped to zero before reallocation starts, so that a failed
///          reallocation is always retried by the next call instead of leaving later calls to
///          work on freed memory.
/// @param void
/// @return 0 on success; the error code of the first failing step otherwise
int allocate_sandbox(void)
{
    int err = 0;
    // number of actors that the allocated sandbox is known to hold; 0 if it must be reallocated
    static int old_n_actors = 1;

    // Allocate sandbox in host memory
    if (old_n_actors < n_actors) {
        // from here on the old areas are gone; if any step below fails, the zero capacity
        // forces the next call to allocate again, whatever its number of actors
        old_n_actors = 0;

        err = allocate_util_and_data(n_actors);
        CHECK_ERR("allocate_util_and_data");

        err = allocate_code(n_actors);
        CHECK_ERR("allocate_code");

        err = init_sandbox_pointers();
        CHECK_ERR("init_sandbox_pointers");
    }

    // Make sure that everything is properly initialized
    memset(util_data.vaddr_aligned, 0, sizeof(util_t) + n_actors * sizeof(actor_data_t));

    err = cache_host_pteps();
    CHECK_ERR("cache_host_pteps");

    // when necessary, map the sandbox into guest memory and allocate VM management data structures
    if (test_case->features.includes_vm_actors) {
        err = allocate_guest_page_tables();
        CHECK_ERR("allocate_guest_page_tables");

        err = map_sandbox_to_guest_memory();
        CHECK_ERR("map_sandbox_to_guest_memory");
    }
    old_n_actors = n_actors;

    return err;
}

/// @brief Compute the size of the sandbox in pages: util area + data areas + code areas of all
///        actors, each of the three rounded up to whole pages
/// @param void
/// @return number of pages; -1 if the sandbox is not allocated
int get_sandbox_size_pages(void)
{
    if (sandbox == NULL)
        return -1;

    const size_t util_pages = DIV_ROUND_UP(sizeof(util_t), PAGE_SIZE);
    const size_t data_pages = DIV_ROUND_UP(sizeof(actor_data_t) * n_actors, PAGE_SIZE);
    const size_t code_pages = DIV_ROUND_UP(sizeof(actor_code_t) * n_actors, PAGE_SIZE);

    return util_pages + data_pages + code_pages;
}

/// @brief Configure the sandbox page table entries for the current test case
/// @details The original entries are saved first, so that they can be restored by
///          restore_orig_sandbox_page_tables(). User access is then enabled if (and only if)
///          the test case contains user actors.
/// @param void
/// @return 0 on success; the error code of the failing step otherwise
int set_sandbox_page_tables(void)
{
    int err;

    err = store_orig_host_permissions();
    CHECK_ERR("store_orig_host_permissions");

    // nothing else to configure without user actors
    if (!test_case->features.includes_user_actors)
        return 0;

    err = set_user_pages();
    CHECK_ERR("set_user_pages");

    return 0;
}

/// @brief Undo set_sandbox_page_tables(): write the saved host PTEs of the sandbox back
/// @details The status returned by restore_orig_host_permissions() is not propagated.
/// @param void
/// @return void
void restore_orig_sandbox_page_tables(void)
{
    restore_orig_host_permissions();
}

/// @brief Fast modification of the faulty page PTE; sets the permissions according to
/// actor_t->data_permissions
/// @details Applies the change at three levels, in this order: host page tables, guest page
///          tables, and EPT. The counterpart is restore_faulty_page_permissions().
void set_faulty_page_permissions(void)
{
    set_faulty_page_host_permissions();
    set_faulty_page_guest_permissions();
    set_faulty_page_ept_permissions();
}

/// @brief Fast recovery of original permissions of the faulty page PTE
///
/// Delegates, in this order, to the host, guest, and EPT variants of the restore helper,
/// i.e., the same order that set_faulty_page_permissions() uses for its helpers.
void restore_faulty_page_permissions(void)
{
    restore_faulty_page_host_permissions();
    restore_faulty_page_guest_permissions();
    restore_faulty_page_ept_permissions();
}

// =================================================================================================
/// @brief Initializes the sandbox manager: allocates a sandbox for a single actor, sets up
///        the sandbox pointers, and self-tests the memory layout against the hardcoded
///        constants used by the assembly code
/// @param void
/// @return 0 on success; on failure the function exits through CHECK_ERR/ASSERT
///         (NOTE(review): the exact error codes depend on those macros -- see their definitions)
int init_sandbox_manager(void)
{
    // initial allocation is sized for one actor
    int err = allocate_util_and_data(1);
    CHECK_ERR("allocate_util_and_data");

    err = allocate_code(1);
    CHECK_ERR("allocate_code");

    err = init_sandbox_pointers();
    CHECK_ERR("init_sandbox_pointers");

    // ensure that the main_area of the first actor is aligned as expected
    // (i.e., its address is a multiple of 0x2000 bytes)
    int offset = (unsigned long)sandbox->data[0].main_area % 0x2000;
    ASSERT(offset == 0, "init_sandbox_manager");

    // self-test: To enable offset-based accesses in assembly code, we have to hardcode
    //            the layout of the data structures in sandbox_constants.h;
    //            This naturally creates a risk of mismatches, so we perform sanity checks here
    //            to ensure that the layout is as expected.
    // Offsets within the util area are measured from the start of util_t
    util_t *util = sandbox->util;
    ASSERT(&util->l1d_priming_area[0] - (uint8_t *)util == L1D_PRIMING_OFFSET, "init_sandbox");
    ASSERT((uint8_t *)&util->vars.stored_rsp - (uint8_t *)util == STORED_RSP_OFFSET,
           "init_sandbox");
    ASSERT((uint8_t *)&util->vars.latest_measurement - (uint8_t *)util == MEASUREMENT_OFFSET,
           "init_sandbox");
    // Offsets within the actor data are measured from the start of the first actor's main_area
    actor_data_t *data = &sandbox->data[0];
    ASSERT(&data->main_area[0] - (uint8_t *)util == UTIL_REL_TO_MAIN, "init_sandbox");
    ASSERT(&data->main_area[0] - &data->macro_stack[64] == MACRO_STACK_TOP_OFFSET, "init_sandbox");
    ASSERT(&data->faulty_area[0] - &data->main_area[0] == FAULTY_AREA_OFFSET, "init_sandbox");
    ASSERT(&data->reg_init_area[0] - &data->main_area[0] == REG_INIT_OFFSET, "init_sandbox");
    ASSERT(&data->overflow_pad[0] - &data->main_area[0] == OVERFLOW_PAD_OFFSET, "init_sandbox");
    ASSERT(sizeof(measurement_t) == MEASUREMENT_SIZE, "init_sandbox");

    return 0;
}

/// @brief Tears down the sandbox manager: releases the util/data area, the code area, and
///        the guest page tables, in this order
/// @param void
void free_sandbox_manager(void)
{
    safe_free_util_data();
    safe_free_code();
    free_guest_page_tables();
}


================================================
FILE: rvzr/executor_km/test_case_parser.c
================================================
/// File:
///   - Parsing of test cases in RCBF format (see docs/devel/binary-formats.md)
///   - Management of TC-related data structures
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#include "test_case_parser.h"
#include "macro_expansion.h"
#include "main.h"
#include "shortcuts.h"

// Descriptor of the test case that is currently loaded (or being loaded)
test_case_t *test_case = NULL;   // global
// Shortcut to test_case->actor_table
actor_metadata_t *actors = NULL; // global
// Number of actors in the current test case
size_t n_actors = 1;             // global

// Number of entries in the symbol table of the current test case
static size_t n_symbols;

static int new_test_case(test_case_t **test_case_p);

// =================================================================================================
// State machine for test case loading
// =================================================================================================
// true from the moment the header has been parsed until the last section has been received
static bool _is_receiving_test_case = false;
// position within the byte stream of the test case that is being received
static uint64_t _cursor = 0;
// actor/symbol counts used for the most recent (re)allocation of the buffers below;
// the buffers are reallocated only when a test case needs more entries than that
static size_t highest_n_actors = 0;
static size_t highest_n_symbols = 0;
// backing buffers that are reused across test cases; test_case_t only holds pointers to them
static actor_metadata_t *_allocated_actor_table;
static tc_symbol_entry_t *_allocated_symbol_table;
static tc_section_metadata_entry_t *_allocated_metadata;
static tc_section_t *_allocated_data;

/// @brief Begin parsing a new test case: read the header, size the test case tables accordingly,
///        (re)allocate and clear the backing buffers, and publish the new globals
/// @param buf A pointer to the buffer containing (at least) the header of the test case
/// @return Number of header bytes consumed on success;
///         -ENOMEM if the test case descriptor cannot be created
static int __batch_tc_parsing_start(const char *buf)
{
    // The header is a pair of 64-bit words: the number of actors, then the number of symbols
    const uint64_t *header = (const uint64_t *)buf;
    int ret = 0;

    // Rewind the parser
    _cursor = 0;

    // Drop the descriptor of the previous test case and start from a fresh one
    SAFE_FREE(test_case);
    if (new_test_case(&test_case)) {
        PRINT_ERRS("__batch_tc_parsing_start", "Failed to create test case\n");
        return -ENOMEM;
    }

    // Header word 0: the number of actors
    uint64_t new_n_actors = header[0];
    ASSERT(new_n_actors > 0, "__batch_tc_parsing_start");
    ret += 8;

    // Header word 1: the number of symbols
    uint64_t new_n_symbols = header[1];
    ASSERT_MSG(new_n_symbols <= MAX_SYMBOLS, "__batch_tc_parsing_start",
               "n_symbols (%llu) > MAX_SYMBOLS (%u)\n", new_n_symbols, MAX_SYMBOLS);
    ret += 8;

    // Derive the size of every table from the two counters
    test_case->sections_size = new_n_actors * sizeof(tc_section_t);
    test_case->metadata_size = new_n_actors * sizeof(tc_section_metadata_entry_t);
    test_case->symbol_table_size = new_n_symbols * sizeof(tc_symbol_entry_t);
    test_case->actor_table_size = new_n_actors * sizeof(actor_metadata_t);

    // Grow the symbol table buffer if this test case needs more room than any previous one
    if (!_allocated_symbol_table || new_n_symbols > highest_n_symbols) {
        SAFE_FREE(_allocated_symbol_table);
        // +1 to have a valid allocation if the test case is empty
        _allocated_symbol_table = CHECKED_MALLOC(test_case->symbol_table_size + 1);
        highest_n_symbols = new_n_symbols;
    }

    // Same for the three per-actor buffers, which always grow together
    if (!_allocated_data || new_n_actors > highest_n_actors) {
        SAFE_FREE(_allocated_actor_table);
        SAFE_FREE(_allocated_metadata);
        SAFE_VFREE(_allocated_data);
        _allocated_actor_table = CHECKED_MALLOC(test_case->actor_table_size);
        _allocated_metadata = CHECKED_MALLOC(test_case->metadata_size);
        _allocated_data = CHECKED_VMALLOC(test_case->sections_size);
        highest_n_actors = new_n_actors;
    }

    // Wipe the whole capacity of every buffer, not only the part used by this test case
    memset(_allocated_data, 0, highest_n_actors * sizeof(tc_section_t));
    memset(_allocated_metadata, 0, highest_n_actors * sizeof(tc_section_metadata_entry_t));
    memset(_allocated_symbol_table, 0, highest_n_symbols * sizeof(tc_symbol_entry_t));
    memset(_allocated_actor_table, 0, highest_n_actors * sizeof(actor_metadata_t));

    // Attach the buffers to the new descriptor
    test_case->sections = _allocated_data;
    test_case->metadata = _allocated_metadata;
    test_case->symbol_table = _allocated_symbol_table;
    test_case->actor_table = _allocated_actor_table;

    // set globals
    actors = test_case->actor_table;
    n_actors = new_n_actors;
    n_symbols = new_n_symbols;

    ASSERT(ret < PAGE_SIZE, "__batch_tc_parsing_start");
    return ret;
}

/// @brief Finalize parsing:
///        - do sanity checks
///        - set test case features
///        - type-check actor switch targets
/// @param void
/// @return Error code; 0 if successful
static int __batch_tc_parsing_end(void)
{
    // Make sure that macros in the symbol table are ordered by owner and offset;
    // the symbol table contains measurement start/end; and contains the main function at offset 0
    bool macros_ordered = true;
    bool has_start, has_end = false;
    bool has_main = false;
    tc_symbol_entry_t *prev_e = NULL;
    for (tc_symbol_entry_t *e = test_case->symbol_table; e < test_case->symbol_table + n_symbols;
         e++) {
        // check for start, end, and main
        if (e->id == MACRO_MEASUREMENT_START)
            has_start = true;
        if (e->id == MACRO_MEASUREMENT_END)
            has_end = true;
        if (e->owner == 0 && e->offset == 0)
            has_main = true;

        // check ordering
        if (prev_e && e->id != NONMACRO_FUNCTION && prev_e->id != NONMACRO_FUNCTION) {
            if (e->owner < prev_e->owner)
                macros_ordered = false;
            if (e->owner == prev_e->owner && e->offset < prev_e->offset)
                macros_ordered = false;
        }

        // check targets
        if (e->id == MACRO_SET_K2U_TARGET)
            ASSERT((actors[e->args & 0xFF].pl == PL_USER), "__batch_tc_parsing_end");
        if (e->id == MACRO_SET_U2K_TARGET)
            ASSERT((actors[e->args & 0xFF].pl == PL_KERNEL), "__batch_tc_parsing_end");
        if (e->id == MACRO_SET_H2G_TARGET)
            ASSERT((actors[e->args & 0xFF].mode == MODE_GUEST), "__batch_tc_parsing_end");
        if (e->id == MACRO_SET_G2H_TARGET)
            ASSERT((actors[e->args & 0xFF].mode == MODE_HOST), "__batch_tc_parsing_end");

        prev_e = e;
    }
    if (!macros_ordered) {
        PRINT_ERRS("__batch_tc_parsing_end", "Macros in the symbol table are not ordered\n");
        return -1;
    }
    if (!has_start || !has_end) {
        PRINT_ERRS("__batch_tc_parsing_end", "Symbol table does not contain measurement "
                                             "start/end\n");
        return -1;
    }
    if (!has_main) {
        PRINT_ERRS("__batch_tc_parsing_end", "Symbol table does not contain main function\n");
        return -1;
    }

    // Set test case features
    for (int i = 0; i < n_actors; i++) {
        if (actors[i].mode == MODE_GUEST) {
            test_case->features.includes_vm_actors = true;
            break;
        }
        if (actors[i].pl == PL_USER) {
            test_case->features.includes_user_actors = true;
            break;
        }
    }

    bool fault_handler_found = false;
    for (tc_symbol_entry_t *e = test_case->symbol_table; e < test_case->symbol_table + n_symbols;
         e++) {
        if (e->id == MACRO_FAULT_HANDLER) {
            fault_handler_found = true;
            break;
        }
    }
    test_case->features.has_explicit_fault_handler = fault_handler_found;
    return 0;
}

/// @brief Copy the next chunk of input into a table that is filled incrementally
/// @param table      Destination table
/// @param table_size Total size of the table in bytes
/// @param offset     Number of bytes of the table that have been filled already
/// @param buf        Input bytes
/// @param count      Number of bytes available in buf
/// @return Number of bytes copied, i.e., min(table_size - offset, count)
static size_t __copy_table_chunk(void *table, size_t table_size, size_t offset, const char *buf,
                                 size_t count)
{
    size_t n_bytes;

    if (offset >= table_size)
        return 0;

    n_bytes = table_size - offset;
    if (n_bytes > count)
        n_bytes = count;

    memcpy((char *)table + offset, buf, n_bytes);
    return n_bytes;
}

/// @brief Parse (a portion of) the test case sent via sysfs in the RCBF format
///        (see docs/devel/binary-formats.md for details)
///
/// The parser is a state machine that is advanced by repeated calls. Each call handles exactly
/// one part of the stream -- the header, the actor table, the symbol table, the section metadata,
/// or the code of one section -- and reports how many bytes of buf it consumed.
///
/// @param buf      Buffer with the next bytes of the test case
/// @param count    Number of bytes available in buf
/// @param finished [out] Set to true once the last section has been received;
///                 must be false on entry
/// @return Number of bytes consumed; -1 on error
///         (a failed ASSERT exits through the macro instead)
ssize_t parse_test_case_buffer(const char *buf, size_t count, bool *finished)
{
    ASSERT(*finished == false, "parse_test_case_buffer");

    static size_t curr_section_id = 0;
    static size_t curr_section_start = 0;
    static size_t curr_section_end = 0;
    ssize_t consumed_bytes = 0;

    // Positions in the stream at which the tables end. They are derived from the header,
    // hence they are meaningful (and test_case is only accessed) once the header was parsed.
    size_t actor_table_end = 0;
    size_t symbol_table_end = 0;
    size_t metadata_end = 0;
    if (_is_receiving_test_case) {
        actor_table_end = TC_HEADER_SIZE + test_case->actor_table_size;
        symbol_table_end = actor_table_end + test_case->symbol_table_size;
        metadata_end = symbol_table_end + test_case->metadata_size;
    }

    if (!_is_receiving_test_case) // Starting a new batch
    {
        // The previous transfer may have been aborted in the middle of the sections;
        // make sure its bookkeeping does not leak into the new test case
        curr_section_id = 0;
        curr_section_start = 0;
        curr_section_end = 0;

        // The header must be fully contained in the first buffer
        if (count < (size_t)TC_HEADER_SIZE) {
            PRINT_ERRS("parse_test_case_buffer", "Error parsing header\n");
            return -1;
        }

        consumed_bytes = __batch_tc_parsing_start(buf);
        if (consumed_bytes != TC_HEADER_SIZE) {
            PRINT_ERRS("parse_test_case_buffer", "Error parsing header\n");
            return -1;
        }

        _cursor += consumed_bytes;
        _is_receiving_test_case = true;
    } else if (_cursor < actor_table_end) // Parsing actor table
    {
        size_t copied = __copy_table_chunk(test_case->actor_table, test_case->actor_table_size,
                                           _cursor - TC_HEADER_SIZE, buf, count);
        _cursor += copied;
        consumed_bytes = copied;
    } else if (_cursor < symbol_table_end) // Parsing symbol table
    {
        size_t copied = __copy_table_chunk(test_case->symbol_table, test_case->symbol_table_size,
                                           _cursor - actor_table_end, buf, count);
        _cursor += copied;
        consumed_bytes = copied;
    } else if (_cursor < metadata_end) // Parsing metadata
    {
        size_t copied = __copy_table_chunk(test_case->metadata, test_case->metadata_size,
                                           _cursor - symbol_table_end, buf, count);
        _cursor += copied;
        consumed_bytes = copied;
    } else // Parsing data
    {
        if (curr_section_id == 0) {
            curr_section_start = metadata_end;
            curr_section_end = metadata_end + test_case->metadata[0].size;
        }
        // Check that the section is not too large
        if (test_case->metadata[curr_section_id].size > MAX_SECTION_SIZE) {
            PRINT_ERRS("parse_test_case_buffer", "Section size exceeds MAX_SECTION_SIZE\n");
            curr_section_id = 0;
            curr_section_start = 0;
            curr_section_end = 0;
            _is_receiving_test_case = false;
            return -1;
        }

        size_t byte_id = 0;
        size_t func_cursor = _cursor - curr_section_start;
        bool func_finished = false;
        for (; byte_id < count;) {
            test_case->sections[curr_section_id].code[func_cursor] = buf[byte_id];
            byte_id++;
            func_cursor++;
            if (func_cursor >= test_case->metadata[curr_section_id].size) {
                func_finished = true;
                break;
            }
        }
        _cursor = func_cursor + curr_section_start;
        consumed_bytes = byte_id;

        if (func_finished) {
            curr_section_id++;
            curr_section_start = curr_section_end;
            // the metadata table has only n_actors entries; do not read past its end
            // after the last section
            if (curr_section_id < n_actors)
                curr_section_end = curr_section_end + test_case->metadata[curr_section_id].size;
        }
    }

    // Check whether we are done
    if (curr_section_id >= n_actors) {
        curr_section_id = 0;
        curr_section_start = 0;
        curr_section_end = 0;

        _is_receiving_test_case = false;
        *finished = true;

        if (__batch_tc_parsing_end())
            return -1;

        ASSERT_MSG(consumed_bytes == count, "parse_test_case_buffer",
                   "consumed_bytes (%lu) != count (%lu)\n", consumed_bytes, count);
    }

    return consumed_bytes;
}

/// @brief Tells whether the parser is idle, i.e., it is not in the middle of receiving
///        a test case (the negation of _is_receiving_test_case)
/// @param void
/// @return true if no test case transfer is in progress; false otherwise
bool tc_parsing_completed(void)
{
    if (_is_receiving_test_case)
        return false;

    return true;
}

// =================================================================================================

/// @brief Allocates a test case descriptor and fills it with defaults: tables sized for
///        a single actor and no symbols, pointers to the shared backing buffers, and
///        all feature flags cleared
/// @param test_case_p [out] Receives the pointer to the new descriptor
/// @return 0 on success; -ENOMEM on error
static int new_test_case(test_case_t **test_case_p)
{
    test_case_t *fresh;

    fresh = CHECKED_MALLOC(sizeof(*fresh));
    memset(fresh, 0, sizeof(*fresh)); // zero out just in case

    // the descriptor does not own the tables; it only points to the shared buffers
    fresh->sections = _allocated_data;
    fresh->metadata = _allocated_metadata;
    fresh->symbol_table = _allocated_symbol_table;
    fresh->actor_table = _allocated_actor_table;

    // default layout: one actor, no symbols
    fresh->sections_size = sizeof(tc_section_t);
    fresh->metadata_size = sizeof(tc_section_metadata_entry_t);
    fresh->symbol_table_size = 0;
    fresh->actor_table_size = sizeof(actor_metadata_t);

    // features are detected only when parsing is finalized
    fresh->features.has_explicit_fault_handler = false;
    fresh->features.includes_user_actors = false;
    fresh->features.includes_vm_actors = false;

    *test_case_p = fresh;
    return 0;
}

/// @brief Prepares the parser for use: resets the parsing state, allocates minimal backing
///        buffers (room for a single actor), and installs a dummy test case
/// @param void
/// @return 0 on success; -ENOMEM if the dummy test case cannot be created
int init_test_case_parser(void)
{
    // parsing state
    n_symbols = 0;
    _is_receiving_test_case = false;
    _cursor = 0;

    // minimal buffers; they are replaced when a larger test case arrives
    _allocated_actor_table = CHECKED_MALLOC(sizeof(actor_metadata_t));
    _allocated_symbol_table = CHECKED_MALLOC(1);
    _allocated_metadata = CHECKED_MALLOC(sizeof(tc_section_metadata_entry_t));
    _allocated_data = CHECKED_VMALLOC(sizeof(tc_section_t));

    // placeholder test case, so that the globals are valid before the first upload
    if (new_test_case(&test_case)) {
        PRINT_ERRS("init_test_case_parser", "Failed to create test case\n");
        return -ENOMEM;
    }

    actors = test_case->actor_table;
    return 0;
}

/// @brief Releases everything owned by the parser: the backing buffers and the test case
///        descriptor; the global actor shortcut is cleared as well
/// @param void
void free_test_case_parser(void)
{
    // the shortcut points into the actor table that is about to be freed
    actors = NULL;

    SAFE_VFREE(_allocated_data);
    SAFE_FREE(_allocated_metadata);
    SAFE_FREE(_allocated_symbol_table);
    SAFE_FREE(_allocated_actor_table);
    SAFE_FREE(test_case);
}


================================================
FILE: rvzr/executor_km/x86/asm_snippets.h
================================================
/// File: Building blocks for creating macros; x86-64
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#ifndef X86_ASM_SNIPPETS_H_
#define X86_ASM_SNIPPETS_H_
// clang-format off

#include "hardware_desc.h"
#include "measurement.h"
#include "registers.h"
#include <asm/msr-index.h>

#ifndef VENDOR_ID
#error "VENDOR_ID is not defined! Make sure to include this header late enough."
#endif

/// State machine of the tracing process
/// Each macro expands to a single `mov` that writes a status constant (STATUS_STARTED or
/// STATUS_ENDED) into STATUS_REGISTER_8
/// (presumably the 8-bit view of the status register -- see registers.h)
#define SET_SR_STARTED()       "mov "STATUS_REGISTER_8", "xstr(STATUS_STARTED)" \n"
#define SET_SR_ENDED()         "mov "STATUS_REGISTER_8", "xstr(STATUS_ENDED)" \n"


/// Accessors to MSRs
///
/// Both macros read the MSR selected by ID (a string with the MSR index), serialize the read
/// with lfence on both sides, and merge the two result halves (rdx:rax) into a 64-bit value
/// in rdx. READ_MSR_START subtracts that value from DEST and READ_MSR_END adds it, so a
/// START/END pair leaves in DEST its previous content plus the change of the MSR in between.

/// @brief DEST -= MSR[ID]
// clobber: rax, rcx, rdx
#define READ_MSR_START(ID, DEST)                          \
        "mov rcx, "ID"                           \n"      \
        "lfence; rdmsr; lfence                   \n"      \
        "shl rdx, 32; or rdx, rax                \n"      \
        "sub "DEST", rdx                         \n"

/// @brief DEST += MSR[ID]
// clobber: rax, rcx, rdx
#define READ_MSR_END(ID, DEST)                            \
        "mov rcx, "ID"                           \n"      \
        "lfence; rdmsr; lfence                   \n"      \
        "shl rdx, 32; or rdx, rax                \n"      \
        "add "DEST", rdx                         \n"


/// Accessors to Performance Counters
///

/// @brief Read the performance counter selected by ID (a string with the counter index)
///        via rdpmc, fenced by lfence on both sides; the 64-bit result is left in rdx
// clobber: rax, rcx, rdx
#define READ_ONE_PFC(ID) \
        "mov rcx, "ID" \n"      \
        "lfence; rdpmc; lfence \n" \
        "shl rdx, 32; or rdx, rax \n"

/// @brief Subtract the current values of counters 1, 2, and 3 from PFC0, PFC1, and PFC2,
///        respectively (note that counter 0 is not touched here)
// clobber: rax, rcx, rdx
#define READ_PFC_START() \
        READ_ONE_PFC("1") \
        "sub "PFC0", rdx \n" \
        READ_ONE_PFC("2") \
        "sub "PFC1", rdx \n" \
        READ_ONE_PFC("3") \
        "sub "PFC2", rdx \n"

/// @brief Add the current values of counters 1, 2, and 3 to PFC0, PFC1, and PFC2,
///        respectively; paired with READ_PFC_START, this accumulates the counter deltas
// clobber: rax, rcx, rdx
#define READ_PFC_END() \
        READ_ONE_PFC("1") \
        "add "PFC0", rdx \n" \
        READ_ONE_PFC("2") \
        "add "PFC1", rdx \n" \
        READ_ONE_PFC("3") \
        "add "PFC2", rdx \n"


/// Detection of System Management Interrupts (SMIs)
///
/// The SMI bookkeeping lives in STATUS_REGISTER[63:32]; the lower 32 bits are left untouched
/// by the macros below. The Intel and AMD variants differ only in how the counter is read
/// (rdmsr of MSR_SMI_COUNT vs. rdpmc of counter 5).

/// @brief Clear the upper 32 bits of the STATUS_REGISTER
///        (a 32-bit register move onto itself zero-extends into the full 64-bit register)
#define CLEAR_SMI_STATUS() \
   "mov "STATUS_REGISTER_32", "STATUS_REGISTER_32" \n"

#if VENDOR_ID == VENDOR_INTEL_
/// @brief Start monitoring SMIs by reading the current value of the SMI counter (MSR_SMI_COUNT)
///        and storing its negated lower 32 bits in the STATUS_REGISTER[63:32]
///  clobber: rax, rcx, rdx
#define READ_SMI_START()               \
    "mov rcx, "xstr(MSR_SMI_COUNT)"\n" \
    "lfence; rdmsr; lfence         \n" \
    "mov rcx, 0                    \n" \
    "sub ecx, eax                  \n" \
    "shl rcx, 32                   \n" \
    CLEAR_SMI_STATUS()                 \
    "or "STATUS_REGISTER", rcx     \n"

/// @brief End monitoring SMIs by reading the current value of the SMI counter (MSR_SMI_COUNT)
///        and adding it to the negated start value, so that the difference between
///        the current and the previous value ends up in the STATUS_REGISTER[63:32]
/// clobber: rax, rcx, rdx
#define READ_SMI_END()                 \
    "mov rcx, "xstr(MSR_SMI_COUNT)"\n" \
    "lfence; rdmsr; lfence         \n" \
    "mov rcx, "STATUS_REGISTER"    \n" \
    "shr rcx, 32                   \n" \
    "add ecx, eax                  \n" \
    "shl rcx, 32                   \n" \
    CLEAR_SMI_STATUS()                 \
    "or "STATUS_REGISTER", rcx     \n"
#elif VENDOR_ID == VENDOR_AMD_
/// @brief Start monitoring SMIs by reading the current value of the SMI counter (PMU ID 5)
///        and storing its negated lower 32 bits in the STATUS_REGISTER[63:32]
///  clobber: rax, rcx, rdx
#define READ_SMI_START()            \
    "mov rcx, 5                 \n" \
    "lfence; rdpmc; lfence      \n" \
    "mov rcx, 0                 \n" \
    "sub ecx, eax               \n" \
    "shl rcx, 32                \n" \
    CLEAR_SMI_STATUS()              \
    "or "STATUS_REGISTER", rcx  \n"

/// @brief End monitoring SMIs by reading the current value of the SMI counter (PMU ID 5)
///        and adding it to the negated start value, so that the difference between
///        the current and the previous value ends up in the STATUS_REGISTER[63:32]
/// clobber: rax, rcx, rdx
#define READ_SMI_END()              \
    "mov rcx, 5                 \n" \
    "lfence; rdpmc; lfence      \n" \
    "mov rcx, "STATUS_REGISTER" \n" \
    "shr rcx, 32                \n" \
    "add ecx, eax               \n" \
    "shl rcx, 32                \n" \
    CLEAR_SMI_STATUS()              \
    "or "STATUS_REGISTER", rcx  \n"

#endif


/// A sequence of instructions that attempts to set the pipeline to a uniform state,
/// regardless of the code that was executed before it. The idea is that if we execute
/// a whole bunch of fences, it will give time for the uops that are currently in
/// the reservation station to get executed, and thus ensure that the test case
/// starts with an empty-ish pipeline
///
/// Unlike most macros in this file, this one expands to a complete `asm volatile(...)`
/// statement (135 lfence instructions) rather than to a string fragment; the expansion
/// already ends with a semicolon.
/// clobber: none
#define PIPELINE_RESET() asm volatile(""\
    "lfence; lfence; lfence; lfence; lfence \n" \
    "lfence; lfence; lfence; lfence; lfence \n" \
    "lfence; lfence; lfence; lfence; lfence \n" \
    "lfence; lfence; lfence; lfence; lfence \n" \
    "lfence; lfence; lfence; lfence; lfence \n" \
    "lfence; lfence; lfence; lfence; lfence \n" \
    "lfence; lfence; lfence; lfence; lfence \n" \
    "lfence; lfence; lfence; lfence; lfence \n" \
    "lfence; lfence; lfence; lfence; lfence \n" \
    "lfence; lfence; lfence; lfence; lfence \n" \
    "lfence; lfence; lfence; lfence; lfence \n" \
    "lfence; lfence; lfence; lfence; lfence \n" \
    "lfence; lfence; lfence; lfence; lfence \n" \
    "lfence; lfence; lfence; lfence; lfence \n" \
    "lfence; lfence; lfence; lfence; lfence \n" \
    "lfence; lfence; lfence; lfence; lfence \n" \
    "lfence; lfence; lfence; lfence; lfence \n" \
    "lfence; lfence; lfence; lfence; lfence \n" \
    "lfence; lfence; lfence; lfence; lfence \n" \
    "lfence; lfence; lfence; lfence; lfence \n" \
    "lfence; lfence; lfence; lfence; lfence \n" \
    "lfence; lfence; lfence; lfence; lfence \n" \
    "lfence; lfence; lfence; lfence; lfence \n" \
    "lfence; lfence; lfence; lfence; lfence \n" \
    "lfence; lfence; lfence; lfence; lfence \n" \
    "lfence; lfence; lfence; lfence; lfence \n" \
    "lfence; lfence; lfence; lfence; lfence \n");

/// Register Loading
///
/// SET_REGISTER_FROM_INPUT() expands to a complete `asm volatile(...)` statement that:
///   1. points rsp at MEMORY_BASE_REG + REG_INIT_OFFSET,
///   2. pops, in this order, rax, rbx, rcx, rdx, rsi, rdi, and the flags register from there,
///   3. points rsp at MEMORY_BASE_REG + LOCAL_RSP_OFFSET and copies it into rbp.
/// The snippet switches the assembler to Intel syntax and back to AT&T syntax at the end.
/// NOTE: the Intel and AMD variants below are currently identical.
#if VENDOR_ID == 1 // Intel
#define SET_REGISTER_FROM_INPUT()\
    asm volatile("\n.intel_syntax noprefix\n" \
    "lea rsp, ["MEMORY_BASE_REG" + "xstr(REG_INIT_OFFSET)"]\n" \
    "pop rax \n" \
    "pop rbx \n" \
    "pop rcx \n" \
    "pop rdx \n" \
    "pop rsi \n" \
    "pop rdi \n" \
    "popfq \n" \
    "lea rsp, ["MEMORY_BASE_REG" + "xstr(LOCAL_RSP_OFFSET)"]\n" \
    "mov rbp, rsp \n" \
    ".att_syntax noprefix");

#elif VENDOR_ID == 2 // AMD
#define SET_REGISTER_FROM_INPUT()\
    asm volatile("\n.intel_syntax noprefix\n" \
    "lea rsp, ["MEMORY_BASE_REG" + "xstr(REG_INIT_OFFSET)"]\n" \
    "pop rax \n" \
    "pop rbx \n" \
    "pop rcx \n" \
    "pop rdx \n" \
    "pop rsi \n" \
    "pop rdi \n" \
    "popfq \n" \
    "lea rsp, ["MEMORY_BASE_REG" + "xstr(LOCAL_RSP_OFFSET)"]\n" \
    "mov rbp, rsp \n" \
    ".att_syntax noprefix");
#endif

// =================================================================================================
// L1D Prime+Probe
// =================================================================================================
// TODO: generate this code dynamically
//
// PRIME_ONE_SET(BASE, OFFSET, TMP) and PROBE_ONE_SET(BASE, OFFSET) perform L1D_ASSOCIATIVITY
// memory accesses that start at BASE + OFFSET and are spaced 4096 bytes apart.
// Supported associativities are 2, 4, 8, and 12; any other value is a compile-time error.
//  - Every access is an `add` of the loaded value into the register that also serves as
//    the index of the next access, so each load depends on the previous one.
//    NOTE(review): the index stays equal to OFFSET only if the accessed memory holds zeroes;
//    confirm that the area passed as BASE is zero-initialized.
//  - PRIME_ONE_SET uses TMP as the index register and follows every instruction with mfence.
//  - PROBE_ONE_SET always uses (and clobbers) rax as the index register and does not fence
//    the initial mov.
#if L1D_ASSOCIATIVITY == 2
#define PRIME_ONE_SET(BASE, OFFSET, TMP)                 \
        "mov "TMP", "OFFSET"                ; mfence \n" \
        "add "TMP", ["BASE" + "TMP"]        ; mfence \n" \
        "add "TMP", ["BASE" + "TMP" + 4096] ; mfence \n"

#define PROBE_ONE_SET(BASE, OFFSET)                  \
        "mov rax, "OFFSET"                       \n" \
        "add rax, ["BASE" + rax]        ; mfence \n" \
        "add rax, ["BASE" + rax + 4096] ; mfence \n"

#elif L1D_ASSOCIATIVITY == 4
#define PRIME_ONE_SET(BASE, OFFSET, TMP)                 \
        "mov "TMP", "OFFSET"                ; mfence \n" \
        "add "TMP", ["BASE" + "TMP"]        ; mfence \n" \
        "add "TMP", ["BASE" + "TMP" + 4096] ; mfence \n" \
        "add "TMP", ["BASE" + "TMP" + 8192] ; mfence \n" \
        "add "TMP", ["BASE" + "TMP" + 12288]; mfence \n"

#define PROBE_ONE_SET(BASE, OFFSET)                  \
        "mov rax, "OFFSET"                       \n" \
        "add rax, ["BASE" + rax]        ; mfence \n" \
        "add rax, ["BASE" + rax + 4096] ; mfence \n" \
        "add rax, ["BASE" + rax + 8192] ; mfence \n" \
        "add rax, ["BASE" + rax + 12288]; mfence \n"

#elif L1D_ASSOCIATIVITY == 8
#define PRIME_ONE_SET(BASE, OFFSET, TMP)                 \
        "mov "TMP", "OFFSET"                ; mfence \n" \
        "add "TMP", ["BASE" + "TMP"]        ; mfence \n" \
        "add "TMP", ["BASE" + "TMP" + 4096] ; mfence \n" \
        "add "TMP", ["BASE" + "TMP" + 8192] ; mfence \n" \
        "add "TMP", ["BASE" + "TMP" + 12288]; mfence \n" \
        "add "TMP", ["BASE" + "TMP" + 16384]; mfence \n" \
        "add "TMP", ["BASE" + "TMP" + 20480]; mfence \n" \
        "add "TMP", ["BASE" + "TMP" + 24576]; mfence \n" \
        "add "TMP", ["BASE" + "TMP" + 28672]; mfence \n"

#define PROBE_ONE_SET(BASE, OFFSET)                  \
        "mov rax, "OFFSET"                       \n" \
        "add rax, ["BASE" + rax]        ; mfence \n" \
        "add rax, ["BASE" + rax + 4096] ; mfence \n" \
        "add rax, ["BASE" + rax + 8192] ; mfence \n" \
        "add rax, ["BASE" + rax + 12288]; mfence \n" \
        "add rax, ["BASE" + rax + 16384]; mfence \n" \
        "add rax, ["BASE" + rax + 20480]; mfence \n" \
        "add rax, ["BASE" + rax + 24576]; mfence \n" \
        "add rax, ["BASE" + rax + 28672]; mfence \n"

#elif L1D_ASSOCIATIVITY == 12
#define PRIME_ONE_SET(BASE, OFFSET, TMP)                 \
        "mov "TMP", "OFFSET"                ; mfence \n" \
        "add "TMP", ["BASE" + "TMP"]        ; mfence \n" \
        "add "TMP", ["BASE" + "TMP" + 4096] ; mfence \n" \
        "add "TMP", ["BASE" + "TMP" + 8192] ; mfence \n" \
        "add "TMP", ["BASE" + "TMP" + 12288]; mfence \n" \
        "add "TMP", ["BASE" + "TMP" + 16384]; mfence \n" \
        "add "TMP", ["BASE" + "TMP" + 20480]; mfence \n" \
        "add "TMP", ["BASE" + "TMP" + 24576]; mfence \n" \
        "add "TMP", ["BASE" + "TMP" + 28672]; mfence \n" \
        "add "TMP", ["BASE" + "TMP" + 32768]; mfence \n" \
        "add "TMP", ["BASE" + "TMP" + 36864]; mfence \n" \
        "add "TMP", ["BASE" + "TMP" + 40960]; mfence \n" \
        "add "TMP", ["BASE" + "TMP" + 45056]; mfence \n"

#define PROBE_ONE_SET(BASE, OFFSET)                  \
        "mov rax, "OFFSET"                       \n" \
        "add rax, ["BASE" + rax]        ; mfence \n" \
        "add rax, ["BASE" + rax + 4096] ; mfence \n" \
        "add rax, ["BASE" + rax + 8192] ; mfence \n" \
        "add rax, ["BASE" + rax + 12288]; mfence \n" \
        "add rax, ["BASE" + rax + 16384]; mfence \n" \
        "add rax, ["BASE" + rax + 20480]; mfence \n" \
        "add rax, ["BASE" + rax + 24576]; mfence \n" \
        "add rax, ["BASE" + rax + 28672]; mfence \n" \
        "add rax, ["BASE" + rax + 32768]; mfence \n" \
        "add rax, ["BASE" + rax + 36864]; mfence \n" \
        "add rax, ["BASE" + rax + 40960]; mfence \n" \
        "add rax, ["BASE" + rax + 45056]; mfence \n"

#else
#error "Unexpected associativity"
#endif

/// @brief Prime the cache: run PRIME_ONE_SET for every offset 0, 64, ..., 4032 of BASE
///        (64 offsets in total), and repeat the whole walk REPS times
/// BASE, OFFSET, TMP, COUNTER are register names and REPS is an immediate, all given as strings;
/// OFFSET, TMP, and COUNTER are overwritten. The snippet uses the local labels 1 and 2.
// clobber: none (besides the registers passed as OFFSET, TMP, and COUNTER)
#define PRIME(BASE, OFFSET, TMP, COUNTER, REPS)                 \
        "mfence                                             \n" \
        "mov "COUNTER", "REPS"                              \n" \
        "   1: mov "OFFSET", 0                              \n" \
        "       2: lfence                                   \n" \
                PRIME_ONE_SET(BASE, OFFSET, TMP)                \
        "       add "OFFSET", 64                            \n" \
        "   cmp "OFFSET", 4096; jl 2b                       \n" \
        "dec "COUNTER"; jnz 1b                              \n" \
        "mfence;                                            \n"


/// @brief Probe the cache (Intel variant): for every offset 0, 64, ..., 4032 of BASE, measure
///        the change of performance counter 0 across PROBE_ONE_SET and record one bit in DEST
/// DEST is shifted left by one on every iteration, so the result is a 64-bit map in which
/// the first probed offset ends up in the most significant bit. The bit is 1 if the counter
/// advanced by fewer than L1D_ASSOCIATIVITY events, and 0 otherwise.
/// NOTE(review): the event counted by counter 0 is configured elsewhere; presumably it counts
/// L1D hits here, so that a 1 marks a set with at least one evicted line -- confirm.
/// OFFSET, TMP, and DEST are overwritten. The snippet uses the local labels 1, 2, and 3.
// clobber: rax, rcx, rdx
#define PROBE_INTEL(BASE, OFFSET, TMP, DEST)            \
        "xor "DEST", "DEST"                         \n" \
        "xor "OFFSET", "OFFSET"                     \n" \
        "1: lfence                                  \n" \
        "   xor "TMP", "TMP"                        \n" \
            READ_ONE_PFC("0")                           \
        "   sub "TMP", rdx                          \n" \
            PROBE_ONE_SET(BASE, OFFSET)                 \
            READ_ONE_PFC("0")                           \
        "   add "TMP", rdx                          \n" \
        "   cmp "TMP", "xstr(L1D_ASSOCIATIVITY)"    \n" \
        "   jl 2f                                   \n" \
        "      shl "DEST", 1                        \n" \
        "      jmp 3f                               \n" \
        "   2:                                      \n" \
        "      shl "DEST", 1                        \n" \
        "      or "DEST", 1                         \n" \
        "   3:                                      \n" \
        "   add "OFFSET", 64                        \n" \
        "cmp "OFFSET", 4096; jl 1b                  \n"

/// @brief Probe the cache (AMD variant): for every offset 0, 64, ..., 4032 of BASE, measure
///        the change of performance counter 0 across PROBE_ONE_SET and record one bit in DEST
/// DEST is shifted left by one on every iteration, so the result is a 64-bit map in which
/// the first probed offset ends up in the most significant bit. The bit is 1 if the counter
/// advanced at all (delta > 0), and 0 otherwise.
/// NOTE(review): the event counted by counter 0 is configured elsewhere; presumably it counts
/// L1D misses here -- confirm.
/// OFFSET, TMP, and DEST are overwritten. The snippet uses the local labels 1, 2, and 3.
// clobber: rax, rcx, rdx
#define PROBE_AMD(BASE, OFFSET, TMP, DEST)              \
        "xor "DEST", "DEST"                         \n" \
        "xor "OFFSET", "OFFSET"                     \n" \
        "1: lfence                                  \n" \
        "   xor "TMP", "TMP"                        \n" \
            READ_ONE_PFC("0")                           \
        "   sub "TMP", rdx                          \n" \
            PROBE_ONE_SET(BASE, OFFSET)                 \
            READ_ONE_PFC("0")                           \
        "   add "TMP", rdx                          \n" \
        "   cmp "TMP", 0; jg 2f                     \n" \
        "      shl "DEST", 1                        \n" \
        "      jmp 3f                               \n" \
        "   2:                                      \n" \
        "      shl "DEST", 1                        \n" \
        "      or "DEST", 1                         \n" \
        "   3:                                      \n" \
        "   add "OFFSET", 64                        \n" \
        "cmp "OFFSET", 4096; jl 1b                  \n"

// Vendor dispatch: PROBE maps to PROBE_INTEL when VENDOR_ID is 1 and to PROBE_AMD when it is 2;
// for any other VENDOR_ID, PROBE is left undefined
#if VENDOR_ID == 1
#define PROBE(BASE, OFFSET, TMP, DEST) PROBE_INTEL(BASE, OFFSET, TMP, DEST)
#elif VENDOR_ID == 2
#define PROBE(BASE, OFFSET, TMP, DEST) PROBE_AMD(BASE, OFFSET, TMP, DEST)
#endif

// =================================================================================================
// Partial Prime+Probe (P+P applied to a subset of L1D instead of the whole cache)
// =================================================================================================
/// @brief Same as PRIME, except that the walk stops at offset 3840 instead of 4096, i.e.,
///        only the first 60 of the 64 offsets are primed
/// OFFSET, TMP, and COUNTER are overwritten. The snippet uses the local labels 1 and 2.
#define PRIME_PARTIAL(BASE, OFFSET, TMP, COUNTER, REPS)         \
        "mfence                                             \n" \
        "mov "COUNTER", "REPS"                              \n" \
        "   1: mov "OFFSET", 0                              \n" \
        "       2: lfence                                   \n" \
                PRIME_ONE_SET(BASE, OFFSET, TMP)                \
        "       add "OFFSET", 64                            \n" \
        "   cmp "OFFSET", 3840; jl 2b                       \n" \
        "dec "COUNTER"; jnz 1b                              \n" \
        "mfence;                                            \n"

// =================================================================================================
// L1D Flush+Reload
// =================================================================================================

/// @brief Flush the 4096-byte region that starts at BASE: clflush is executed for every
///        offset 0, 64, ..., 4032; the loop is enclosed by mfence on both sides
/// OFFSET is overwritten. The snippet uses the local label 1.
// clobber: none (besides the register passed as OFFSET)
#define FLUSH(BASE, OFFSET) \
        "mfence                                     \n" \
        "mov "OFFSET", 0                            \n" \
        "1: lfence                                  \n" \
        "   clflush qword ptr ["BASE" + "OFFSET"]   \n" \
        "   add "OFFSET", 64                        \n" \
        "cmp "OFFSET", 4096; jl 1b                  \n" \
        "mfence                                     \n"

// Reload step of Flush+Reload, Intel variant.
// All arguments are string literals spliced into the instruction text.
// DEST and OFFSET are zeroed first. Then, for every 64-byte step of OFFSET in [0, 4096):
//   - TMP is zeroed, READ_ONE_PFC("0") is expanded, and rdx is subtracted from TMP;
//   - a qword is loaded from [BASE + OFFSET] into rax;
//   - READ_ONE_PFC("0") is expanded again and rdx is added to TMP
//     (presumably rdx holds the counter value produced by READ_ONE_PFC, which would make TMP
//      the counter delta across the load - confirm against the READ_ONE_PFC definition);
//   - DEST is shifted left by one, and its lowest bit is set if TMP != 0.
// DEST thus collects one bit per step; earlier offsets end up in higher bit positions.
// clobber: rax, rcx, rdx
#define RELOAD_INTEL(BASE, OFFSET, TMP, DEST)           \
        "xor "DEST", "DEST"                         \n" \
        "xor "OFFSET", "OFFSET"                     \n" \
        "1:                                         \n" \
        "   xor "TMP", "TMP"                        \n" \
            READ_ONE_PFC("0")                           \
        "   sub "TMP", rdx                          \n" \
        "   mov rax, qword ptr ["BASE" + "OFFSET"]  \n" \
            READ_ONE_PFC("0")                           \
        "   add "TMP", rdx                          \n" \
        "   cmp "TMP", 0; jne 2f                    \n" \
        "      shl "DEST", 1                        \n" \
        "      jmp 3f                               \n" \
        "   2:                                      \n" \
        "      shl "DEST", 1                        \n" \
        "      or "DEST", 1                         \n" \
        "   3:                                      \n" \
        "   add "OFFSET", 64                        \n" \
        "cmp "OFFSET", 4096; jl 1b                  \n"

// Reload step of Flush+Reload, AMD variant.
// All arguments are string literals spliced into the instruction text.
// DEST and OFFSET are zeroed first. Then, for every 64-byte step of OFFSET in [0, 4096):
//   - TMP is zeroed, READ_ONE_PFC("0") is expanded, and rdx is subtracted from TMP;
//   - a qword is loaded from [BASE + OFFSET] into rax;
//   - READ_ONE_PFC("0") is expanded again and rdx is added to TMP
//     (presumably rdx holds the counter value produced by READ_ONE_PFC, which would make TMP
//      the counter delta across the load - confirm against the READ_ONE_PFC definition);
//   - DEST is shifted left by one, and its lowest bit is set if TMP == 0.
// The only difference from the Intel variant is the polarity of the final test
// (je instead of jne).
// DEST thus collects one bit per step; earlier offsets end up in higher bit positions.
// clobber: rax, rcx, rdx
#define RELOAD_AMD(BASE, OFFSET, TMP, DEST)             \
        "xor "DEST", "DEST"                         \n" \
        "xor "OFFSET", "OFFSET"                     \n" \
        "1:                                         \n" \
        "   xor "TMP", "TMP"                        \n" \
            READ_ONE_PFC("0")                           \
        "   sub "TMP", rdx                          \n" \
        "   mov rax, qword ptr ["BASE" + "OFFSET"]  \n" \
            READ_ONE_PFC("0")                           \
        "   add "TMP", rdx                          \n" \
        "   cmp "TMP", 0; je 2f                     \n" \
        "      shl "DEST", 1                        \n" \
        "      jmp 3f                               \n" \
        "   2:                                      \n" \
        "      shl "DEST", 1                        \n" \
        "      or "DEST", 1                         \n" \
        "   3:                                      \n" \
        "   add "OFFSET", 64                        \n" \
        "cmp "OFFSET", 4096; jl 1b                  \n"

// Compile-time selection of the RELOAD implementation:
// VENDOR_ID == 1 selects RELOAD_INTEL, VENDOR_ID == 2 selects RELOAD_AMD.
// For any other VENDOR_ID value, RELOAD is left undefined by this block.
#if VENDOR_ID == 1
#define RELOAD(BASE, OFFSET, TMP, DEST) RELOAD_INTEL(BASE, OFFSET, TMP, DEST)
#elif VENDOR_ID == 2
#define RELOAD(BASE, OFFSET, TMP, DEST) RELOAD_AMD(BASE, OFFSET, TMP, DEST)
#endif

// =================================================================================================
// Macro stack management
// =================================================================================================
/// @brief A sequence of instructions that switches the stack pointer to the macro stack
///        and pushes the registers RAX, RBX, RCX, RDX followed by the flags.
///        The current RSP is first stored at [MEMORY_BASE_REG - MACRO_STACK_TOP_OFFSET - 8];
///        RSP is then pointed at that same slot, so the five pushes land directly below it.
///        MACRO_EPILOGUE() pops the same values in reverse order.
#define MACRO_PROLOGUE()                                                                           \
    "mov qword ptr ["MEMORY_BASE_REG" - " xstr(MACRO_STACK_TOP_OFFSET) " - 8], rsp\n"                            \
    "lea rsp, ["MEMORY_BASE_REG" - " xstr(MACRO_STACK_TOP_OFFSET) " - 8]\n"                                      \
    "push rax\n"                                                                                   \
    "push rbx\n"                                                                                   \
    "push rcx\n"                                                                                   \
    "push rdx\n"                                                                                   \
    "pushf\n"

/// @brief A sequence of instructions that pops the flags and registers RDX, RCX, RBX, RAX, RSP
///        and overwrites the popped memory addresses with zeros.
///        After the first five pops, RSP points at the slot that holds the saved RSP, so the
///        five qwords at [rsp - 0x08] .. [rsp - 0x28] are the slots that were just popped;
///        they are zeroed before the final `pop rsp` switches back to the saved stack pointer.
///        The slot that holds the saved RSP itself is not zeroed by this sequence.
#define MACRO_EPILOGUE()                                                                           \
    "popf\n"                                                                                       \
    "pop rdx\n"                                                                                    \
    "pop rcx\n"                                                                                    \
    "pop rbx\n"                                                                                    \
    "pop rax\n"                                                                                    \
    "mov qword ptr [rsp - 0x08], 0 \n"                                                             \
    "mov qword ptr [rsp - 0x10], 0 \n"                                                             \
    "mov qword ptr [rsp - 0x18], 0 \n"                                                             \
    "mov qword ptr [rsp - 0x20], 0 \n"                                                             \
    "mov qword ptr [rsp - 0x28], 0 \n"                                                             \
    "pop rsp\n"

// clang-format on
#endif // X86_ASM_SNIPPETS_H_


================================================
FILE: rvzr/executor_km/x86/entry_exit_points.h
================================================
/// File: Multiple variants of test case entry and exit points, for x86-64 architecture
///      used exclusively by code_loader.c
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

// -----------------------------------------------------------------------------------------------
// Note on registers.
// Some of the registers are reserved for a specific purpose and should never be overwritten.
// See ./docs/registers.md and registers.h for more information.

#ifndef RVZR_ENTRY_EXIT_H
#define RVZR_ENTRY_EXIT_H

#include "hardware_desc.h"

#include "asm_snippets.h"
#include "registers.h"
#include "sandbox_manager.h"
#include "shortcuts.h"

// Marker values that the template functions below embed into their own code as `.quad` data:
//   TEMPLATE_START                      - emitted before the prologue
//   TEMPLATE_INSERT_TC                  - emitted at the test case placeholder
//   TEMPLATE_DEFAULT_EXCEPTION_LANDING  - emitted in the fault-handler section (jumped over)
//   TEMPLATE_END                        - emitted after the epilogue
// TEMPLATE_MARKER_SIZE is the size of one marker in bytes (a `.quad` is 8 bytes).
// NOTE(review): presumably code_loader.c scans for these values to locate the template
// sections - confirm against code_loader.c.
#define TEMPLATE_START                     0x0fff379000000000
#define TEMPLATE_INSERT_TC                 0x0fff2f9000000000
#define TEMPLATE_DEFAULT_EXCEPTION_LANDING 0x0fff479000000000
#define TEMPLATE_END                       0x0fff279000000000
#define TEMPLATE_MARKER_SIZE               8

// clang-format off
/// @brief Entry sequence of the test case template.
///        Saves registers and flags on the current stack, initializes MEMORY_BASE_REG from rdi
///        and UTIL_BASE_REG relative to it, stores RSP into the util area, zeroes
///        rax, rbx, rcx, rdx, rsi, rdi and r8-r13, initializes HTRACE_REGISTER and
///        STATUS_REGISTER, and finally sets up rbp/rsp for the code that follows.
///        The matching restore sequences are epilogue() and epilogue_dbg_gpr(), which pop the
///        saved values in reverse order.
static inline void prologue(void)
{
    // As we don't use a compiler to track clobbering,
    // we have to save the callee-saved regs
    // (r10 and r11 are saved here as well)
    asm_volatile_intel(
        "push rbx\n"
        "push rbp\n"
        "push r10\n"
        "push r11\n"
        "push r12\n"
        "push r13\n"
        "push r14\n"
        "push r15\n"
        "pushfq\n"

        // MEMORY_BASE_REG = main_area of actor 0
        // (passed in rdi, the first argument of measurement_code)
        "mov "MEMORY_BASE_REG", rdi\n"

        // UTIL_BASE_REG = sandbox->util
        "lea "UTIL_BASE_REG", ["MEMORY_BASE_REG" - "xstr(UTIL_REL_TO_MAIN)"]\n"

        // sandbox->util->stored_rsp = rsp
        // (taken after the pushes above, so the epilogue can pop right after reloading it)
        "mov qword ptr ["UTIL_BASE_REG" + "xstr(STORED_RSP_OFFSET)"], rsp\n"

        // clear the rest of the registers
        "mov rax, 0\n"
        "mov rbx, 0\n"
        "mov rcx, 0\n"
        "mov rdx, 0\n"
        "mov rsi, 0\n"
        "mov rdi, 0\n"
        "mov r8,  0\n"
        "mov r9,  0\n"
        "mov r10, 0\n"
        "mov r11, 0\n"
        "mov r12, 0\n"
        "mov r13, 0\n"

        // initialize special registers
        "mov "HTRACE_REGISTER", 0\n"
        "mov "STATUS_REGISTER", "xstr(STATUS_UNINITIALIZED)"\n"

        // rbp = current stack pointer; rsp is moved 0x1000 bytes below it
        "mov rbp, rsp\n"
        "sub rsp, 0x1000\n"

        // start monitoring interrupts
        READ_SMI_START()
    );

}

/// @brief Exit sequence of the test case template.
///        Writes the measurement (HTRACE_REGISTER, r10, r9, r8, two zero qwords, and
///        STATUS_REGISTER) to UTIL_BASE_REG + MEASUREMENT_OFFSET, reloads RSP from the
///        stored_rsp slot written by prologue(), pops the flags and registers saved by
///        prologue() in reverse order, and returns with rax = 0.
static inline void epilogue(void)
{
    asm_volatile_intel(
        // rbx <- SMI counter
        // NOTE(review): the code visible here does not store rbx into the measurement, and rbx
        // is overwritten by `pop rbx` below; presumably READ_SMI_END consumes the value
        // itself - confirm against its definition
        READ_SMI_END()

        // rax <- &latest_measurement
        "lea rax, ["UTIL_BASE_REG" + "xstr(MEASUREMENT_OFFSET)"]\n"

        // Store the results
        "mov qword ptr [rax + 0x00], "HTRACE_REGISTER" \n"  // HTrace
        "mov qword ptr [rax + 0x08], r10 \n"                // PFC0
        "mov qword ptr [rax + 0x10], r9 \n"                 // PFC1
        "mov qword ptr [rax + 0x18], r8 \n"                 // PFC2
        "mov qword ptr [rax + 0x20], 0 \n"                  // PFC3 (unused)
        "mov qword ptr [rax + 0x28], 0 \n"                  // PFC4 (unused)
        "mov qword ptr [rax + 0x30], "STATUS_REGISTER" \n"  // Measurement status

        // rsp = sandbox->util->stored_rsp
        "mov rsp, qword ptr ["UTIL_BASE_REG" + "xstr(STORED_RSP_OFFSET)"]\n"

        // restore registers
        // (reverse order of the pushes in prologue())
        "popfq\n"
        "pop r15\n"
        "pop r14\n"
        "pop r13\n"
        "pop r12\n"
        "pop r11\n"
        "pop r10\n"
        "pop rbp\n"
        "pop rbx\n"

        // return 0
        "mov rax, 0\n"
        "ret\n"
        "int3\n" // Silences objtool warnings about no int3 after ret
    );
}

/// @brief Debug variant of epilogue(): instead of the hardware trace and performance
///        counters, the first six measurement slots receive the values of
///        rax, rbx, rcx, rdx, rsi and rdi; the seventh slot receives STATUS_REGISTER.
///        The stack/register restore and the `return 0` part are the same as in epilogue().
///        Unlike epilogue(), this variant does not expand READ_SMI_END().
static inline void epilogue_dbg_gpr(void)
{
    asm_volatile_intel(
        // r14 <- &latest_measurement
        // clobber r14; not in use anymore
        "lea r14, ["UTIL_BASE_REG" + "xstr(MEASUREMENT_OFFSET)"]\n"

        // Store the results
        "mov qword ptr [r14 + 0x00], rax\n"
        "mov qword ptr [r14 + 0x08], rbx\n"
        "mov qword ptr [r14 + 0x10], rcx\n"
        "mov qword ptr [r14 + 0x18], rdx\n"
        "mov qword ptr [r14 + 0x20], rsi\n"
        "mov qword ptr [r14 + 0x28], rdi\n"
        "mov qword ptr [r14 + 0x30], "STATUS_REGISTER"\n"

        // rsp = sandbox->util->stored_rsp
        "mov rsp, qword ptr ["UTIL_BASE_REG" + "xstr(STORED_RSP_OFFSET)"]\n"

        // restore registers
        // (reverse order of the pushes in prologue())
        "popfq\n"
        "pop r15\n"
        "pop r14\n"
        "pop r13\n"
        "pop r12\n"
        "pop r11\n"
        "pop r10\n"
        "pop rbp\n"
        "pop rbx\n"

        // return 0
        "mov rax, 0\n"
        "ret\n"
        "int3\n" // Silences objtool warnings about no int3 after ret
    );
}
// clang-format on

/// @brief Code template for the main segment of a test case.
///        The function body is laid out as:
///          TEMPLATE_START marker, prologue, register initialization, pipeline reset,
///          lfence, TEMPLATE_INSERT_TC marker, mfence,
///          a jump over the TEMPLATE_DEFAULT_EXCEPTION_LANDING marker,
///          epilogue, TEMPLATE_END marker.
///        The markers are raw 8-byte values placed in the instruction stream.
///        NOTE(review): presumably this function is never called directly and is only used
///        as a byte template by code_loader.c - confirm against code_loader.c.
static void main_segment_template(void)
{
    asm volatile(".quad " xstr(TEMPLATE_START));
    prologue();

    SET_REGISTER_FROM_INPUT();
    PIPELINE_RESET();

    // test case placeholder
    // (fenced with lfence before and mfence after the marker)
    asm volatile("\nlfence\n");
    asm volatile(".quad " xstr(TEMPLATE_INSERT_TC) "\n");
    asm volatile("\nmfence\n");

    // fault handler
    // (the jmp skips the marker bytes on the fall-through path; label 1 follows the marker)
    asm_volatile_intel(""
                       "jmp 1f\n"
                       ".quad " xstr(TEMPLATE_DEFAULT_EXCEPTION_LANDING) "\n"
                                                                         "1:nop; nop; nop\n");

    epilogue();
    asm volatile(".quad " xstr(TEMPLATE_END));
}

/// @brief Debug variant of main_segment_template().
///        The layout is identical, except that it ends with epilogue_dbg_gpr(), which stores
///        the values of rax, rbx, rcx, rdx, rsi and rdi into the measurement instead of the
///        hardware trace and performance counters.
static void main_segment_template_dbg_gpr(void)
{
    asm volatile(".quad " xstr(TEMPLATE_START));
    prologue();

    SET_REGISTER_FROM_INPUT();
    PIPELINE_RESET();

    // test case placeholder
    // (fenced with lfence before and mfence after the marker)
    asm volatile("\nlfence\n");
    asm volatile(".quad " xstr(TEMPLATE_INSERT_TC) "\n");
    asm volatile("\nmfence\n");

    // fault handler
    // (the jmp skips the marker bytes on the fall-through path; label 1 follows the marker)
    asm_volatile_intel(""
                       "jmp 1f\n"
                       ".quad " xstr(TEMPLATE_DEFAULT_EXCEPTION_LANDING) "\n"
                                                                         "1:nop; nop; nop\n");

    epilogue_dbg_gpr();
    asm volatile(".quad " xstr(TEMPLATE_END));
}

#endif // RVZR_ENTRY_EXIT_H


================================================
FILE: rvzr/executor_km/x86/fault_handlers.S
================================================
// File: Low-level exception handling code for x86-64
//
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT
.intel_syntax noprefix

#include "sandbox_constants.h"
#include "registers.h"

.extern _printk
.extern set_outer_fault_handlers
.extern unset_outer_fault_handlers
.extern run_experiment
.extern recover_orig_state


// =================================================================================================
// Global variables
// =================================================================================================
.data

// Fault-in-progress flag (one quadword, initially 0).
// test_case_handler and bubble_handler set it to 1 when they start handling a fault and go
// straight to recovery if it is already set; nmi_handler sets it unconditionally.
// The symbol is global so that C code can reset it.
.global is_nested_fault
is_nested_fault:
.quad 0

// Stack pointer recorded by run_experiment_outer after it has pushed the saved registers.
// The recovery path and nmi_handler reload RSP from this slot.
fault_recovery_sp:
.quad 0

// Format strings passed to _printk by the code below.
// NOTE(review): every string starts with the octal escape 001 followed by the digit 3;
// presumably this is the printk log-level prefix - confirm against the kernel printk docs.

// Printed by the recovery path of run_experiment_outer (no format arguments)
.Lrecovery_triggered_msg:
.asciz	"\0013[rvzr_executor:run_experiment_outer]\n\
ERROR: Recovery from fault triggered during run_experiment\n"
.align

// Printed by the `unreachable` macro (no format arguments)
.Lunreachable_msg:
.asciz	"\0013[rvzr_executor:rvzr_executor]\n\
ERROR: unreachable code\n"
.align

// Printed by test_case_handler; takes 8 format arguments:
// exception ID, error code, RIP, CS, RFLAGS, RSP, R14, R15
.Ltest_case_handler_msg:
.asciz	"\0013[rvzr_executor:test_case_handler]\n\
ERROR: Unhandled fault in the test case: \n\
    0 [Exception ID]:\t0x%llx\n\
    1 [Error code]:\t0x%llx\n\
    2 [RIP]:\t0x%llx\n\
    3 [CS]:\t0x%llx\n\
    4 [RFLAGS]:\t0x%llx\n\
    5 [RSP]:\t0x%llx\n\
Context:\n\
    R14: \t0x%llx\n\
    R15: \t0x%llx\n"
.align

// Printed by bubble_handler; takes 8 format arguments:
// exception ID, error code, RIP, CS, RFLAGS, RSP,
// address of run_experiment, address of run_experiment_outer
.Lbubble_handler_msg:
.asciz	"\0013[rvzr_executor:bubble_handler]\n\
ERROR: Unexpected fault in run_experiment: \n\
    0 [Exception ID]:\t0x%llx\n\
    1 [Error code]:\t0x%llx\n\
    2 [RIP]:\t0x%llx\n\
    3 [CS]:\t0x%llx\n\
    4 [RFLAGS]:\t0x%llx\n\
    5 [RSP]:\t0x%llx\n\
Context:\n\
    run_experiment:\t\t0x%llx\n\
    run_experiment_outer:\t0x%llx\n"
.align

// Printed by nmi_handler (no format arguments)
.Lnmi_handler_msg:
.asciz	"\0013[rvzr_executor:nmi_handler]\n\
ERROR: Unhandled NMI occurred during run_experiment\n"
.align

// Printed by nested_fault_handler (no format arguments)
.Lnested_fault_msg:
.asciz	"\0013[rvzr_executor:nested_fault]\n\
ERROR: Nested fault detected\n"
.align

// =================================================================================================
// Macros
// =================================================================================================
// Trap for code paths that must never execute: prints .Lunreachable_msg via _printk
// and then executes hlt.
// NOTE(review): rcx is passed as the second _printk argument although the message contains
// no conversion specifiers, so the value appears to be unused - confirm.
.macro unreachable
    lea rdi, .Lunreachable_msg
    mov rsi, rcx
    call _printk
    hlt
.endm

// Generate entry stub for exception WITHOUT error code
//   name: label of the main handler to jump to
//   id:   two-digit hexadecimal vector number (without the 0x prefix)
// Defines the global, 16-byte-aligned label <name>_<id>.
// Clobbers r13.
.macro entry_stub_no_err name, id
.global \name\()_\id
.balign 16
\name\()_\id:
    push 0                // push dummy error code for stack normalization
    mov r13, 0x\id        // set exception ID in r13
    jmp \name             // jump to main handler
.endm

// Generate entry stub for exception WITH error code
//   name: label of the main handler to jump to
//   id:   two-digit hexadecimal vector number (without the 0x prefix)
// Defines the global, 16-byte-aligned label <name>_<id>.
// Unlike entry_stub_no_err, nothing is pushed here, because the error code is expected
// to be on the stack already. Clobbers r13.
.macro entry_stub_err name, id
.global \name\()_\id
.balign 16
\name\()_\id:
    mov r13, 0x\id        // set exception ID in r13 (error code already on stack)
    jmp \name             // jump to main handler
.endm

// C preprocessor macro: Helper to repeat a macro 16 times
//   macro: name of the assembler macro to invoke
//   arg:   first argument, passed through unchanged
//   id:    high hexadecimal digit; the low digit 0..f is appended by token pasting,
//          so id = 2 produces the invocations for 20, 21, ..., 2f
// The 16 invocations are separated by `;` so that they can share one preprocessor line.
#define CALL_16_TIMES(macro, arg, id)                                                              \
    macro arg, id##0; macro arg, id##1; macro arg, id##2; macro arg, id##3;                        \
    macro arg, id##4; macro arg, id##5; macro arg, id##6; macro arg, id##7;                        \
    macro arg, id##8; macro arg, id##9; macro arg, id##a; macro arg, id##b;                        \
    macro arg, id##c; macro arg, id##d; macro arg, id##e; macro arg, id##f;


// =================================================================================================
// Handlers
// =================================================================================================
.text

/// @brief The default handler for interrupts/exceptions that occur during the test case execution.
///        Prints the exception frame together with R14 and R15, calls recover_orig_state,
///        and then jumps to the recovery path of run_experiment_outer.
///        If is_nested_fault is already set on entry, it jumps to the recovery path right away
///        without printing.
/// @param r13: exception ID (set by the entry stub; the error code is passed on the stack)
.global test_case_handler
.balign 4096
test_case_handler:
    // just in case, disable interrupts
    cli

    // check for nested faults
    lea rax, is_nested_fault
    cmp qword ptr [rax], 0
    jne .run_experiment_recovery  // nested fault detected -> go to recovery
    mov qword ptr [rax], 1        // no nested fault -> set the flag

    // Print error info:
    // Note: this function is called by the generated entry stubs (see entry_stub_* below),
    //       which set r13 to the exception ID
    //       and ensure that the stack layout is:
    //          - error code
    //          - RIP
    //          - CS
    //          - RFLAGS
    //          - RSP
    lea rdi, .Ltest_case_handler_msg  // format string
    mov rsi, r13                      // arg 1: Exception ID
    pop rdx                           // arg 2: Error code
    pop rcx                           // arg 3: RIP
    pop r8                            // arg 4: CS
    pop r9                            // arg 5: RFLAGS
    // arg 6+ are passed on stack
    // (pushed in reverse order, so that arg 6 ends up at the lowest address)
    pop rax
    push r15                          // arg 8: R15
    push r14                          // arg 7: R14
    push rax                          // arg 6: RSP
    xor eax, eax   // no vector registers used
    call _printk
    // the pushed arguments are not removed here; the recovery path reloads RSP
    // from fault_recovery_sp anyway

    // ensure that the CPU state is properly restored before we exit
    call recover_orig_state

    jmp .run_experiment_recovery


/// @brief The default handler for interrupts/exceptions that occur inside the code called by
///        run_experiment_outer but outside of the test case itself.
///        Prints the exception frame together with the addresses of run_experiment and
///        run_experiment_outer, calls recover_orig_state, and then jumps to the recovery path
///        of run_experiment_outer. If is_nested_fault is already set on entry, it jumps to the
///        recovery path right away without printing.
/// @param r13: exception ID (set by the entry stub; the error code is passed on the stack)
.global bubble_handler
.balign 4096
bubble_handler:
    // just in case, disable interrupts
    cli

    // check for nested faults
    lea rax, is_nested_fault
    cmp qword ptr [rax], 0
    jne .run_experiment_recovery  // nested fault detected -> go to recovery
    mov qword ptr [rax], 1        // no nested fault -> set the flag

    // Print error info:
    // Note: this function is called by the generated entry stubs (see entry_stub_* below),
    //       which set r13 to the exception ID
    //       and ensure that the stack layout is:
    //          - error code
    //          - RIP
    //          - CS
    //          - RFLAGS
    //          - RSP
    lea rdi, .Lbubble_handler_msg     // format string
    mov rsi, r13                      // arg 1: Exception ID
    pop rdx                           // arg 2: Error code
    pop rcx                           // arg 3: RIP
    pop r8                            // arg 4: CS
    pop r9                            // arg 5: RFLAGS
    // arg 6+ are passed on stack
    // (pushed in reverse order, so that arg 6 ends up at the lowest address)
    pop r10                           // get RSP value
    lea r11, run_experiment           // get run_experiment address
    lea r12, run_experiment_outer     // get run_experiment_outer address
    push r12                          // arg 8: run_experiment_outer
    push r11                          // arg 7: run_experiment
    push r10                          // arg 6: RSP
    xor eax, eax   // no vector registers used
    call _printk
    add rsp, 16    // drop two of the three pushed arguments; RSP is reloaded during recovery

    // ensure that the CPU state is properly restored before we exit
    call recover_orig_state

    jmp .run_experiment_recovery


/// @brief Universal NMI handler. Used by both Bubble and Test Case IDTs.
///        Prints an error message and terminates the measurement:
///        sets is_nested_fault, reloads RSP from fault_recovery_sp, prints the message, and
///        jumps to the recovery path of run_experiment_outer, which returns 1 to the caller
///        of run_experiment_outer.
///        Unlike the other handlers, it does not check is_nested_fault before proceeding.
/// @param void
.global nmi_handler
.balign 4096
nmi_handler:
    // just in case, disable interrupts
    cli

    // flag that we had a fault
    mov qword ptr [is_nested_fault], 1

    // ensure that the stack pointer is valid
    // (done before the call below, which needs a usable stack)
    lea rbx, fault_recovery_sp
    mov rbx, [rbx]
    mov rsp, rbx

    // print error message
    lea rdi, .Lnmi_handler_msg
    call _printk

    // go into recovery
    jmp .run_experiment_recovery


/// @brief Handler for nested faults.
///        Note: Revizor currently does not support handling of multiple faults in a single
///        test case execution. Thus, if a nested fault occurs, we simply print an error message
///        and terminate the measurement.
///        The message is printed on whatever stack is active on entry; RSP is only reset
///        afterwards, by the recovery path of run_experiment_outer.
/// @param void
.global nested_fault_handler
.balign 4096
nested_fault_handler:
    // just in case, disable interrupts
    cli

    // print error message
    lea rdi, .Lnested_fault_msg
    call _printk

    // go into recovery
    jmp .run_experiment_recovery


// =================================================================================================
// Multi-entry handler generation
// =================================================================================================
// This section generates 256 individual entry stubs for each handler (test_case_handler and
// bubble_handler). Each stub normalizes the stack layout (ensures error code is present) and
// passes the exception ID in r13 before jumping to the main handler.
//
// Exceptions that push error codes: 0x08, 0x0a-0x0e, 0x11, 0x15, 0x1d, 0x1e
// For exceptions WITHOUT error code, we push a dummy 0 to normalize the stack layout.
.text

// Generate all 256 entry stubs for test_case_handler
// Vectors 0x00-0x1f are listed one by one because the stub kind differs per vector
// (entry_stub_err for the vectors that push an error code, entry_stub_no_err otherwise).
// Vectors 0x20-0xff all use entry_stub_no_err and are generated 16 at a time.
entry_stub_no_err test_case_handler, 00
entry_stub_no_err test_case_handler, 01
entry_stub_no_err test_case_handler, 02
entry_stub_no_err test_case_handler, 03
entry_stub_no_err test_case_handler, 04
entry_stub_no_err test_case_handler, 05
entry_stub_no_err test_case_handler, 06
entry_stub_no_err test_case_handler, 07
entry_stub_err test_case_handler, 08
entry_stub_no_err test_case_handler, 09
entry_stub_err test_case_handler, 0a
entry_stub_err test_case_handler, 0b
entry_stub_err test_case_handler, 0c
entry_stub_err test_case_handler, 0d
entry_stub_err test_case_handler, 0e
entry_stub_no_err test_case_handler, 0f
entry_stub_no_err test_case_handler, 10
entry_stub_err test_case_handler, 11
entry_stub_no_err test_case_handler, 12
entry_stub_no_err test_case_handler, 13
entry_stub_no_err test_case_handler, 14
entry_stub_err test_case_handler, 15
entry_stub_no_err test_case_handler, 16
entry_stub_no_err test_case_handler, 17
entry_stub_no_err test_case_handler, 18
entry_stub_no_err test_case_handler, 19
entry_stub_no_err test_case_handler, 1a
entry_stub_no_err test_case_handler, 1b
entry_stub_no_err test_case_handler, 1c
entry_stub_err test_case_handler, 1d
entry_stub_err test_case_handler, 1e
entry_stub_no_err test_case_handler, 1f
CALL_16_TIMES(entry_stub_no_err, test_case_handler, 2)
CALL_16_TIMES(entry_stub_no_err, test_case_handler, 3)
CALL_16_TIMES(entry_stub_no_err, test_case_handler, 4)
CALL_16_TIMES(entry_stub_no_err, test_case_handler, 5)
CALL_16_TIMES(entry_stub_no_err, test_case_handler, 6)
CALL_16_TIMES(entry_stub_no_err, test_case_handler, 7)
CALL_16_TIMES(entry_stub_no_err, test_case_handler, 8)
CALL_16_TIMES(entry_stub_no_err, test_case_handler, 9)
CALL_16_TIMES(entry_stub_no_err, test_case_handler, a)
CALL_16_TIMES(entry_stub_no_err, test_case_handler, b)
CALL_16_TIMES(entry_stub_no_err, test_case_handler, c)
CALL_16_TIMES(entry_stub_no_err, test_case_handler, d)
CALL_16_TIMES(entry_stub_no_err, test_case_handler, e)
CALL_16_TIMES(entry_stub_no_err, test_case_handler, f)

// Generate all 256 entry stubs for bubble_handler
// Vectors 0x00-0x1f are listed one by one because the stub kind differs per vector
// (entry_stub_err for the vectors that push an error code, entry_stub_no_err otherwise).
// Vectors 0x20-0xff all use entry_stub_no_err and are generated 16 at a time.
entry_stub_no_err bubble_handler, 00
entry_stub_no_err bubble_handler, 01
entry_stub_no_err bubble_handler, 02
entry_stub_no_err bubble_handler, 03
entry_stub_no_err bubble_handler, 04
entry_stub_no_err bubble_handler, 05
entry_stub_no_err bubble_handler, 06
entry_stub_no_err bubble_handler, 07
entry_stub_err bubble_handler, 08
entry_stub_no_err bubble_handler, 09
entry_stub_err bubble_handler, 0a
entry_stub_err bubble_handler, 0b
entry_stub_err bubble_handler, 0c
entry_stub_err bubble_handler, 0d
entry_stub_err bubble_handler, 0e
entry_stub_no_err bubble_handler, 0f
entry_stub_no_err bubble_handler, 10
entry_stub_err bubble_handler, 11
entry_stub_no_err bubble_handler, 12
entry_stub_no_err bubble_handler, 13
entry_stub_no_err bubble_handler, 14
entry_stub_err bubble_handler, 15
entry_stub_no_err bubble_handler, 16
entry_stub_no_err bubble_handler, 17
entry_stub_no_err bubble_handler, 18
entry_stub_no_err bubble_handler, 19
entry_stub_no_err bubble_handler, 1a
entry_stub_no_err bubble_handler, 1b
entry_stub_no_err bubble_handler, 1c
entry_stub_err bubble_handler, 1d
entry_stub_err bubble_handler, 1e
entry_stub_no_err bubble_handler, 1f
CALL_16_TIMES(entry_stub_no_err, bubble_handler, 2)
CALL_16_TIMES(entry_stub_no_err, bubble_handler, 3)
CALL_16_TIMES(entry_stub_no_err, bubble_handler, 4)
CALL_16_TIMES(entry_stub_no_err, bubble_handler, 5)
CALL_16_TIMES(entry_stub_no_err, bubble_handler, 6)
CALL_16_TIMES(entry_stub_no_err, bubble_handler, 7)
CALL_16_TIMES(entry_stub_no_err, bubble_handler, 8)
CALL_16_TIMES(entry_stub_no_err, bubble_handler, 9)
CALL_16_TIMES(entry_stub_no_err, bubble_handler, a)
CALL_16_TIMES(entry_stub_no_err, bubble_handler, b)
CALL_16_TIMES(entry_stub_no_err, bubble_handler, c)
CALL_16_TIMES(entry_stub_no_err, bubble_handler, d)
CALL_16_TIMES(entry_stub_no_err, bubble_handler, e)
CALL_16_TIMES(entry_stub_no_err, bubble_handler, f)


// =================================================================================================
// run_experiment_outer: Fault-tolerant wrapper for run_experiment
// =================================================================================================
.text

/// @brief A wrapper over run_experiment that ensures that any bugs that cause an
///        exception will be handled gracefully and won't crash the system
///        The wrapper saves the general-purpose registers (except rax and rsp) on the stack,
///        records the resulting stack pointer in fault_recovery_sp, installs the outer fault
///        handlers, and calls run_experiment. The fault handlers in this file jump to
///        .run_experiment_recovery, which reloads RSP from fault_recovery_sp and continues
///        with the common exit path.
/// @param void
/// @return rax: the value left in rax by run_experiment on the normal path;
///              1 if the recovery path was taken
.global run_experiment_outer
.balign 4096
run_experiment_outer:
    // A bug in run_experiment may corrupt the CPU state, so we need to save the current state
    // before calling run_experiment
    push rbx
    push rcx
    push rdx
    push rsi
    push rdi
    push r8
    push r9
    push r10
    push r11
    push r12
    push r13
    push r14
    push r15
    push rbp
    mov rbp, rsp

    // Save the SP into a global variable so that we can recover it after a destructive bug
    lea rax, fault_recovery_sp
    mov [rax], rsp

    // Disable interrupts to avoid nested faults (should already be disabled but just in case)
    cli

    // Set up outer fault handlers
    call set_outer_fault_handlers

    // Run the measurements
    call run_experiment
    jmp .run_experiment_normal_exit

.run_experiment_recovery:
    // START CRITICAL SECTION
    // Note: this section is used to recover from bugs in the executor with possible full corruption
    // of the memory and register state. Thus, the code below has to make as few assumptions
    // as possible, and also be very careful about memory accesses.

    // Overwrite SP with fault_recovery_sp
    // (this puts RSP back to where it was right after the register pushes above)
    lea rbx, fault_recovery_sp
    mov rbx, [rbx]
    mov rsp, rbx

    // Print an error message
    lea rdi, .Lrecovery_triggered_msg
    call _printk

    // Return error code 1
    mov rax, 1

    jmp .run_experiment_normal_exit
    // END CRITICAL SECTION

.run_experiment_normal_exit:
    // preserve err (rax)
    push rax

    // Restore original fault handlers
    call unset_outer_fault_handlers
    pop rax  // restore err

    // Restore the original CPU state
    // (reverse order of the pushes at the top of the function)
    pop rbp
    pop r15
    pop r14
    pop r13
    pop r12
    pop r11
    pop r10
    pop r9
    pop r8
    pop rdi
    pop rsi
    pop rdx
    pop rcx
    pop rbx

    ret
    unreachable


================================================
FILE: rvzr/executor_km/x86/idt.c
================================================
/// File:
///  - Fault handling and IDT management
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#include <linux/interrupt.h>

#include "code_loader.h"
#include "hardware_desc.h"
#include "main.h"
#include "measurement.h"
#include "sandbox_manager.h"
#include "shortcuts.h"
#include "test_case_parser.h"

#include "fault_handler.h"

// Bitmask over exception vectors 0-31: if bit N is set, vector N is dispatched to the main
// handler (when one is given) by idt_set_custom_handlers()
uint32_t handled_faults = 0;          // global
// Main handler installed by set_inner_fault_handlers() for the vectors selected by
// handled_faults; init_fault_handler() points it at test_case_handler
char *fault_handler = NULL;           // global
// IDT register image describing test_case_idt
struct desc_ptr test_case_idtr = {0}; // global

// IDT used while run_experiment runs outside of the test case (256 gates)
static gate_desc *bubble_idt = NULL;
// IDT used while the test case runs (256 gates)
static gate_desc *test_case_idt = NULL;

// IDT register value captured by set_outer_fault_handlers() before the custom IDT is loaded
static struct desc_ptr orig_idtr = {0};
// IDT register image describing bubble_idt
static struct desc_ptr bubble_idtr = {0};

// Declarations from fault_handlers.S
void test_case_handler(void);
void bubble_handler(void);
void nmi_handler(void);
extern uint64_t is_nested_fault;

// Evaluates to 1 if bit number `b` of `a` is set, and to 0 otherwise
#define BIT_CHECK(a, b) ((((a) & (1ULL << (b)))) != 0)

// =================================================================================================
// Handler declarations and lists
// =================================================================================================
// The 256 entry stubs for each handler are generated in fault_handlers.S using assembly macros.
// Here we only declare them and create arrays of pointers for IDT initialization.

// Expands to the prototype of a single entry stub, e.g., `void test_case_handler_0e(void);`
#define MULTI_ENTRY_HANDLER_DECLARATIONS_ID(name, id) void name##_##id(void);
// Expands to the prototypes of all entry stubs of the handler `name`
// (CALL_256_TIMES is defined elsewhere; presumably it expands its first argument once per
//  two-digit hexadecimal id from 00 to ff, in ascending order - confirm)
#define MULTI_ENTRY_HANDLER_DECLARATIONS(name)                                                     \
    CALL_256_TIMES(MULTI_ENTRY_HANDLER_DECLARATIONS_ID, name)

// Expands to one array initializer element (stub name followed by a comma)
#define MULTI_ENTRY_HANDLER_LIST_ID(name, id) name##_##id,
// Expands to the comma-terminated list of all entry stubs of the handler `name`
#define MULTI_ENTRY_HANDLER_LIST(name)        CALL_256_TIMES(MULTI_ENTRY_HANDLER_LIST_ID, name)

// Entry stubs of test_case_handler, indexed by vector number; a trailing NULL follows the stubs
MULTI_ENTRY_HANDLER_DECLARATIONS(test_case_handler);
static void *test_case_handlers[] = {
    MULTI_ENTRY_HANDLER_LIST(test_case_handler) NULL,
};

// Entry stubs of bubble_handler, indexed by vector number; a trailing NULL follows the stubs
MULTI_ENTRY_HANDLER_DECLARATIONS(bubble_handler);
static void *bubble_handlers[] = {
    MULTI_ENTRY_HANDLER_LIST(bubble_handler) NULL,
};

// =================================================================================================
// IDT management
// =================================================================================================
/// @brief Store the current IDT register into the descriptor that `dtr` points to
/// @param dtr Pointer to a struct desc_ptr that receives the IDTR contents
inline static void native_sidt(void *dtr)
{
    struct desc_ptr *idtr_out = (struct desc_ptr *)dtr;

    // sidt writes the descriptor to memory; the mfence follows it directly
    asm volatile("sidt %0\n mfence\n" : "=m"(*idtr_out));
}

/// @brief Load the IDT register from the descriptor that `dtr` points to
/// @param dtr Pointer to a struct desc_ptr holding the new IDTR contents
inline static void native_lidt(void *dtr)
{
    struct desc_ptr *idtr_in = (struct desc_ptr *)dtr;

    // lidt reads the descriptor from memory; the mfence follows it directly
    asm volatile("lidt %0\n mfence\n" ::"m"(*idtr_in));
}

/// @brief Write an interrupt gate that points at `handler` into one slot of `idt`.
///        The gate uses the kernel code segment, IST 0 and DPL 0, and is marked present.
/// @param idt The IDT to modify
/// @param interrupt_id Index of the gate within the IDT
/// @param handler Address of the handler entry point
static void set_intr_gate_default(gate_desc *idt, int interrupt_id, void *handler)
{
    const unsigned long entry_addr = (unsigned long)handler;
    const struct idt_bits gate_bits = {
        .ist = 0,
        .zero = 0,
        .type = GATE_INTERRUPT,
        .dpl = 0,
        .p = 1,
    };

    // the handler address is split across three fields of the descriptor
    gate_desc gate = {
        .offset_low = (u16)entry_addr,
        .segment = __KERNEL_CS,
        .bits = gate_bits,
        .offset_middle = (u16)(entry_addr >> 16),
        .offset_high = (u32)(entry_addr >> 32),
        .reserved = 0,
    };

    write_idt_entry(idt, interrupt_id, &gate);
}

/// @brief Fill all 256 gates of `idt` and load it into the IDT register.
///        Per vector, the first matching rule wins:
///          1. NMI                                -> nmi_handler
///          2. vector < 32 selected in handled_faults, and `main_handler` is not NULL
///                                                -> main_handler
///          3. double fault and machine check     -> gate copied from the original IDT
///          4. everything else                    -> secondary_handlers[vector]
/// @param idt The IDT to fill
/// @param idtr Descriptor that is updated to describe `idt` and then loaded
/// @param main_handler Handler for the vectors selected by handled_faults; may be NULL
/// @param secondary_handlers Per-vector handlers, indexed by vector number
static void idt_set_custom_handlers(gate_desc *idt, struct desc_ptr *idtr, void *main_handler,
                                    void **secondary_handlers)
{
    for (int vector = 0; vector < 256; vector++) {
        if (vector == X86_TRAP_NMI) {
            set_intr_gate_default(idt, vector, nmi_handler);
        } else if (main_handler != NULL && vector < 32 && BIT_CHECK(handled_faults, vector)) {
            set_intr_gate_default(idt, vector, main_handler);
        } else if (vector == X86_TRAP_DF || vector == X86_TRAP_MC) {
            // if we ever get a machine check exception, the CPU is definitely in a bad state
            // so we should let OS handle it
            gate_desc *orig_gates = (gate_desc *)orig_idtr.address;
            write_idt_entry(idt, vector, &orig_gates[vector]);
        } else {
            // all other exceptions are dispatched to the secondary handler
            set_intr_gate_default(idt, vector, secondary_handlers[vector]);
        }
    }

    idtr->address = (unsigned long)idt;
    idtr->size = (sizeof(gate_desc) * 256) - 1;
    native_lidt(idtr);
}

/// @brief Install the bubble IDT.
///        Saves the currently loaded IDT register into orig_idtr, fills bubble_idt so that
///        faults are dispatched to the bubble_handler entry stubs (no main handler is used),
///        loads it, and clears is_nested_fault.
void set_outer_fault_handlers(void)
{
    native_sidt(&orig_idtr); // preserve original IDT
    idt_set_custom_handlers(bubble_idt, &bubble_idtr, NULL, bubble_handlers);
    is_nested_fault = 0;
}

/// @brief Reload the IDT register value saved by set_outer_fault_handlers().
///        If no value has been saved (address is 0), only an error is printed.
void unset_outer_fault_handlers(void)
{
    if (orig_idtr.address == 0) {
        PRINT_ERR("unset_outer_fault_handlers: original IDT is not set\n");
        return;
    }

    // restore original IDT
    native_lidt(&orig_idtr);
}

/// @brief Install the test case IDT.
///        Fills test_case_idt so that the vectors selected by handled_faults go to
///        fault_handler and the remaining ones to the test_case_handler entry stubs,
///        loads it, and clears is_nested_fault.
///        NOTE(review): the double fault and machine check gates are copied from orig_idtr,
///        so this presumably has to run after set_outer_fault_handlers() - confirm.
void set_inner_fault_handlers(void)
{
    idt_set_custom_handlers(test_case_idt, &test_case_idtr, fault_handler, test_case_handlers);
    is_nested_fault = 0;
}

/// @brief Switch from the test case IDT back to the bubble IDT.
///        If the bubble IDT descriptor has not been set up (address is 0), only an error
///        is printed.
void unset_inner_fault_handlers(void)
{
    if (bubble_idtr.address == 0) {
        PRINT_ERR("unset_inner_fault_handlers: bubble IDT is not set\n");
        return;
    }

    // restore bubble IDT
    native_lidt(&bubble_idtr);
}

// =================================================================================================
/// @brief Initialize the fault handling state: point fault_handler at test_case_handler and
///        allocate the two 256-entry IDTs (bubble and test case).
/// @return 0 on success
///         NOTE(review): CHECKED_ZALLOC is defined elsewhere; presumably it makes this
///         function return an error code if the allocation fails - confirm.
int init_fault_handler(void)
{
    fault_handler = (void *)test_case_handler;

    bubble_idt = CHECKED_ZALLOC(sizeof(gate_desc) * 256);
    test_case_idt = CHECKED_ZALLOC(sizeof(gate_desc) * 256);
    // only the address is set here; the size field is filled in by idt_set_custom_handlers()
    test_case_idtr.address = (unsigned long)test_case_idt;
    return 0;
}

/// @brief Release the two IDTs allocated by init_fault_handler().
///        The IDT register images (bubble_idtr, test_case_idtr) are left unchanged here.
///        NOTE(review): SAFE_FREE is defined elsewhere; presumably it tolerates NULL and
///        resets the pointer - confirm.
void free_fault_handler(void)
{
    SAFE_FREE(bubble_idt);
    SAFE_FREE(test_case_idt);
}


================================================
FILE: rvzr/executor_km/x86/macros.c
================================================
/// File: x86 implementation of various macros as well as x86-specific code for
///       the macro loader (macro_expansion.c)
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#include "asm_snippets.h"
#include "fault_handler.h"
#include "macro_expansion.h"
#include "main.h"
#include "page_tables_guest.h"
#include "page_tables_host.h"
#include "registers.h"
#include "sandbox_manager.h"
#include "shortcuts.h"
#include "svm.h"
#include "vmx.h"

extern uint64_t is_nested_fault; // defined in fault_handlers.S
void nested_fault_handler(void); // defined in fault_handlers.S

// =================================================================================================
// Convenience shortcuts for writing constants to memory
// =================================================================================================
// All APPEND_* macros expect two names in the enclosing scope:
//   - `dest`:   uint8_t pointer to the start of the output buffer
//   - `cursor`: integer lvalue holding the current write offset; advanced by each macro
//
// Each macro is wrapped in do { ... } while (0) so that it expands to exactly one statement
// and can be used safely as the sole body of an un-braced if/else. Call sites must end
// with a semicolon. Multi-byte values are stored in host (little-endian on x86) byte order.

/// Append a single byte
#define APPEND_U8_TO_DEST(value)                                                                   \
    do {                                                                                           \
        dest[cursor++] = (value);                                                                  \
    } while (0)

/// Append a 16-bit value (unaligned store)
#define APPEND_U16_TO_DEST(value)                                                                  \
    do {                                                                                           \
        *((uint16_t *)(dest + cursor)) = (value);                                                  \
        cursor += 2;                                                                               \
    } while (0)

/// Append a 32-bit value (unaligned store)
#define APPEND_U32_TO_DEST(value)                                                                  \
    do {                                                                                           \
        *((uint32_t *)(dest + cursor)) = (value);                                                  \
        cursor += 4;                                                                               \
    } while (0)

/// Append a 64-bit value (unaligned store)
#define APPEND_U64_TO_DEST(value)                                                                  \
    do {                                                                                           \
        *((uint64_t *)(dest + cursor)) = (value);                                                  \
        cursor += 8;                                                                               \
    } while (0)

/// Append a literal sequence of bytes, given as a comma-separated list of constants
#define APPEND_BYTES_TO_DEST(...)                                                                  \
    do {                                                                                           \
        static const uint8_t bytes[] = {__VA_ARGS__};                                              \
        for (size_t i = 0; i < sizeof(bytes); i++) {                                               \
            dest[cursor++] = bytes[i];                                                             \
        }                                                                                          \
    } while (0)

// =================================================================================================
// Instruction opcodes
// =================================================================================================
/// @brief Emit `movabs <reg>, <imm64>` (REX.W prefix, opcode B8+rd, 8-byte immediate)
/// @param dest Pointer to the destination buffer
/// @param cursor_ In/out: write offset into dest; advanced by the 10 bytes emitted
/// @param reg_id Register number; ids at or above REX_BOUNDARY need the REX.B bit
/// @param value 64-bit immediate to load
static inline void movabs(uint8_t *dest, size_t *cursor_, uint8_t reg_id, uint64_t value)
{
    // the APPEND_* macros operate on a local named `cursor`
    size_t cursor = *cursor_;

    // REX.W (0x48), plus REX.B (-> 0x49) for the extended registers
    const uint8_t rex_prefix = (reg_id < REX_BOUNDARY) ? 0x48 : 0x49;
    // opcode byte: 0xb8 + low three bits of the register number
    const uint8_t opcode = 0xb8 + (reg_id & 0x7);

    APPEND_U8_TO_DEST(rex_prefix);
    APPEND_U8_TO_DEST(opcode);
    APPEND_U64_TO_DEST(value);

    *cursor_ = cursor;
}

// =================================================================================================
// Helper functions
// =================================================================================================

/// @brief Get the address of a function within a section
/// @param section_id ID of the section
/// @param function_id ID of the function
/// @return Virtual address of the function
static uint64_t get_function_addr(uint64_t section_id, uint64_t function_id)
{
    uint64_t section_base = 0;

    if (actors[section_id].mode == MODE_HOST) {
        section_base = (uint64_t)sandbox->code[section_id].section;
    } else if (actors[section_id].mode == MODE_GUEST) {
        guest_memory_t *guest_memory = (guest_memory_t *)GUEST_V_MEMORY_START;
        section_base = (uint64_t)guest_memory->code.section;
    }

    // The code section of the main actor begins after a hardcoded prologue,
    // which we need to take into account when calculating the function address
    if (section_id == 0)
        section_base += get_main_prologue_size();

    return section_base + test_case->symbol_table[function_id].offset;
}

/// @brief Insert a sequence of instructions into dest that updates R14 to match
///        the actor owning section_id
/// @param section_id ID of the section
/// @param dest Pointer to the destination of the code sequence
/// @param cursor Current position in the destination buffer
/// @return Number of bytes written to the destination buffer
static uint64_t update_r14(uint64_t section_id, uint8_t *dest, uint64_t cursor)
{
    uint64_t old_cursor = cursor;

    // calculate the new R14 value
    uint64_t new_r14 = 0;
    if (actors[section_id].mode == MODE_HOST) {
        new_r14 = (uint64_t)sandbox->data[section_id].main_area;
    } else if (actors[section_id].mode == MODE_GUEST) {
        guest_memory_t *guest_memory = (guest_memory_t *)GUEST_V_MEMORY_START;
        new_r14 = (uint64_t)guest_memory->data.main_area;
    }

    // ASM: movabs r14, new_r14
    APPEND_BYTES_TO_DEST(0x49, 0xbe);
    APPEND_U64_TO_DEST(new_r14);
    return cursor - old_cursor;
}

/// @brief Insert a sequence of instructions into dest that updates R14 and RSP to match
///        the actor owning section_id
/// @param section_id ID of the section
/// @param dest Pointer to the destination of the code sequence
/// @param cursor Current position in the destination buffer
/// @return Number of bytes written to the destination buffer
static uint64_t update_mem_base_and_sp(uint64_t section_id, uint8_t *dest, uint64_t cursor)
{
    uint64_t old_cursor = cursor;
    cursor += update_r14(section_id, dest, cursor);

    // calculate the new RSP value
    uint64_t new_rsp = 0;
    if (actors[section_id].mode == MODE_HOST) {
        new_rsp = (uint64_t)sandbox->data[section_id].main_area + LOCAL_RSP_OFFSET;
    } else if (actors[section_id].mode == MODE_GUEST) {
        guest_memory_t *guest_memory = (guest_memory_t *)GUEST_V_MEMORY_START;
        new_rsp = (uint64_t)guest_memory->data.main_area + LOCAL_RSP_OFFSET;
    }

    // ASM: movabs rsp, new_rsp
    APPEND_BYTES_TO_DEST(0x48, 0xbc);
    APPEND_U64_TO_DEST(new_rsp);
    return cursor - old_cursor;
}

/// @brief Insert a sequence of instructions into dest that updates R15 to match the actor
///        owning section_id
/// @param section_id ID of the section
/// @param dest Pointer to the destination of the code sequence
/// @param cursor Current position in the destination buffer
/// @return Number of bytes written to the destination buffer
static uint64_t update_r15(uint64_t section_id, uint8_t *dest, uint64_t cursor)
{
    uint64_t old_cursor = cursor;

    // calculate the new R15 value
    uint64_t new_r15 = 0;
    if (actors[section_id].mode == MODE_HOST) {
        new_r15 = (uint64_t)sandbox->util;
    } else if (actors[section_id].mode == MODE_GUEST) {
        guest_memory_t *guest_memory = (guest_memory_t *)GUEST_V_MEMORY_START;
        new_r15 = (uint64_t)&guest_memory->util;
    }

    // ASM: movabs r15, new_r15
    APPEND_BYTES_TO_DEST(0x49, 0xbf);
    APPEND_U64_TO_DEST(new_r15);
    return cursor - old_cursor;
}

// =================================================================================================
// Macro implementations
//
// Note: A macro consists of two parts: it starts with the dynamically-generated part,
// and the main body is static.
// The dynamic part is generated by the start_macro* functions, and the generated code
// can be configured according to the macro arguments.
// The body_macro* functions are not configurable, and are copied directly into the test case
// macro memory.
// =================================================================================================

// MEASUREMENT_START and MEASUREMENT_END -----------------------------------------------------------
// Prime+Probe variants
/// @brief Static body of the PRIME measurement-start macro (also used for TYPE_EVICT in
///        macro_descriptors). The asm is bracketed by MACRO_START / MACRO_END .quad markers.
///        Loads r15 + L1D_PRIMING_OFFSET into rax, runs PRIME over it (last argument "32";
///        presumably a repetition count -- confirm against the PRIME definition), then
///        starts the performance counters, marks the measurement as started and fences.
static void __attribute__((noipa)) body_macro_prime(void)
{
    asm volatile(".quad " xstr(MACRO_START));
    asm_volatile_intel(""                                                //
                       MACRO_PROLOGUE()                                  //
                       "lea rax, [r15 + " xstr(L1D_PRIMING_OFFSET) "]\n" //
                       PRIME("rax", "rbx", "rcx", "rdx", "32")           //
                       READ_PFC_START()                                  //
                       SET_SR_STARTED()                                  //
                       MACRO_EPILOGUE()                                  //
                       "lfence\n"                                        //
    );
    asm volatile(".quad " xstr(MACRO_END));
}

/// @brief Static body of the FAST_PRIME macro. Identical to body_macro_prime except that
///        PRIME is invoked with "1" instead of "32" as its last argument.
static void __attribute__((noipa)) body_macro_fast_prime(void)
{
    asm volatile(".quad " xstr(MACRO_START));
    asm_volatile_intel(""                                                //
                       MACRO_PROLOGUE()                                  //
                       "lea rax, [r15 + " xstr(L1D_PRIMING_OFFSET) "]\n" //
                       PRIME("rax", "rbx", "rcx", "rdx", "1")            //
                       READ_PFC_START()                                  //
                       SET_SR_STARTED()                                  //
                       MACRO_EPILOGUE()                                  //
                       "lfence\n"                                        //
    );
    asm volatile(".quad " xstr(MACRO_END));
}

/// @brief Static body of the PARTIAL_PRIME macro. Same structure as body_macro_prime, but
///        uses PRIME_PARTIAL (last argument "32") instead of PRIME.
static void __attribute__((noipa)) body_macro_partial_prime(void)
{
    asm volatile(".quad " xstr(MACRO_START));
    asm_volatile_intel(""                                                //
                       MACRO_PROLOGUE()                                  //
                       "lea rax, [r15 + " xstr(L1D_PRIMING_OFFSET) "]\n" //
                       PRIME_PARTIAL("rax", "rbx", "rcx", "rdx", "32")   //
                       READ_PFC_START()                                  //
                       SET_SR_STARTED()                                  //
                       MACRO_EPILOGUE()                                  //
                       "lfence\n"                                        //
    );
    asm volatile(".quad " xstr(MACRO_END));
}

/// @brief Static body of the FAST_PARTIAL_PRIME macro. Identical to
///        body_macro_partial_prime except that PRIME_PARTIAL is invoked with "1"
///        instead of "32" as its last argument.
static void __attribute__((noipa)) body_macro_fast_partial_prime(void)
{
    asm volatile(".quad " xstr(MACRO_START));
    asm_volatile_intel(""                                                //
                       MACRO_PROLOGUE()                                  //
                       "lea rax, [r15 + " xstr(L1D_PRIMING_OFFSET) "]\n" //
                       PRIME_PARTIAL("rax", "rbx", "rcx", "rdx", "1")    //
                       READ_PFC_START()                                  //
                       SET_SR_STARTED()                                  //
                       MACRO_EPILOGUE()                                  //
                       "lfence\n"                                        //
    );
    asm volatile(".quad " xstr(MACRO_END));
}

/// @brief Static body of the PROBE measurement-end macro. The whole body is skipped (jump
///        to local label 99) unless STATUS_REGISTER_8 equals STATUS_STARTED. Otherwise it
///        preserves r15 on the stack, fences, stops the performance counters, runs PROBE
///        over r15 + L1D_PRIMING_OFFSET with HTRACE_REGISTER as its last operand, restores
///        r15, overwrites the stack slot that held the saved r15 with zero, and marks the
///        measurement as ended.
static void __attribute__((noipa)) body_macro_probe(void)
{
    asm volatile(".quad " xstr(MACRO_START));
    // clang-format off
    asm_volatile_intel(""
                       "cmp " STATUS_REGISTER_8 ", "xstr(STATUS_STARTED)"\n"
                       "jne 99f\n"
                       MACRO_PROLOGUE()
                       "push r15\n"
                       "lfence\n"
                       READ_PFC_END()
                       "lea r15, [r15 + " xstr(L1D_PRIMING_OFFSET) "]\n"
                       PROBE("r15", "rbx", "r11", HTRACE_REGISTER)
                       "pop r15\n"
                       "mov qword ptr [rsp - 8], 0 \n"
                       SET_SR_ENDED()
                       MACRO_EPILOGUE()
                       "99:\n"
    );
    // clang-format on
    asm volatile(".quad " xstr(MACRO_END));
}

// Flush + Reload and variants
/// @brief Static body of the FLUSH measurement-start macro. Copies the address held in r14
///        into rbx, runs FLUSH over it (rax is passed as the second operand), then starts
///        the performance counters, marks the measurement as started and fences.
static void __attribute__((noipa)) body_macro_flush(void)
{
    asm volatile(".quad " xstr(MACRO_START));
    asm_volatile_intel(""                  //
                       MACRO_PROLOGUE()    //
                       "lea rbx, [r14]\n"  //
                       FLUSH("rbx", "rax") //
                       READ_PFC_START()    //
                       SET_SR_STARTED()    //
                       MACRO_EPILOGUE()    //
                       "lfence\n"          //
    );
    asm volatile(".quad " xstr(MACRO_END));
}

/// @brief Static body of the RELOAD measurement-end macro. The whole body is skipped (jump
///        to local label 98) unless STATUS_REGISTER_8 equals STATUS_STARTED. Otherwise it
///        fences, stops the performance counters, runs RELOAD starting at r14 with
///        HTRACE_REGISTER as its last operand, additionally sets bit 63 of HTRACE_REGISTER
///        (rax = 1 << 63, then OR), and marks the measurement as ended.
static void __attribute__((noipa)) body_macro_reload(void)
{
    asm volatile(".quad " xstr(MACRO_START));
    // clang-format off
    asm_volatile_intel(""
                       "cmp " STATUS_REGISTER_8 ", "xstr(STATUS_STARTED)"\n"
                       "jne 98f\n"
                       MACRO_PROLOGUE()
                       "lfence\n"
                       READ_PFC_END()
                       RELOAD("r14", "rbx", "r11", HTRACE_REGISTER)
                       "mov rax, 1\n"
                       "shl rax, 63\n"
                       "or " HTRACE_REGISTER ", rax\n"
                       SET_SR_ENDED()
                       MACRO_EPILOGUE()
                       "98:\n"
    );
    // clang-format on
    asm volatile(".quad " xstr(MACRO_END));
}

// Time stamp counter
/// @brief Static body of the TSC_START measurement-start macro. Reads the time stamp
///        counter between fences, combines EDX:EAX into a 64-bit value in rdx, and stores
///        its negation in HTRACE_REGISTER (zero the register, then subtract), so that
///        adding the end timestamp later yields the elapsed cycle count. Then starts the
///        performance counters, marks the measurement as started and fences.
static void __attribute__((noipa)) body_macro_tsc_start(void)
{
    asm volatile(".quad " xstr(MACRO_START));
    asm_volatile_intel(""                                               //
                       MACRO_PROLOGUE()                                 //
                       "lfence; rdtsc; lfence\n"                        //
                       "shl rdx, 32\n"                                  //
                       "or rdx, rax\n"                                  //
                       "xor " HTRACE_REGISTER ", " HTRACE_REGISTER "\n" //
                       "sub " HTRACE_REGISTER ", rdx\n"                 //
                       "lfence\n"                                       //
                       READ_PFC_START()                                 //
                       SET_SR_STARTED()                                 //
                       MACRO_EPILOGUE()                                 //
                       "lfence\n"                                       //
    );
    asm volatile(".quad " xstr(MACRO_END));
}

/// @brief Static body of the TSC_END measurement-end macro. The whole body is skipped (jump
///        to local label 97) unless STATUS_REGISTER_8 equals STATUS_STARTED. Otherwise it
///        stops the performance counters, reads the time stamp counter between fences,
///        combines EDX:EAX into rdx and adds it to HTRACE_REGISTER (which body_macro_tsc_start
///        set to the negated start timestamp), then marks the measurement as ended.
static void __attribute__((noipa)) body_macro_tsc_end(void)
{
    asm volatile(".quad " xstr(MACRO_START));
    // clang-format off
    asm_volatile_intel(""
                       "cmp " STATUS_REGISTER_8 ", "xstr(STATUS_STARTED)"\n"
                       "jne 97f\n"
                       MACRO_PROLOGUE()
                       READ_PFC_END()
                       "lfence; rdtsc; lfence\n"
                       "shl rdx, 32\n"
                       "or rdx, rax\n"
                       "add " HTRACE_REGISTER ", rdx\n"
                       SET_SR_ENDED()
                       MACRO_EPILOGUE()
                       "97:\n"
    );
    // clang-format on
    asm volatile(".quad " xstr(MACRO_END));
}

// FAULT_HANDLER -------------------------------------------------------------------------------
/// @brief Generate the dynamic part of the FAULT_HANDLER macro at dest and redirect the
///        global fault_handler pointer to it. The generated code restores R14/RSP/R15 for
///        actor 0 and then checks is_nested_fault: if the flag is already non-zero it jumps
///        to nested_fault_handler, otherwise it increments the flag and falls through.
/// @param args Macro arguments; args.owner must be 0 (asserted)
/// @param dest Destination buffer for the generated code
/// @return Number of bytes written to dest
static inline size_t start_macro_fault_handler(macro_args_t args, uint8_t *dest)
{
    size_t cursor = 0;
    ASSERT(args.owner == 0, "inject_macro_configurable_part");

    // Set new global address to the fault handler
    // (cursor is still 0 here, so this is the first byte of the generated code)
    fault_handler = (char *)((uint64_t)dest + cursor);

    // Ensure that RSP, R14, and R15 are set to correct values after (potential) actor switch
    cursor += update_mem_base_and_sp(0, dest, cursor);
    cursor += update_r15(0, dest, cursor);

    // Check for nested faults; if so, jump to `nested_fault_handler`
    // NOTE: the hand-encoded instructions below address r11 directly (REX.B + rm=011),
    // so they assume TMP_REG_ID denotes r11
    uint64_t is_nested_fault_addr = (uint64_t)&is_nested_fault;
    uint64_t test_case_handler_addr = (uint64_t)nested_fault_handler;
    //   ASM: movabs TMP_REG, is_nested_fault_addr
    movabs(dest, &cursor, TMP_REG_ID, is_nested_fault_addr);
    //   ASM: cmp byte ptr [TMP_REG], 0
    APPEND_BYTES_TO_DEST(0x41, 0x80, 0x3b, 0x00);
    //   ASM: je no_nested_fault
    //   (displacement 0x10 skips lfence (3) + movabs (10) + jmp (3) = 16 bytes)
    APPEND_BYTES_TO_DEST(0x74, 0x10);
    //   ASM: lfence
    APPEND_BYTES_TO_DEST(0x0f, 0xae, 0xe8);
    //   ASM: movabs TMP_REG, test_case_handler_addr
    movabs(dest, &cursor, TMP_REG_ID, test_case_handler_addr);
    //   ASM: jmp TMP_REG
    APPEND_BYTES_TO_DEST(0x41, 0xff, 0xe3);
    //   ASM: no_nested_fault:
    //   ASM: incb byte ptr [TMP_REG]
    //   (on this path TMP_REG still holds is_nested_fault_addr)
    APPEND_BYTES_TO_DEST(0x41, 0xfe, 0x03);
    return cursor;
}

// FAULT_HANDLER_WITH_MEASUREMENT ------------------------------------------------------------------
/// @brief Generate the dynamic part shared by the FAULT_AND_* macros: reload R14 and R15
///        for the actor given in args.arg1 before the static measurement body runs
/// @param args Macro arguments; arg1 selects the actor
/// @param dest Destination buffer for the generated code
/// @return Number of bytes written to dest
static inline size_t start_macro_fault_handler_with_measurement(macro_args_t args, uint8_t *dest)
{
    size_t n_emitted = update_r14(args.arg1, dest, 0);
    n_emitted += update_r15(args.arg1, dest, n_emitted);
    return n_emitted;
}

// MACRO_SWITCH ------------------------------------------------------------------------------------
/// @brief Generate the SWITCH macro: re-point R14 and RSP at the target actor's memory and
///        jump to the target function with a near relative jump
/// @param args Macro arguments; arg1 is the target actor/section, arg2 the target function
/// @param dest Destination buffer for the generated code
/// @return Number of bytes written to dest
static inline size_t start_macro_switch(macro_args_t args, uint8_t *dest)
{
    // Update RSP and R14 to the addresses within the new actor's memory
    size_t cursor = update_mem_base_and_sp(args.arg1, dest, 0);

    // rel32 is measured from the end of the 5-byte jmp instruction (opcode + 4-byte offset)
    const uint64_t target_addr = get_function_addr(args.arg1, args.arg2);
    const uint64_t next_insn_addr = (uint64_t)dest + cursor + 5;
    const uint32_t rel32 = target_addr - next_insn_addr;

    // ASM: jmp rel32
    APPEND_U8_TO_DEST(0xe9);
    APPEND_U32_TO_DEST(rel32);
    return cursor;
}

// MACRO_SET_K2U_TARGET ----------------------------------------------------------------------------
/// @brief Generate the SET_K2U_TARGET macro: load the address of the target function
///        into r11
/// @param args Macro arguments; arg1 is the target section, arg2 the target function
/// @param dest Destination buffer for the generated code
/// @return Number of bytes written to dest
static inline size_t start_macro_set_k2u_target(macro_args_t args, uint8_t *dest)
{
    const uint64_t target_addr = get_function_addr(args.arg1, args.arg2);
    size_t cursor = 0;

    // ASM: movabs r11, target_addr
    APPEND_U8_TO_DEST(0x49);
    APPEND_U8_TO_DEST(0xbb);
    APPEND_U64_TO_DEST(target_addr);

    return cursor;
}

// MACRO_SWITCH_K2U --------------------------------------------------------------------------------
/// @brief Dynamic part of SWITCH_K2U: intentionally emits nothing (returns 0 bytes written);
///        all work is done by the static body_macro_switch_k2u
static inline size_t start_macro_switch_k2u(macro_args_t /*args*/, uint8_t * /*dest*/) { return 0; }

/// @brief Static body of SWITCH_K2U: return to user mode via sysretq.
///        Expects the target address in r11 (loaded by SET_K2U_TARGET). Moves it to rcx,
///        which sysretq uses as the new RIP. Saves rsp in the slot at
///        [r14 - MACRO_STACK_TOP_OFFSET - 8] and temporarily switches rsp to that slot so
///        that pushfq / pop r11 can copy the current RFLAGS into r11 (which sysretq loads
///        into RFLAGS); the final pop rsp restores the saved stack pointer.
static void __attribute__((noipa)) body_macro_switch_k2u(void)
{
    asm volatile(".quad " xstr(MACRO_START));
    // clang-format off
    asm_volatile_intel(""
                       "mov rcx, r11\n"
                       "mov qword ptr [r14 - " xstr(MACRO_STACK_TOP_OFFSET) " - 8], rsp\n"
                       "lea rsp, [r14 - " xstr(MACRO_STACK_TOP_OFFSET) " - 8]\n"
                       "pushfq\n"
                       "pop r11\n"
                       "pop rsp\n"
                       "sysretq\n");
    // clang-format on
    asm volatile(".quad " xstr(MACRO_END));
}

// MACRO_SET_U2K_TARGET ----------------------------------------------------------------------------
/// @brief Generate the SET_U2K_TARGET macro: write the address of the target function into
///        MSR 0xc0000082 (IA32_LSTAR, the 64-bit SYSCALL entry point) so that a later
///        `syscall` lands on it. The generated code runs on the macro stack, preserves
///        rax/rcx/rdx/rflags around the wrmsr, and zeroes every stack slot it used.
/// @param args Macro arguments; arg1 is the target section, arg2 the target function
/// @param dest Destination buffer for the generated code
/// @return Number of bytes written to dest
static inline size_t start_macro_set_u2k_target(macro_args_t args, uint8_t *dest)
{
    size_t cursor = 0;
    uint64_t function_addr = get_function_addr(args.arg1, args.arg2);
    // negative displacement, stored as its 32-bit two's complement for the disp32 field
    uint32_t macro_stack_offset = -MACRO_STACK_TOP_OFFSET - 8;

    // Switch to the macro stack; the old rsp is saved in the slot rsp now points at
    // ASM: mov [r14 - MACRO_STACK_TOP_OFFSET - 8],rsp
    APPEND_BYTES_TO_DEST(0x49, 0x89, 0xa6);
    APPEND_U32_TO_DEST(macro_stack_offset);
    // ASM: lea rsp,[r14 - MACRO_STACK_TOP_OFFSET - 8]
    APPEND_BYTES_TO_DEST(0x49, 0x8d, 0xa6);
    APPEND_U32_TO_DEST(macro_stack_offset);
    // Save the registers clobbered by the wrmsr sequence
    // ASM: push rax
    APPEND_U8_TO_DEST(0x50);
    // ASM: push rcx
    APPEND_U8_TO_DEST(0x51);
    // ASM: push rdx
    APPEND_U8_TO_DEST(0x52);
    // ASM: pushf
    APPEND_U8_TO_DEST(0x9c);
    // wrmsr takes the MSR index in ecx and the value in edx:eax
    // ASM: movabs rax, function_addr
    APPEND_BYTES_TO_DEST(0x48, 0xb8);
    APPEND_U64_TO_DEST(function_addr);
    // ASM: mov rdx, rax
    APPEND_BYTES_TO_DEST(0x48, 0x89, 0xc2);
    // ASM: shr rdx, 0x20
    APPEND_BYTES_TO_DEST(0x48, 0xc1, 0xea, 0x20);
    // ASM: movabs rcx, 0xc0000082
    APPEND_BYTES_TO_DEST(0x48, 0xb9);
    APPEND_U64_TO_DEST(0xc0000082);
    // ASM: wrmsr
    APPEND_BYTES_TO_DEST(0x0f, 0x30);
    // Restore the saved state; after each pop, the slot just below rsp (the one that was
    // popped) is overwritten with zero
    // ASM: popf
    APPEND_U8_TO_DEST(0x9d);
    // ASM: mov qword ptr [rsp - 0x08], 0
    APPEND_BYTES_TO_DEST(0x48, 0xc7, 0x44, 0x24, 0xf8, 0x00, 0x00, 0x00, 0x00);
    // ASM: pop    rdx
    APPEND_U8_TO_DEST(0x5a);
    // ASM: mov qword ptr [rsp - 0x08], 0
    APPEND_BYTES_TO_DEST(0x48, 0xc7, 0x44, 0x24, 0xf8, 0x00, 0x00, 0x00, 0x00);
    // ASM: pop    rcx
    APPEND_U8_TO_DEST(0x59);
    // ASM: mov qword ptr [rsp - 0x08], 0
    APPEND_BYTES_TO_DEST(0x48, 0xc7, 0x44, 0x24, 0xf8, 0x00, 0x00, 0x00, 0x00);
    // ASM: pop    rax
    APPEND_U8_TO_DEST(0x58);
    // ASM: mov qword ptr [rsp - 0x08], 0
    APPEND_BYTES_TO_DEST(0x48, 0xc7, 0x44, 0x24, 0xf8, 0x00, 0x00, 0x00, 0x00);
    // Switch back to the original stack (pops the rsp value saved at the start)
    // ASM: pop    rsp
    APPEND_U8_TO_DEST(0x5c);

    return cursor;
}

// MACRO_SWITCH_U2K --------------------------------------------------------------------------------
/// @brief Static body of SWITCH_U2K: a single `syscall` instruction between the
///        MACRO_START / MACRO_END markers. The landing address is whatever SET_U2K_TARGET
///        previously wrote into the SYSCALL target MSR.
static void __attribute__((noipa)) body_macro_switch_u2k(void)
{
    asm volatile(".quad " xstr(MACRO_START));
    asm_volatile_intel("syscall\n");
    asm volatile(".quad " xstr(MACRO_END));
}

// MACRO_SET_H2G_TARGET ----------------------------------------------------------------------------
/// @brief Generate the dynamic part of SET_H2G_TARGET, which selects the guest entry point
///        for the actor given in args.arg1.
///        - Intel: make the actor's VMCS current (vmptrld) and leave the target address in
///          r11; the static body_macro_set_h2g_target then writes it to the VMCS.
///        - AMD: write the target address directly into the RIP field of the actor's VMCB
///          as two 32-bit stores.
///        Nothing is emitted for other vendors.
/// @param args Macro arguments; arg1 is the target actor/section, arg2 the target function
/// @param dest Destination buffer for the generated code
/// @return Number of bytes written to dest
static inline size_t start_macro_set_h2g_target(macro_args_t args, uint8_t *dest)
{
    size_t cursor = 0;

    if (cpuinfo->x86_vendor == X86_VENDOR_INTEL) {
        uint64_t function_addr = get_function_addr(args.arg1, args.arg2);
        uint64_t vmcs_hpa_addr = (uint64_t)&vmcs_hpas[args.arg1];

        // ASM: movabs r11, &vmcs_hpa
        APPEND_BYTES_TO_DEST(0x49, 0xbb);
        APPEND_U64_TO_DEST(vmcs_hpa_addr);
        // ASM: vmptrld [r11]
        APPEND_BYTES_TO_DEST(0x41, 0x0f, 0xc7, 0x33);
        // ASM: movabs r11, function_addr
        APPEND_BYTES_TO_DEST(0x49, 0xbb);
        APPEND_U64_TO_DEST(function_addr);

    } else if (cpuinfo->x86_vendor == X86_VENDOR_AMD) {
        uint64_t function_addr = get_function_addr(args.arg1, args.arg2);
        uint64_t vmcb_hva_addr = (uint64_t)&vmcb_hvas[args.arg1];

        // ASM: movabs r11, &vmcb_hva
        APPEND_BYTES_TO_DEST(0x49, 0xbb);
        APPEND_U64_TO_DEST(vmcb_hva_addr);
        // ASM: mov r11, [r11]
        APPEND_BYTES_TO_DEST(0x4d, 0x8b, 0x1b);
        // ASM: add r11, VMCB_RIP_OFFSET
        APPEND_BYTES_TO_DEST(0x49, 0x81, 0xc3);
        APPEND_U32_TO_DEST(VMCB_RIP_OFFSET);

        // The two stores below use REX.B only (0x41), i.e. a 32-bit operand size.
        // With REX.W (0x49) the same opcode becomes `mov qword ptr [r11], simm32`, which
        // writes 8 bytes per store and makes the second store spill 4 sign-extended bytes
        // past the end of the RIP field.

        // ASM: mov dword ptr [r11], function_addr[0:31]
        APPEND_BYTES_TO_DEST(0x41, 0xc7, 0x03);
        APPEND_U32_TO_DEST(function_addr & 0xFFFFFFFF);
        // ASM: add r11, 4
        APPEND_BYTES_TO_DEST(0x49, 0x83, 0xc3, 0x04);
        // ASM: mov dword ptr [r11], function_addr[32:63]
        APPEND_BYTES_TO_DEST(0x41, 0xc7, 0x03);
        APPEND_U32_TO_DEST((function_addr >> 32) & 0xFFFFFFFF);
    }

    return cursor;
}

/// @brief Static body of SET_H2G_TARGET. On Intel builds (VENDOR_ID == 1) it writes r11,
///        which the dynamic part loaded with the target address, into VMCS field 0x681e
///        (GUEST_RIP). On other builds the body is empty because the dynamic part already
///        wrote the target into the VMCB.
///        NOTE(review): the literal 1 is presumably the same value as VENDOR_INTEL_, which
///        body_macro_set_g2h_target uses for the equivalent check -- confirm.
static void __attribute__((noipa)) body_macro_set_h2g_target(void)
{
    asm volatile(".quad " xstr(MACRO_START));
#if VENDOR_ID == 1
    asm_volatile_intel(""                      // r11 contains the target address
                       MACRO_PROLOGUE()        //
                       "mov rcx, 0x0000681e\n" // GUEST_RIP
                       "vmwrite rcx, r11 \n"   //
                       MACRO_EPILOGUE()        //
    );
#else
    // Nothing on AMD
#endif
    asm volatile(".quad " xstr(MACRO_END));
}

// MACRO_SWITCH_H2G --------------------------------------------------------------------------------
/// @brief Generate the dynamic part of SWITCH_H2G. Only AMD needs one: it loads rax with
///        the address of the vmcb_hpas entry of the actor in args.arg1, which the static
///        body dereferences before vmrun. Nothing is emitted for any other vendor.
/// @param args Macro arguments; arg1 is the target actor
/// @param dest Destination buffer for the generated code
/// @return Number of bytes written to dest
static inline size_t start_macro_switch_h2g(macro_args_t args, uint8_t *dest)
{
    size_t cursor = 0;

    // Intel (and anything else): no dynamic part
    if (cpuinfo->x86_vendor != X86_VENDOR_AMD) {
        return cursor;
    }

    // ASM: movabs rax, &vmcb_hpa
    APPEND_U8_TO_DEST(0x48);
    APPEND_U8_TO_DEST(0xb8);
    APPEND_U64_TO_DEST((uint64_t)&vmcb_hpas[args.arg1]);
    return cursor;
}

/// @brief Static body of SWITCH_H2G: enter the guest.
///        - Intel builds (VENDOR_ID == 1): a single `vmresume`.
///        - Other builds (AMD): rax holds a pointer to the VMCB address (set by the dynamic
///          part). Disables global interrupts, loads the VMCB address, saves host state
///          into it (vmsave), runs the guest (vmrun), reloads the saved state once the
///          guest exits (vmload), zeroes rax and re-enables global interrupts.
static void __attribute__((noipa)) body_macro_switch_h2g(void)
{
    asm volatile(".quad " xstr(MACRO_START));
#if VENDOR_ID == 1
    asm_volatile_intel("vmresume\n");
#else
    asm_volatile_intel("" // rax contains the current VMCB pointer
                       "clgi\n"
                       "mov rax, qword ptr [rax]\n" //
                       "vmsave rax\n"               //
                       "vmrun rax\n"                //
                       "vmload rax\n"
                       "mov rax, 0\n" //
                       "stgi\n"       //
                       "");
#endif
    asm volatile(".quad " xstr(MACRO_END));
}

// MACRO_SET_G2H_TARGET ----------------------------------------------------------------------------
/// @brief Generate the dynamic part of SET_G2H_TARGET. On Intel it loads r11 with the
///        address of the target function for the static body to consume; nothing is
///        emitted for any other vendor.
/// @param args Macro arguments; arg1 is the target section, arg2 the target function
/// @param dest Destination buffer for the generated code
/// @return Number of bytes written to dest
static inline size_t start_macro_set_g2h_target(macro_args_t args, uint8_t *dest)
{
    size_t cursor = 0;

    // Nothing for AMD
    if (cpuinfo->x86_vendor != X86_VENDOR_INTEL) {
        return cursor;
    }

    // ASM: movabs r11, target_addr
    const uint64_t target_addr = get_function_addr(args.arg1, args.arg2);
    APPEND_U8_TO_DEST(0x49);
    APPEND_U8_TO_DEST(0xbb);
    APPEND_U64_TO_DEST(target_addr);
    return cursor;
}

/// @brief Static body of SET_G2H_TARGET. On Intel builds it writes r11, which the dynamic
///        part loaded with the target address, into VMCS field 0x6c16 (HOST_RIP). On other
///        builds the body is empty.
static void __attribute__((noipa)) body_macro_set_g2h_target(void)
{
    asm volatile(".quad " xstr(MACRO_START));
#if VENDOR_ID == VENDOR_INTEL_
    asm_volatile_intel(""                      // r11 contains the target address
                       MACRO_PROLOGUE()        //
                       "mov rcx, 0x00006c16\n" // HOST_RIP
                       "vmwrite rcx, r11 \n"   //
                       MACRO_EPILOGUE()        //
    );
#else
    // Nothing on AMD
#endif
    asm volatile(".quad " xstr(MACRO_END));
}

// MACRO_SWITCH_G2H --------------------------------------------------------------------------------
/// @brief Static body of SWITCH_G2H: exit from the guest to the host with the vendor's
///        hypercall instruction -- `vmcall` on Intel builds (VENDOR_ID == 1), `vmmcall`
///        otherwise.
static void __attribute__((noipa)) body_macro_switch_g2h(void)
{
    asm volatile(".quad " xstr(MACRO_START));
#if VENDOR_ID == 1
    asm_volatile_intel("vmcall\n");
#else
    asm_volatile_intel("vmmcall\n");
#endif
    asm volatile(".quad " xstr(MACRO_END));
}

// MACRO_LANDING_K2U -------------------------------------------------------------------------------
/// @brief Generate the LANDING_K2U macro: re-point R14 and RSP at the memory of the actor
///        that owns the macro and clear rcx
/// @param args Macro arguments; owner is the actor the landing pad belongs to
/// @param dest Destination buffer for the generated code
/// @return Number of bytes written to dest
static inline size_t start_macro_landing_k2u(macro_args_t args, uint8_t *dest)
{
    size_t cursor = update_mem_base_and_sp(args.owner, dest, 0);

    // rcx was corrupted during context switch; set to zero
    // ASM: movabs rcx, 0
    APPEND_U8_TO_DEST(0x48);
    APPEND_U8_TO_DEST(0xb9);
    APPEND_U64_TO_DEST(0);
    return cursor;
}

// MACRO_LANDING_U2K -------------------------------------------------------------------------------
/// @brief Generate the LANDING_U2K macro: re-point R14 at the memory of the actor that
///        owns the macro and clear rcx. RSP is not touched here.
/// @param args Macro arguments; owner is the actor the landing pad belongs to
/// @param dest Destination buffer for the generated code
/// @return Number of bytes written to dest
static inline size_t start_macro_landing_u2k(macro_args_t args, uint8_t *dest)
{
    // rsp is automatically restored by syscall instruction, so only R14 needs an update
    size_t cursor = update_r14(args.owner, dest, 0);

    // rcx was corrupted during context switch; set to zero
    // ASM: movabs rcx, 0
    APPEND_U8_TO_DEST(0x48);
    APPEND_U8_TO_DEST(0xb9);
    APPEND_U64_TO_DEST(0);

    return cursor;
}

// MACRO_LANDING_H2G -------------------------------------------------------------------------------
/// @brief Generate the LANDING_H2G macro: re-point R14 and R15 at the memory of the actor
///        that owns the macro; on AMD additionally clear rax
/// @param args Macro arguments; owner is the actor the landing pad belongs to
/// @param dest Destination buffer for the generated code
/// @return Number of bytes written to dest
static inline size_t start_macro_landing_h2g(macro_args_t args, uint8_t *dest)
{
    size_t cursor = update_r14(args.owner, dest, 0);
    cursor += update_r15(args.owner, dest, cursor);

    // only AMD needs the extra instruction
    if (cpuinfo->x86_vendor != X86_VENDOR_AMD) {
        return cursor;
    }

    // ASM: mov rax, 0
    APPEND_BYTES_TO_DEST(0x48, 0xc7, 0xc0);
    APPEND_U32_TO_DEST(0);
    return cursor;
}

// MACRO_LANDING_G2H -------------------------------------------------------------------------------
/// @brief Generate the LANDING_G2H macro: re-point R14 and R15 at the memory of the actor
///        that owns the macro; on AMD additionally clear rax
/// @param args Macro arguments; owner is the actor the landing pad belongs to
/// @param dest Destination buffer for the generated code
/// @return Number of bytes written to dest
static inline size_t start_macro_landing_g2h(macro_args_t args, uint8_t *dest)
{
    size_t cursor = update_r14(args.owner, dest, 0);
    cursor += update_r15(args.owner, dest, cursor);

    // only AMD needs the extra instruction
    if (cpuinfo->x86_vendor != X86_VENDOR_AMD) {
        return cursor;
    }

    // ASM: mov rax, 0
    APPEND_BYTES_TO_DEST(0x48, 0xc7, 0xc0);
    APPEND_U32_TO_DEST(0);

    return cursor;
}

// MACRO_SET_DATA_PERMISSIONS ----------------------------------------------------------------------
/// @brief Generate the SET_DATA_PERMISSIONS macro: modify the low 16 bits of the page table
///        entry of an actor's faulty data page by OR-ing in one mask and then AND-ing with
///        another. The generated code runs on the macro stack and preserves rax.
/// @param args Macro arguments; arg1 is the actor ID, arg2 the 16-bit mask to OR into the
///             PTE, arg3 the 16-bit mask to AND with the PTE (zero bits get cleared)
/// @param dest Destination buffer for the generated code
/// @return Number of bytes written to dest
static inline size_t start_macro_set_data_permissions(macro_args_t args, uint8_t *dest)
{
    size_t cursor = 0;
    // get safe bits to set/clear
    uint16_t mask_set = args.arg2;
    uint16_t mask_clear = args.arg3;

    // get the target PTE
    uint64_t actor_id = args.arg1;
    uint64_t page_id = (actor_id * N_DATA_PAGES_PER_ACTOR) + FAULTY_PAGE_ID;
    pte_t_ *ptep = sandbox_pteps->data_pteps[page_id];
    ASSERT(ptep != NULL, "start_macro_set_data_permissions");

    // negative displacement, stored as its 32-bit two's complement for the disp32 field
    uint32_t macro_stack_offset = -MACRO_STACK_TOP_OFFSET - 8;

    // Switch stack
    // ASM: mov [r14 - MACRO_STACK_TOP_OFFSET - 8],rsp
    APPEND_BYTES_TO_DEST(0x49, 0x89, 0xa6);
    APPEND_U32_TO_DEST(macro_stack_offset);
    // ASM: lea rsp,[r14 - MACRO_STACK_TOP_OFFSET - 8]
    APPEND_BYTES_TO_DEST(0x49, 0x8d, 0xa6);
    APPEND_U32_TO_DEST(macro_stack_offset);
    // ASM: push rax
    APPEND_U8_TO_DEST(0x50);

    // Get pointer to PTE
    // ASM: movabs rax, ptep
    APPEND_BYTES_TO_DEST(0x48, 0xb8);
    APPEND_U64_TO_DEST((uint64_t)ptep);

    // Apply the set and clear masks to the lowest 16 bits of the PTE
    // note that the remaining bits stay unchanged because both instructions use a 16-bit
    // operand size (0x66 prefix) with 16-bit immediates
    //   ASM: or word ptr [rax], mask_set
    APPEND_BYTES_TO_DEST(0x66, 0x81, 0x08);
    APPEND_U16_TO_DEST(mask_set);
    //   ASM: and word ptr [rax], mask_clear
    APPEND_BYTES_TO_DEST(0x66, 0x81, 0x20);
    APPEND_U16_TO_DEST(mask_clear);

    // Restore stack
    // ASM: pop rax
    APPEND_U8_TO_DEST(0x58);
    // ASM: mov qword ptr [rsp - 0x08], 0
    // (zero the slot that held the saved rax)
    APPEND_BYTES_TO_DEST(0x48, 0xc7, 0x44, 0x24, 0xf8, 0x00, 0x00, 0x00, 0x00);
    // ASM: pop rsp
    APPEND_U8_TO_DEST(0x5c);
    return cursor;
}

// =================================================================================================
// Macro descriptors
// =================================================================================================
// Table of macro implementations, indexed by macro type.
//   .start: generator for the dynamic (argument-dependent) part, or NULL if there is none
//   .body:  function containing the static part, or NULL if there is none
// Notes:
//   - TYPE_EVICT shares its body with TYPE_PRIME (body_macro_prime)
//   - the TYPE_FAULT_AND_* entries combine start_macro_fault_handler_with_measurement with
//     the body of the corresponding measurement-end macro
macro_descr_t macro_descriptors[] = {
    [TYPE_UNDEFINED] = {.start = NULL, .body = NULL},
    [TYPE_PRIME] = {.start = NULL, .body = body_macro_prime},
    [TYPE_FAST_PRIME] = {.start = NULL, .body = body_macro_fast_prime},
    [TYPE_PARTIAL_PRIME] = {.start = NULL, .body = body_macro_partial_prime},
    [TYPE_FAST_PARTIAL_PRIME] = {.start = NULL, .body = body_macro_fast_partial_prime},
    [TYPE_PROBE] = {.start = NULL, .body = body_macro_probe},
    [TYPE_FLUSH] = {.start = NULL, .body = body_macro_flush},
    [TYPE_EVICT] = {.start = NULL, .body = body_macro_prime},
    [TYPE_RELOAD] = {.start = NULL, .body = body_macro_reload},
    [TYPE_TSC_START] = {.start = NULL, .body = body_macro_tsc_start},
    [TYPE_TSC_END] = {.start = NULL, .body = body_macro_tsc_end},
    [TYPE_FAULT_HANDLER] = {.start = start_macro_fault_handler, .body = NULL},
    [TYPE_FAULT_AND_PROBE] = {.start = start_macro_fault_handler_with_measurement,
                              .body = body_macro_probe},
    [TYPE_FAULT_AND_RELOAD] = {.start = start_macro_fault_handler_with_measurement,
                               .body = body_macro_reload},
    [TYPE_FAULT_AND_TSC_END] = {.start = start_macro_fault_handler_with_measurement,
                                .body = body_macro_tsc_end},
    [TYPE_SWITCH] = {.start = start_macro_switch, .body = NULL},
    [TYPE_SET_K2U_TARGET] = {.start = start_macro_set_k2u_target, .body = NULL},
    [TYPE_SWITCH_K2U] = {.start = start_macro_switch_k2u, .body = body_macro_switch_k2u},
    [TYPE_SET_U2K_TARGET] = {.start = start_macro_set_u2k_target, .body = NULL},
    [TYPE_SWITCH_U2K] = {.start = NULL, .body = body_macro_switch_u2k},
    [TYPE_SET_H2G_TARGET] = {.start = start_macro_set_h2g_target,
                             .body = body_macro_set_h2g_target},
    [TYPE_SWITCH_H2G] = {.start = start_macro_switch_h2g, .body = body_macro_switch_h2g},
    [TYPE_SET_G2H_TARGET] = {.start = start_macro_set_g2h_target,
                             .body = body_macro_set_g2h_target},
    [TYPE_SWITCH_G2H] = {.start = NULL, .body = body_macro_switch_g2h},
    [TYPE_LANDING_K2U] = {.start = start_macro_landing_k2u, .body = NULL},
    [TYPE_LANDING_U2K] = {.start = start_macro_landing_u2k, .body = NULL},
    [TYPE_LANDING_H2G] = {.start = start_macro_landing_h2g, .body = NULL},
    [TYPE_LANDING_G2H] = {.start = start_macro_landing_g2h, .body = NULL},
    [TYPE_SET_DATA_PERMISSIONS] = {.start = start_macro_set_data_permissions, .body = NULL},
};


================================================
FILE: rvzr/executor_km/x86/page_tables_guest.c
================================================
/// File:
///  - Guest page table management
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#include <asm/io.h>
#include <asm/msr.h>

#include "actor.h"
#include "hardware_desc.h"
#include "main.h"
#include "sandbox_manager.h"
#include "shortcuts.h"

#include "page_tables_common.h"
#include "page_tables_guest.h"

/// @brief Fill in the fields of a regular (non-extended) page table entry.
/// The macro is wrapped in do { } while (0) so that it behaves as a single statement (e.g., inside
/// an unbraced if/else), and every argument is parenthesized so that compound expressions expand
/// as intended.
/// Note: PTE is evaluated several times; do not pass an expression with side effects.
/// @param PTE   lvalue of the entry to initialize
/// @param PADDR physical address the entry points to (the page frame number is PADDR >> 12)
/// @param P     value for the `present` bit
/// @param W     value for the `write_access` bit
/// @param US    value for the `user_supervisor` bit
/// @param PWT   value for the `page_write_through` bit
/// @param PCD   value for the `page_cache_disable` bit
/// @param XD    value for the `execute_disable` bit
/// @param A     value for the `accessed` bit
#define INIT_PTE(PTE, PADDR, P, W, US, PWT, PCD, XD, A)                                            \
    do {                                                                                           \
        (PTE).present = (P);                                                                       \
        (PTE).write_access = (W);                                                                  \
        (PTE).user_supervisor = (US);                                                              \
        (PTE).page_write_through = (PWT);                                                          \
        (PTE).page_cache_disable = (PCD);                                                          \
        (PTE).paddr = (PADDR) >> 12;                                                               \
        (PTE).execute_disable = (XD);                                                              \
        (PTE).accessed = (A);                                                                      \
    } while (0)

/// @brief Fill in the fields of an extended/nested page table entry.
/// The interface is the same for both vendors; only the underlying bit layout differs.
/// The macro is wrapped in do { } while (0) so that it behaves as a single statement, and every
/// argument is parenthesized so that compound expressions (notably X in `(X) ^ 1`) expand as
/// intended.
/// Note: PTE is evaluated several times; do not pass an expression with side effects.
/// @param PTE   lvalue of the entry to initialize
/// @param PADDR host physical address the entry points to (the frame number is PADDR >> 12)
/// @param P     1 if the page is readable/present
/// @param W     1 if the page is writable
/// @param X     1 if the page is executable
/// @param A     value for the `accessed` bit
#if VENDOR_ID == VENDOR_INTEL_
#define INIT_EPTE(PTE, PADDR, P, W, X, A)                                                          \
    do {                                                                                           \
        (PTE).read_access = (P);                                                                   \
        (PTE).write_access = (W);                                                                  \
        (PTE).execute_access = (X);                                                                \
        (PTE).paddr = (PADDR) >> 12;                                                               \
        (PTE).accessed = (A);                                                                      \
    } while (0)
#else // AMD
// The AMD variant uses the regular PTE field names: the entry is always marked as
// user-accessible with write-through and cache-disable cleared, and "executable" is expressed
// through the inverted execute_disable bit
#define INIT_EPTE(PTE, PADDR, P, W, X, A)                                                          \
    do {                                                                                           \
        (PTE).present = (P);                                                                       \
        (PTE).write_access = (W);                                                                  \
        (PTE).user_supervisor = 1;                                                                 \
        (PTE).page_write_through = 0;                                                              \
        (PTE).page_cache_disable = 0;                                                              \
        (PTE).paddr = (PADDR) >> 12;                                                               \
        (PTE).execute_disable = (X) ^ 1;                                                           \
        (PTE).accessed = (A);                                                                      \
    } while (0)
#endif

// Default guest PTE: present, writable, supervisor-only (US=0), write-through and cache-disable
// cleared, executable (XD=0), with the accessed bit pre-set
#define INIT_PTE_DEFAULT(PTE, PADDR)  INIT_PTE(PTE, PADDR, 1, 1, 0, 0, 0, 0, 1)
// Default extended PTE: readable/present, writable, executable, with the accessed bit pre-set
#define INIT_EPTE_DEFAULT(PTE, PADDR) INIT_EPTE(PTE, PADDR, 1, 1, 1, 1)

// Vendor-neutral accessors for the permission bits of an extended page table entry.
// Both the macro argument and the resulting expression are parenthesized so that the accessors
// can be used with arbitrary operands (e.g., `*ptr`) and inside larger expressions.
#if VENDOR_ID == VENDOR_INTEL_
#define EPTE_IS_PRESENT(EPT)         ((EPT).read_access)
#define EPTE_IS_EXECUTABLE(EPT)      ((EPT).execute_access)
#define EPTE_IS_USER_ACCESSIBLE(EPT) ((EPT).user_ex_access)
#else // AMD
#define EPTE_IS_PRESENT(EPT)         ((EPT).present)
#define EPTE_IS_EXECUTABLE(EPT)      ((EPT).execute_disable ^ 1)
#define EPTE_IS_USER_ACCESSIBLE(EPT) ((EPT).user_supervisor)
#endif

// Array of EPT pointers, one per actor; (re)allocated and filled in by update_eptp()
eptp_t *ept_ptr = NULL; // global

// Per-actor buffers, indexed by actor ID; allocated in allocate_guest_page_tables()
static actor_page_table_t *allocated_page_tables = NULL;      // guest page tables
static actor_ept_t *allocated_extended_page_tables = NULL;    // extended page tables
static actor_gdt_t *allocated_guest_gdts = NULL;              // guest GDTs
// Per-actor records of the GVA/GPA/HPA/HVA of every page mapped into the guest
static guest_memory_translations_t *guest_memory_translations = NULL;
// A single page that starts with a VMCALL instruction; mapped into every guest actor
static uint8_t *vmlaunch_page = NULL;
// Per-actor copies of the faulty page's PTE/EPTE, saved before the permissions are modified
// so that the restore_faulty_page_*_permissions() functions can put them back
static pte_t_ *faulty_ptes = NULL;
static epte_t_ *faulty_eptes = NULL;

// Set once set_guest_page_tables() / set_extended_page_tables() have completed successfully
static bool guest_pt_is_set = false;
static bool ept_is_set = false;

// =================================================================================================
// Helper functions
// =================================================================================================
/// @brief Translate a host physical address to a virtual address in high memory.
/// Note: This function is necessary because kernel does not provide a direct interface to search
/// for a physical address in page tables (or at least I couldn't find one)
/// @param hpa Host physical address to translate
/// @return Host virtual address in high memory
static void *phys_to_vmalloc(uint64_t hpa, int actor_id)
{
    hgpa_t *flat_translations = (hgpa_t *)&guest_memory_translations[actor_id];
    for (int i = 0; i < sizeof(guest_memory_translations_t) / sizeof(hgpa_t); i++) {
        if (flat_translations[i].hpa == hpa) {
            return flat_translations[i].hva;
        }
    }
    return 0;
}

/// @brief Check whether a guest physical address is recorded in a set of translation records
/// @param translations One actor's guest_memory_translations_t, viewed as a flat hgpa_t array
/// @param gpa Guest physical address to look for
/// @return true if at least one record has this GPA, false otherwise
static inline bool gpa_is_valid(hgpa_t *translations, uint64_t gpa)
{
    const size_t n_records = sizeof(guest_memory_translations_t) / sizeof(hgpa_t);
    size_t idx = 0;

    while (idx < n_records) {
        if (translations[idx].gpa == gpa)
            return true;
        idx++;
    }
    return false;
}

/// @brief Install a last-level (L1) guest page table entry that maps vaddr to paddr, and record
/// the guest side of the mapping in the given translation record
/// @param pt Last-level page table to modify
/// @param translation Record that receives the guest physical and guest virtual addresses
/// @param paddr Guest physical address of the page
/// @param vaddr Guest virtual address of the page
/// @return 0 on success; the ASSERT fails if the slot is already marked present
static inline int set_last_pt_level(pte_t_ *pt, hgpa_t *translation, uint64_t paddr, uint64_t vaddr)
{
    size_t pt_index = PT_INDEX(vaddr);

    // never overwrite an existing mapping
    ASSERT(pt[pt_index].present == 0, "set_last_pt_level");

    // default permissions, plus the dirty bit pre-set
    pte_t_ *entry = &pt[pt_index];
    INIT_PTE_DEFAULT(*entry, paddr);
    entry->dirty = 1;

    // remember the guest-side addresses of this page
    translation->gva = (void *)vaddr;
    translation->gpa = paddr;
    return 0;
}

/// @brief Map one guest physical page onto the host page backing `hva` in an actor's EPT, and
/// record the host side of the mapping in the translation record
/// @param actor_ept_base EPT of the actor (all four levels)
/// @param translation Record of the page; its gpa must already be set, hpa/hva are filled in here
/// @param l3_hpa Host physical address of the actor's EPT level 3 table
/// @param l2_hpa Host physical address of the actor's EPT level 2 table
/// @param l1_hpa Host physical address of the actor's EPT level 1 table
/// @param hva Host virtual address of the page to map
/// @return 0 on success; the ASSERTs fail on a collision in L1 or if hva has no physical address
static inline int set_ept_entry(actor_ept_t *actor_ept_base, hgpa_t *translation, uint64_t l3_hpa,
                                uint64_t l2_hpa, uint64_t l1_hpa, void *hva)
{
    // source (guest physical) and destination (host physical) of the mapping
    uint64_t gpa = translation->gpa;
    uint64_t hpa = vmalloc_to_phys(hva);

    // the L1 slot must be unused
    // (the way we allocate page could, with very low likelihood, cause a collision)
    ASSERT(actor_ept_base->l1[PT_INDEX(gpa)].paddr == 0, "set_extended_page_tables");
    ASSERT(hpa, "set_extended_page_tables");

    // complete the translation record with the host-side addresses
    translation->hva = hva;
    translation->hpa = hpa;

    // upper levels: each entry points to the next-level table of the same actor
    INIT_EPTE_DEFAULT(actor_ept_base->l4[PML4_INDEX(gpa)], l3_hpa);
    INIT_EPTE_DEFAULT(actor_ept_base->l3[PDPT_INDEX(gpa)], l2_hpa);
    INIT_EPTE_DEFAULT(actor_ept_base->l2[PDT_INDEX(gpa)], l1_hpa);

    // leaf level: points to the page itself and carries the additional properties
    epte_t_ *leaf = &actor_ept_base->l1[PT_INDEX(gpa)];
    INIT_EPTE_DEFAULT(*leaf, hpa);
    leaf->dirty = 1;

#if VENDOR_ID == VENDOR_INTEL_
    leaf->ept_mem_type = 6; // presumably the write-back encoding; confirm against the Intel SDM
    leaf->ignore_pat = 1;
#else
    leaf->page_attribute_table = 1;
#endif

    return 0;
}

// =================================================================================================
// Page table management interface
// =================================================================================================

/// @brief Set the guest page tables for all guest actors according to the layout defined in
/// guest_memory_t (see guest_page_tables.h), with the base address GUEST_MEMORY_START
/// @param void
/// @return 0 on success, -1 on failure
static int set_guest_page_tables(void)
{
    int err = 0;
    uint64_t vaddr = 0;
    uint64_t paddr = 0;

    static size_t old_n_actors = 0;
    if (n_actors > old_n_actors) {
        SAFE_FREE(faulty_ptes);
        SAFE_FREE(faulty_eptes);
        faulty_ptes = (pte_t_ *)CHECKED_ZALLOC(sizeof(pte_t_) * n_actors);
        faulty_eptes = (epte_t_ *)CHECKED_ZALLOC(sizeof(epte_t_) * n_actors);
    }
    old_n_actors = n_actors;

    for (int actor_id = 0; actor_id < n_actors; actor_id++) {
        // skip non-guest actors
        actor_metadata_t *actor = &actors[actor_id];
        if (actor->mode != MODE_GUEST) {
            continue;
        }

        // get a type that represents the guest memory
        guest_memory_t *guest_v_memory = (guest_memory_t *)(GUEST_V_MEMORY_START);
        guest_memory_t *guest_p_memory = (guest_memory_t *)(GUEST_P_MEMORY_START);
        guest_memory_translations_t *translations = &guest_memory_translations[actor_id];

        // Set the first three levels of the page table
        // For convenience, we set GPA of the page tables to the same value as their GVA
        // Also, since the actor's sandbox is fairly small, the first three levels are identical
        // for all addresses within the actor memory
        actor_page_table_t *page_table = &allocated_page_tables[actor_id];
        actor_page_table_t *page_table_gpa = &guest_p_memory->guest_page_tables;
        translations->guest_page_tables[3].gpa = (uint64_t)&page_table_gpa->l4;

        size_t l4_index = PML4_INDEX(GUEST_V_MEMORY_START);
        uint64_t l3_gpa = (uint64_t)&page_table_gpa->l3;
        INIT_PTE_DEFAULT(page_table->l4[l4_index], l3_gpa);
        translations->guest_page_tables[2].gpa = l3_gpa;

        size_t l3_index = PDPT_INDEX(GUEST_V_MEMORY_START);
        uint64_t l2_gpa = (uint64_t)&page_table_gpa->l2;
        INIT_PTE_DEFAULT(page_table->l3[l3_index], l2_gpa);
        translations->guest_page_tables[1].gpa = l2_gpa;

        size_t l2_index = PDT_INDEX(GUEST_V_MEMORY_START);
        uint64_t l1_gpa = (uint64_t)&page_table_gpa->l1;
        INIT_PTE_DEFAULT(page_table->l2[l2_index], l1_gpa);
        translations->guest_page_tables[0].gpa = l1_gpa;

        // set the last level of the page table for each area of the actor sandbox
        for (int i = 0; i < sizeof(util_t); i += 4096) {
            vaddr = ((uint64_t)&guest_v_memory->util) + i;
            paddr = ((uint64_t)&guest_p_memory->util) + i;
            err = set_last_pt_level(page_table->l1, &translations->util[i / 4096], paddr, vaddr);
            CHECK_ERR("set_guest_page_tables");
        }
        for (int i = 0; i < sizeof(actor_data_t); i += 4096) {
            uint64_t vaddr = ((uint64_t)&guest_v_memory->data) + i;
            if (enable_hpa_gpa_collisions) {
                uint64_t aliased_vaddr = ((uint64_t)&sandbox->data[0]) + i;
                paddr = vmalloc_to_phys((void *)aliased_vaddr);
            } else {
                paddr = ((uint64_t)&guest_p_memory->data) + i;
            }
            err = set_last_pt_level(page_table->l1, &translations->data[i / 4096], paddr, vaddr);
            CHECK_ERR("set_guest_page_tables");
        }
        for (int i = 0; i < sizeof(actor_code_t); i += 4096) {
            vaddr = ((uint64_t)&guest_v_memory->code) + i;
            if (enable_hpa_gpa_collisions) {
                uint64_t aliased_vaddr = ((uint64_t)&sandbox->code[0]) + i;
                paddr = vmalloc_to_phys((void *)aliased_vaddr);
            } else {
                paddr = ((uint64_t)&guest_p_memory->code) + i;
            }
            err = set_last_pt_level(page_table->l1, &translations->code[i / 4096], paddr, vaddr);
            CHECK_ERR("set_guest_page_tables");
        }
        { // GDT (indentation is for readability)
            vaddr = (uint64_t)&guest_v_memory->gdt;
            paddr = (uint64_t)&guest_p_memory->gdt;
            err = set_last_pt_level(page_table->l1, &translations->gdt[0], paddr, vaddr);
            CHECK_ERR("set_guest_page_tables");
        }
        { // VMLAUNCH page (indentation is for readability)
            vaddr = (uint64_t)&guest_v_memory->vmlaunch_page[0];
            paddr = (uint64_t)&guest_p_memory->vmlaunch_page[0];
            err = set_last_pt_level(page_table->l1, &translations->vmlaunch_page[0], paddr, vaddr);
            CHECK_ERR("set_guest_page_tables");
        }
    }

    guest_pt_is_set = true;
    return 0;
}

/// @brief Map sandbox_t from host memory into the guest memory of each guest actor, according to
/// the layout defined in guest_memory_t (see page_tables_guest.h), with the base address equal to
/// GUEST_MEMORY_START
/// @param void
/// @return 0 on success, -1 on failure
static int set_extended_page_tables(void)
{
    int err = 0;

    ASSERT(actors != NULL, "set_extended_page_tables");
    ASSERT(sandbox != NULL, "set_extended_page_tables");
    ASSERT(guest_pt_is_set, "set_extended_page_tables");

    for (int actor_id = 0; actor_id < n_actors; actor_id++) {
        // skip non-guest actors
        actor_metadata_t *actor = &actors[actor_id];
        if (actor->mode != MODE_GUEST) {
            continue;
        }
        actor_ept_t *ept_base = &allocated_extended_page_tables[actor_id];
        guest_memory_translations_t *translations = &guest_memory_translations[actor_id];

        // get addresses of the last three levels
        uint64_t l3_hpa = vmalloc_to_phys((void *)ept_base->l3);
        uint64_t l2_hpa = vmalloc_to_phys((void *)ept_base->l2);
        uint64_t l1_hpa = vmalloc_to_phys((void *)ept_base->l1);

        // map util_t into guest memory (the same phys range for all actors, i.e., shared)
        for (int i = 0; i < sizeof(util_t) / PAGE_SIZE; i += 1) {
            void *hva = (void *)&sandbox->util[0] + (i * PAGE_SIZE);
            err = set_ept_entry(ept_base, &translations->util[i], l3_hpa, l2_hpa, l1_hpa, hva);
            CHECK_ERR("set_extended_page_tables");
        }

        // map actor_data_t, actor_code_t, and GDT into guest memory (each actor has its own)
        for (int i = 0; i < sizeof(actor_data_t) / PAGE_SIZE; i += 1) {
            void *hva = (void *)&sandbox->data[actor_id] + (i * PAGE_SIZE);
            err = set_ept_entry(ept_base, &translations->data[i], l3_hpa, l2_hpa, l1_hpa, hva);
            CHECK_ERR("set_extended_page_tables");
        }
        for (int i = 0; i < sizeof(actor_code_t) / PAGE_SIZE; i += 1) {
            void *hva = (void *)&sandbox->code[actor_id] + (i * PAGE_SIZE);
            err = set_ept_entry(ept_base, &translations->code[i], l3_hpa, l2_hpa, l1_hpa, hva);
            CHECK_ERR("set_extended_page_tables");
        }
        { // indent for readability
            void *hva = (void *)&allocated_guest_gdts[actor_id];
            err = set_ept_entry(ept_base, &translations->gdt[0], l3_hpa, l2_hpa, l1_hpa, hva);
            CHECK_ERR("set_extended_page_tables");
        }
        { // indent for readability
            void *hva = (void *)&vmlaunch_page[0];
            err = set_ept_entry(ept_base, &translations->vmlaunch_page[0], l3_hpa, l2_hpa, l1_hpa,
                                hva);
            CHECK_ERR("set_extended_page_tables");
        }

        // map guest page tables
        for (int i = 0; i < sizeof(actor_page_table_t) / PAGE_SIZE; i += 1) {
            void *hva = (void *)&allocated_page_tables[actor_id] + (i * PAGE_SIZE);
            err = set_ept_entry(ept_base, &translations->guest_page_tables[i], l3_hpa, l2_hpa,
                                l1_hpa, hva);
            CHECK_ERR("set_extended_page_tables");
        }
    }

    ept_is_set = true;
    return 0;
}

/// @brief Store a pointer to the EPT of actor 1 (default) in ept_ptr after updating extended page
/// tables
/// @param void
/// @return 0 on success, -1 on failure
static int update_eptp(void)
{
    ASSERT(ept_is_set, "update_eptp");
    SAFE_FREE(ept_ptr);
    ept_ptr = CHECKED_ZALLOC(sizeof(eptp_t) * n_actors);
    for (int actor_id = 0; actor_id < n_actors; actor_id++) {
        actor_ept_t *actor_ept_base = &allocated_extended_page_tables[actor_id];
        ept_ptr[actor_id].memory_type = VMX_BASIC_MEM_TYPE_WB;
        ept_ptr[actor_id].page_walk_length = 3;
        ept_ptr[actor_id].ad_enabled = 1; // native_read_msr(MSR_IA32_VMX_EPT_VPID_CAP) &0x00200000;
        ept_ptr[actor_id].superv_sdw_stack = 0;
        ept_ptr[actor_id].paddr = vmalloc_to_phys(actor_ept_base->l4) >> 12;
    }

    return 0;
}

/// @brief Make the sandbox visible to the guest actors: build the guest page tables, then the
/// extended page tables, and finally refresh the EPT pointers. The buffers must have been
/// allocated beforehand (see allocate_guest_page_tables).
/// @param void
/// @return 0 on success; an error code (as produced by the ASSERT / CHECK_ERR macros) on failure
int map_sandbox_to_guest_memory(void)
{
    ASSERT(allocated_page_tables != NULL, "map_sandbox_to_guest_memory");
    ASSERT(allocated_extended_page_tables != NULL, "map_sandbox_to_guest_memory");
    ASSERT(allocated_guest_gdts != NULL, "map_sandbox_to_guest_memory");

    // step 1: guest virtual -> guest physical
    int err = set_guest_page_tables();
    CHECK_ERR("set_guest_page_tables");

    // step 2: guest physical -> host physical
    err = set_extended_page_tables();
    CHECK_ERR("set_extended_page_tables");

    // step 3: publish the per-actor EPT pointers
    err = update_eptp();
    CHECK_ERR("update_eptp");

    return 0;
}

/// @brief Apply the permissions requested in each guest actor's metadata (data_permissions) to
/// the guest PTE of its faulty page. The original PTE is saved in faulty_ptes first so that
/// restore_faulty_page_guest_permissions() can undo the change.
/// @param void
void set_faulty_page_guest_permissions(void)
{
    // all guest actors use the same virtual layout, hence the L1 index is loop-invariant
    guest_memory_t *guest_v_memory = (guest_memory_t *)(GUEST_V_MEMORY_START);
    size_t index = PT_INDEX(((uint64_t)&guest_v_memory->data.faulty_area[0]));

    for (int actor_id = 0; actor_id < n_actors; actor_id++) {
        actor_metadata_t *actor = &actors[actor_id];
        if (actor->mode != MODE_GUEST)
            continue;

        // snapshot the entry before touching it
        pte_t_ *entry = &allocated_page_tables[actor_id].l1[index];
        faulty_ptes[actor_id] = *entry;

        // only the bits within MODIFIABLE_PTE_BITS may change:
        // those set in the requested value are set, the remaining ones are cleared
        uint64_t requested = actor->data_permissions;
        uint64_t bits_to_set = requested & MODIFIABLE_PTE_BITS;
        uint64_t bits_to_keep = requested | ~MODIFIABLE_PTE_BITS;

        uint64_t *raw_entry = (uint64_t *)entry;
        uint64_t current = *raw_entry;
        uint64_t updated = (current | bits_to_set) & bits_to_keep;

        // write back only when something actually changed
        if (updated != current) {
            *raw_entry = updated;
            // native_page_invalidate(vaddr);
        }
    }
}

void restore_faulty_page_guest_permissions(void)
{
    guest_memory_t *guest_v_memory = (guest_memory_t *)(GUEST_V_MEMORY_START);
    uint64_t vaddr = ((uint64_t)&guest_v_memory->data.faulty_area[0]);
    size_t index = PT_INDEX(vaddr);

    for (int actor_id = 0; actor_id < n_actors; actor_id++) {
        actor_metadata_t *actor = &actors[actor_id];
        if (actor->mode != MODE_GUEST)
            continue;

        allocated_page_tables[actor_id].l1[index] = faulty_ptes[actor_id];
    }
}

/// @brief Apply the properties requested in each guest actor's metadata (data_ept_properties)
/// to the EPT entry of its faulty page. The original entry is saved in faulty_eptes first so
/// that restore_faulty_page_ept_permissions() can undo the change.
/// @param void
void set_faulty_page_ept_permissions(void)
{
    for (int actor_id = 0; actor_id < n_actors; actor_id++) {
        actor_metadata_t *actor = &actors[actor_id];
        if (actor->mode != MODE_GUEST)
            continue;

        // locate the L1 EPT entry through the recorded GPA of the faulty page
        uint64_t gpa = guest_memory_translations[actor_id].data[FAULTY_PAGE_ID].gpa;
        epte_t_ *entry = &allocated_extended_page_tables[actor_id].l1[PT_INDEX(gpa)];

        // snapshot the entry before touching it
        faulty_eptes[actor_id] = *entry;

        // only the bits within MODIFIABLE_EPTE_BITS may change:
        // those set in the requested value are set, the remaining ones are cleared
        uint64_t requested = actor->data_ept_properties;
        uint64_t bits_to_set = requested & MODIFIABLE_EPTE_BITS;
        uint64_t bits_to_keep = requested | ~MODIFIABLE_EPTE_BITS;

        uint64_t *raw_entry = (uint64_t *)entry;
        uint64_t current = *raw_entry;
        uint64_t updated = (current | bits_to_set) & bits_to_keep;

        // write back only when something actually changed
        if (updated != current) {
            *raw_entry = updated;
            // native_page_invalidate(vaddr);
        }
    }
}

void restore_faulty_page_ept_permissions(void)
{
    for (int actor_id = 0; actor_id < n_actors; actor_id++) {
        actor_metadata_t *actor = &actors[actor_id];
        if (actor->mode != MODE_GUEST)
            continue;

        guest_memory_translations_t *translations = &guest_memory_translations[actor_id];
        uint64_t gpa = translations->data[FAULTY_PAGE_ID].gpa;
        size_t index = PT_INDEX(gpa);

        allocated_extended_page_tables[actor_id].l1[index] = faulty_eptes[actor_id];
    }
}

// =================================================================================================
// Debugging Interfaces
// =================================================================================================

/// @brief Dump the guest page tables for a given actor
/// @param actor_id
/// @return 0 on success, -1 on failure
int dbg_dump_guest_page_tables(int actor_id)
{
    // NOTE: the implementation below traverses page tables as if they were unbounded (i.e.,
    //   contained an unlimited number of PTEs, PDs, etc). This is not the case for the guest page
    //   tables as we have only one PT per actor. However, this implementation is more future-proof,
    //   so we have a traditional page walk, and just check the number of entries with asserts
    printk(KERN_INFO "------- Page table dump for actor %d ---------------\n", actor_id);
    actor_page_table_t *page_table = &allocated_page_tables[actor_id];
    guest_memory_translations_t *translations = &guest_memory_translations[actor_id];

    // L4 traversal
    pml4e_t *l4 = page_table->l4;
    for (uint64_t curr_l4_id = 0; curr_l4_id < ENTRIES_PER_PAGE; curr_l4_id += 1) {
        pml4e_t l4e = l4[curr_l4_id]; // current L4 entry
        if (!l4e.present)
            continue;
        // we allocate memory such that only the first L4 entry is used
        ASSERT(curr_l4_id == 0, "dbg_dump_guest_page_tables");

        uint64_t l3_gpa = ((uint64_t)l4e.paddr << 12);
        ASSERT_MSG(l3_gpa == translations->guest_page_tables[2].gpa, "dbg_dump_guest_page_tables",
                   "0x%llx != 0x%llx\n", l3_gpa, translations->guest_page_tables[2].gpa);
        pdpte_t *l3 = (pdpte_t *)translations->guest_page_tables[2].hva;

        // L3 traversal
        for (uint64_t curr_l3_id = 0; curr_l3_id < ENTRIES_PER_PAGE; curr_l3_id += 1) {
            pdpte_t l3e = l3[curr_l3_id]; // current L3 entry
            if (!l3e.present)
                continue;
            // we allocate memory such that only the first L3 entry is used
            ASSERT(curr_l3_id == 0, "dbg_dump_guest_page_tables");

            uint64_t l2_gpa = ((uint64_t)l3e.paddr << 12);
            ASSERT(l2_gpa == translations->guest_page_tables[1].gpa, "dbg_dump_guest_page_tables");
            pdte_t *l2 = (pdte_t *)translations->guest_page_tables[1].hva;

            // L2 traversal
            for (uint64_t curr_l2_id = 0; curr_l2_id < ENTRIES_PER_PAGE; curr_l2_id += 1) {
                pdte_t l2e = l2[curr_l2_id]; // current L2 entry
                if (!l2e.present)
                    continue;
                ASSERT(curr_l2_id == 0, "dbg_dump_guest_page_tables");

                uint64_t l1_gpa = ((uint64_t)l2e.paddr << 12);
                ASSERT(l1_gpa == translations->guest_page_tables[0].gpa,
                       "dbg_dump_guest_page_tables");
                pte_t_ *l1 = (pte_t_ *)translations->guest_page_tables[0].hva;

                // L1 traversal
                for (uint64_t curr_l1_id = 0; curr_l1_id < ENTRIES_PER_PAGE; curr_l1_id += 1) {
                    pte_t_ l1e = l1[curr_l1_id];
                    if (!l1e.present)
                        continue;
                    uint64_t paddr = ((uint64_t)l1e.paddr << 12);
                    uint64_t vaddr = (curr_l4_id << PML4_SHIFT) | (curr_l3_id << PDPT_SHIFT) |
                                     (curr_l2_id << PDT_SHIFT) | (curr_l1_id << PT_SHIFT);
                    char p = l1e.present ? 'P' : '-';
                    char w = l1e.write_access ? 'W' : '-';
                    char us = l1e.user_supervisor ? 'U' : '-';
                    char pwt = l1e.page_write_through ? 'T' : '-';
                    char pcd = l1e.page_cache_disable ? 'C' : '-';
                    char a = l1e.accessed ? 'A' : '-';
                    char d = l1e.dirty ? 'D' : '-';
                    char pat = l1e.page_attribute_table ? 'T' : '-';
                    char g = l1e.global_page ? 'G' : '-';
                    char x = l1e.execute_disable ? '-' : 'X';
                    printk(KERN_INFO "V: 0x%-16llx -> P: 0x%-16llx; %c%c%c%c%c%c%c%c%c%c\n", vaddr,
                           paddr, p, w, us, pwt, pcd, a, d, pat, g, x);
                }
            }
        }
    }
    return 0;
}

int dbg_dump_ept(int actor_id)
{
    printk(KERN_INFO "------- EPT dump -----------------------------------\n");
    actor_ept_t *actor_ept_base = &allocated_extended_page_tables[actor_id];

    // L4 traversal
    epml4e_t *l4 = actor_ept_base->l4;
    for (uint64_t curr_l4_id = 0; curr_l4_id < ENTRIES_PER_PAGE; curr_l4_id += 1) {
        epml4e_t l4e = l4[curr_l4_id];
        if (!EPTE_IS_PRESENT(l4e))
            continue;
        uint64_t l3_hpa = ((uint64_t)l4e.paddr << 12);
        epdpte_t *l3 = actor_ept_base->l3;
        ASSERT((l3_hpa & ~0xFFF) == vmalloc_to_phys(l3), "dbg_dump_ept");

        // L3 traversal
        for (uint64_t curr_l3_id = 0; curr_l3_id < ENTRIES_PER_PAGE; curr_l3_id += 1) {
            epdpte_t l3e = l3[curr_l3_id];
            if (!EPTE_IS_PRESENT(l3e))
                continue;
            uint64_t l2_hpa = ((uint64_t)l3e.paddr << 12);
            epdte_t *l2 = actor_ept_base->l2;
            ASSERT((l2_hpa & ~0xFFF) == vmalloc_to_phys(l2), "dbg_dump_ept");

            // L2 traversal
            for (uint64_t curr_l2_id = 0; curr_l2_id < ENTRIES_PER_PAGE; curr_l2_id += 1) {
                epdte_t l2e = l2[curr_l2_id];
                if (!EPTE_IS_PRESENT(l2e))
                    continue;
                uint64_t l1_hpa = ((uint64_t)l2e.paddr << 12);
                epte_t_ *l1 = actor_ept_base->l1;
                ASSERT((l1_hpa & ~0xFFF) == vmalloc_to_phys(l1), "dbg_dump_ept");

                // L1 traversal
                for (uint64_t curr_l1_id = 0; curr_l1_id < ENTRIES_PER_PAGE; curr_l1_id += 1) {
                    epte_t_ l1e = l1[curr_l1_id];
                    if (!EPTE_IS_PRESENT(l1e))
                        continue;
                    uint64_t gpa = (curr_l4_id << PML4_SHIFT) | (curr_l3_id << PDPT_SHIFT) |
                                   (curr_l2_id << PDT_SHIFT) | (curr_l1_id << PT_SHIFT);

                    // if HPA-GPA collisions are enabled, we will have multiple translations per
                    // physical address; hence, filter out the unused GPAs
                    if (enable_hpa_gpa_collisions &&
                        !gpa_is_valid((hgpa_t *)&guest_memory_translations[actor_id], gpa)) {
                        continue;
                    }

                    uint64_t hpa = ((uint64_t)l1e.paddr << 12);
                    void *hva = phys_to_vmalloc(hpa, actor_id);
                    char r = EPTE_IS_PRESENT(l1e) ? 'R' : '-';
                    char w = l1e.write_access ? 'W' : '-';
                    char x = EPTE_IS_EXECUTABLE(l1e) ? 'X' : '-';
                    char a = l1e.accessed ? 'A' : '-';
                    char d = l1e.dirty ? 'D' : '-';
                    char us = EPTE_IS_USER_ACCESSIBLE(l1e) ? 'U' : '-';
                    printk(KERN_INFO
                           "GP: 0x%-16llx -> HP: 0x%-16llx (HV: 0x%-16llx); %c%c%c%c%c%c\n",
                           gpa, hpa, (uint64_t)hva, r, w, x, a, d, us);
                }
            }
        }
    }
    return 0;
}

// =================================================================================================
/// @brief Allocate (or recycle) the per-actor buffers used for guest memory management: guest
/// page tables, extended page tables, guest GDTs, translation records, the VMLAUNCH page, and
/// the save slots for the faulty-page PTEs/EPTEs.
/// If complete buffers for at least n_actors actors already exist, they are zeroed and reused;
/// otherwise all buffers are released and allocated anew. In both cases the tables are empty
/// afterwards, so the "is set" flags are cleared.
/// @param void
/// @return 0 on success; an error code (as produced by the ASSERT / CHECKED_* macros) on failure
int allocate_guest_page_tables(void)
{
    ASSERT(n_actors < 64, "allocate_guest_page_tables");

    // number of actors the current buffers were successfully allocated for
    static size_t old_n_actors = 0;

    // nothing to allocate or clear
    if (n_actors == 0) {
        return 0;
    }

    // The buffers can be reused only if all of them exist; they may be missing after
    // free_guest_page_tables() or after an allocation that failed half-way
    bool buffers_exist = allocated_page_tables != NULL && allocated_extended_page_tables != NULL &&
                         allocated_guest_gdts != NULL && guest_memory_translations != NULL &&
                         vmlaunch_page != NULL && faulty_ptes != NULL && faulty_eptes != NULL;

    if (buffers_exist && n_actors <= old_n_actors) {
        memset(allocated_page_tables, 0, n_actors * sizeof(actor_page_table_t));
        memset(allocated_extended_page_tables, 0, n_actors * sizeof(actor_ept_t));
        memset(allocated_guest_gdts, 0, n_actors * sizeof(actor_gdt_t));
        memset(guest_memory_translations, 0, n_actors * sizeof(guest_memory_translations_t));
        // the tables were just wiped, so they have to be set again before use
        guest_pt_is_set = false;
        ept_is_set = false;
        return 0;
    }

    // Release everything, including the faulty PTE/EPTE slots (otherwise they would leak when
    // the pointers are overwritten below)
    SAFE_VFREE(allocated_page_tables);
    SAFE_VFREE(allocated_extended_page_tables);
    SAFE_VFREE(allocated_guest_gdts);
    SAFE_FREE(guest_memory_translations);
    SAFE_FREE(vmlaunch_page);
    SAFE_FREE(faulty_ptes);
    SAFE_FREE(faulty_eptes);
    guest_pt_is_set = false;
    ept_is_set = false;
    // the recorded capacity becomes valid again only when all allocations below succeed
    old_n_actors = 0;

    // Guest page tables
    allocated_page_tables =
        (actor_page_table_t *)CHECKED_VMALLOC(n_actors * sizeof(actor_page_table_t));
    memset(allocated_page_tables, 0, n_actors * sizeof(actor_page_table_t));

    // EPTs
    allocated_extended_page_tables = (actor_ept_t *)CHECKED_VMALLOC(n_actors * sizeof(actor_ept_t));
    memset(allocated_extended_page_tables, 0, n_actors * sizeof(actor_ept_t));

    // Guest GDTs; zeroed for consistency with the reuse path above
    allocated_guest_gdts = CHECKED_VMALLOC(n_actors * sizeof(actor_gdt_t));
    memset(allocated_guest_gdts, 0, n_actors * sizeof(actor_gdt_t));

    // Fast translations
    guest_memory_translations = CHECKED_ZALLOC(n_actors * sizeof(guest_memory_translations_t));

    // A page with a single VMCALL instruction; used to put the VM into launched state
    vmlaunch_page = CHECKED_ZALLOC(PAGE_SIZE);
    vmlaunch_page[0] = 0x0f;
    vmlaunch_page[1] = 0x01;
    vmlaunch_page[2] = 0xc1;

    // One save slot per actor (the slots are indexed by actor ID)
    faulty_ptes = (pte_t_ *)CHECKED_ZALLOC(sizeof(pte_t_) * n_actors);
    faulty_eptes = (epte_t_ *)CHECKED_ZALLOC(sizeof(epte_t_) * n_actors);

    old_n_actors = n_actors;
    return 0;
}

void free_guest_page_tables(void)
{
    SAFE_VFREE(allocated_page_tables);
    SAFE_VFREE(allocated_extended_page_tables);
    SAFE_VFREE(allocated_guest_gdts);
    SAFE_FREE(guest_memory_translations);
    SAFE_FREE(ept_ptr);
    SAFE_FREE(vmlaunch_page);
    SAFE_FREE(faulty_ptes);
    SAFE_FREE(faulty_eptes);
}


================================================
FILE: rvzr/executor_km/x86/perf_counters.c
================================================
/// File: Configuration and use of performance counters
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#include <asm/msr-index.h>
#include <linux/kernel.h>
#include <linux/types.h>

#include "main.h"
#include "shortcuts.h"

#include "perf_counters.h"

/// Description of a single performance counter event, as filled in by get_pfc_config_by_name().
/// NOTE(review): the fields presumably mirror the fields of the PMU event-select register;
/// confirm against the code that programs the counters.
struct pfc_config {
    unsigned long evt_num; // event number (selected per event and per CPU model)
    unsigned long umask;   // unit mask of the event
    unsigned long cmask;   // counter mask; 0 for most events
    unsigned int any;      // 0 for most events
    unsigned int edge;     // 0 for most events
    unsigned int inv;      // 0 for most events
};

/// Vendor-independent names of the performance counter events;
/// get_pfc_config_by_name() translates a name into a vendor- and model-specific configuration
typedef enum {
    L1_HITS = 0,                       // on Intel: MEM_LOAD_RETIRED.L1_HIT
    UOPS_ISSUED_ANY = 1,               // on Intel: UOPS_ISSUED.ANY
    UOPS_RETIRED_ANY = 2,              // on Intel: UOPS_RETIRED.RETIRE_SLOTS
    MISPREDICTION_RECOVERY_CYCLES = 3, // on Intel: INT_MISC.CLEAR_RESTEER_CYCLES
    HW_INTERRUPTS_RECEIVED = 4,
    SMI_INTERRUPTS_RECEIVED = 5,
    DECODE_REDIRECTS = 6
} pfc_name_e;

static int get_pfc_config_by_name(pfc_name_e pfc_name, struct pfc_config *config)
{
    uint64_t family = cpuinfo->x86;
    uint64_t model = cpuinfo->x86_model;

    // most commonly, the fields cmask, any, edge, and inv are set to 0
    config->cmask = 0;
    config->any = 0;
    config->edge = 0;
    config->inv = 0;

    // Intel PMU
    if (cpuinfo->x86_vendor == X86_VENDOR_INTEL) {
        switch (pfc_name) {
        case L1_HITS:
            //   MEM_LOAD_RETIRED.L1_HIT: Counts retired load instructions with at least one uop
            //   that hit in the L1 data cache. This event includes all SW prefetches and lock
            //   instructions regardless of the data source.
            config->evt_num = 0xd1;
            config->umask = 0x01;
            break;
        case UOPS_ISSUED_ANY:
            //   UOPS_ISSUED.ANY: Counts the number of uops that the Resource Allocation Table (RAT)
            //   issues to the Reservation Station (RS).
            if (model == 0xBA || model == 0xB7 || model == 0xBF || model == 0x97 || model == 0x9A) {
                config->evt_num = 0xAE;
                config->umask = 0x01;
            } else {
                config->evt_num = 0x0E;
                config->umask = 0x01;
            }
            break;
        case UOPS_RETIRED_ANY:
            //   UOPS_RETIRED.RETIRE_SLOTS: Counts the retirement slots used.
            config->evt_num = 0xC2;
            config->umask = 0x02;
            break;
        case MISPREDICTION_RECOVERY_CYCLES:
            //   INT_MISC.CLEAR_RESTEER_CYCLES: Cycles the issue-stage is waiting for front-end to
            //   fetch from resteered path following branch misprediction or machine clear events.
            if (model == 0xBA || model == 0xB7 || model == 0xBF || model == 0x97 || model == 0x9A) {
                config->evt_num = 0xAD;
                config->umask = 0x80;
            } else {
                config->evt_num = 0x0D;
                config->umask = 0x01;
            }
            break;
        case HW_INTERRUPTS_RECEIVED:
            //   HW_INTERRUPTS.RECEIVED: Counts the number of hardware interruptions received by the
            //   processor.
            config->evt_num = 0xCB;
            config->umask = 0x01;
            break;
        default:
            return -1;
        }
        return 0;
    }

    // AMD PMU
    if (cpuinfo->x86_vendor == X86_VENDOR_AMD) {
        switch (pfc_name) {
        case L1_HITS:
            switch (family) {
            case 0x1a:
            case 0x19:
                // Any Data Cache Fills by Data Source
                config->evt_num = 0x44;
                config->umask = 0xff;
                break;
            default:
                config->evt_num = 0x43;
                config->umask = 0xff;
            }
            break;
        case UOPS_ISSUED_ANY:
            // Dispatched ops
            switch (family) {
            case 0x17:
                // there's no reliable counter of dispatched ops on this family (at least that
                // I know of), so we use a dummy counter that always returns zero; this way,
                // we effectively disable the speculation filter
                config->evt_num = 0x00;
                config->umask = 0x00;
                break;
            default:
                config->evt_num = 0xAB;
                config->umask = 0xff;
            }
            break;
        case UOPS_RETIRED_ANY:
            // Retired ops
            config->evt_num = 0xC1;
            config->umask = 0x00;
            break;
        case MISPREDICTION_RECOVERY_CYCLES:
            // Decode redirects
            config->evt_num = 0x91;
            config->umask = 0x00;
            break;
        case SMI_INTERRUPTS_RECEIVED:
            // SMI monitoring
            config->evt_num = 0x2c;
            config->umask = 0x00;
            break;
        default:
            return -1;
        }
        return 0;
    }

    // unsupported vendor
    return -1;
}

/// @brief  Writes one counter configuration to the event-select MSR of counter `id`.
///         The MSR set is chosen at compile time via VENDOR_ID; if VENDOR_ID is neither
///         1 nor 2, nothing is written. Only the VENDOR_ID == 1 path also zeroes the
///         counter register and touches the global-control MSR.
/// @param  id     Index of the programmable counter to configure
/// @param  config Event settings (event number, unit mask, cmask, any, edge, inv)
/// @param  usr    Value written to bit 16 of the event-select MSR
/// @param  os     Value written to bit 17 of the event-select MSR
/// @return 0 (the function has no failure path)
static int pfc_write(unsigned int id, struct pfc_config *config, unsigned int usr, unsigned int os)
{
    uint64_t perf_configuration = 0;
#if VENDOR_ID == 1
    // set bits 0-3 and bits 32-34 of the global control MSR
    // NOTE(review): only bits 0-3 are set here, while pfc_configure() also programs
    // counter #4 on Intel; confirm that bit 4 is enabled elsewhere
    uint64_t global_ctrl = native_read_msr(MSR_CORE_PERF_GLOBAL_CTRL);
    global_ctrl |= ((uint64_t)7 << 32) | 15;
    wrmsr64(MSR_CORE_PERF_GLOBAL_CTRL, global_ctrl);

    perf_configuration = native_read_msr(MSR_P6_EVNTSEL0 + id);

    // disable the counter (clears the low 32 bits of the event-select value)
    perf_configuration &= ~(((uint64_t)1 << 32) - 1);
    wrmsr64(MSR_P6_EVNTSEL0 + id, perf_configuration);

    // clear
    wrmsr64(MSR_IA32_PERFCTR0 + id, 0ULL);

    // assemble the new event-select value; bit 22 is always set
    perf_configuration |= ((config->cmask & 0xFF) << 24);
    perf_configuration |= (config->inv << 23);
    perf_configuration |= (1ULL << 22);
    perf_configuration |= (config->any << 21);
    perf_configuration |= (config->edge << 18);
    perf_configuration |= (os << 17);
    perf_configuration |= (usr << 16);
    perf_configuration |= ((config->umask & 0xFF) << 8);
    perf_configuration |= (config->evt_num & 0xFF);
    wrmsr64(MSR_P6_EVNTSEL0 + id, perf_configuration);
#elif VENDOR_ID == 2
    perf_configuration = 0;
    // event number bits 8-11 are placed at bits 32-35, bits 0-7 at bits 0-7
    perf_configuration |= ((config->evt_num) & 0xF00) << 24;
    perf_configuration |= (config->evt_num) & 0xFF;
    perf_configuration |= ((config->umask) & 0xFF) << 8;
    perf_configuration |= ((config->cmask) & 0x7F) << 24;
    perf_configuration |= (config->inv << 23);
    perf_configuration |= (1ULL << 22);
    perf_configuration |= (config->edge << 18);
    perf_configuration |= (os << 17);
    perf_configuration |= (usr << 16);
    // control MSRs are addressed with a stride of 2 from MSR_F15H_PERF_CTL
    wrmsr64(MSR_F15H_PERF_CTL + 2 * id, perf_configuration);
#endif
    return 0;
}

int pfc_configure(void)
{
    int err = 0;
    struct pfc_config config = {0};

    // Configure PMU
    // #0:  Htrace collection
    err |= get_pfc_config_by_name(L1_HITS, &config);
    CHECK_ERR("pfc_configure");
    err |= pfc_write(0, &config, 1, 1);
    CHECK_ERR("pfc_configure");

    // #1: Fuzzing feedback
    err |= get_pfc_config_by_name(UOPS_ISSUED_ANY, &config);
    CHECK_ERR("pfc_configure");
    err |= pfc_write(1, &config, 1, 1);
    CHECK_ERR("pfc_configure");

    // #2: Fuzzing feeback
    err |= get_pfc_config_by_name(UOPS_RETIRED_ANY, &config);
    CHECK_ERR("pfc_configure");
    err |= pfc_write(2, &config, 1, 1);
    CHECK_ERR("pfc_configure");

    // #3: Fuzzing feedback
    err |= get_pfc_config_by_name(MISPREDICTION_RECOVERY_CYCLES, &config);
    CHECK_ERR("pfc_configure");
    err |= pfc_write(3, &config, 1, 1);
    CHECK_ERR("pfc_configure");

    // #4: Interrupt detection
    if (cpuinfo->x86_vendor == X86_VENDOR_INTEL) {
        err |= get_pfc_config_by_name(HW_INTERRUPTS_RECEIVED, &config);
        CHECK_ERR("pfc_configure");
        err |= pfc_write(4, &config, 1, 1);
        CHECK_ERR("pfc_configure");
    }

    // #5: SMI monitoring
    if (cpuinfo->x86_vendor == X86_VENDOR_AMD) {
        err |= get_pfc_config_by_name(SMI_INTERRUPTS_RECEIVED, &config);
        CHECK_ERR("pfc_configure");
        err |= pfc_write(5, &config, 1, 1);
        CHECK_ERR("pfc_configure");
    }

    return err;
}

// =================================================================================================
/// @brief Module-level initializer of the performance counter component; currently a no-op
/// @return 0 always
int init_perf_counters(void) { return 0; }
/// @brief Module-level destructor of the performance counter component; currently a no-op
void free_perf_counters(void) {}


================================================
FILE: rvzr/executor_km/x86/registers.h
================================================
/// File: Symbolic names for pre-allocated registers; x86-64 version
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#ifndef X86_REGISTERS_H_
#define X86_REGISTERS_H_

// Register IDs
// Numeric IDs of the sixteen 64-bit general-purpose registers, rax (0x0) through r15 (0xf)
#define RAX_REG_ID 0x0
#define RCX_REG_ID 0x1
#define RDX_REG_ID 0x2
#define RBX_REG_ID 0x3
#define RSP_REG_ID 0x4
#define RBP_REG_ID 0x5
#define RSI_REG_ID 0x6
#define RDI_REG_ID 0x7

// IDs from REX_BOUNDARY upwards belong to r8-r15; presumably these are the registers
// that need a REX prefix when encoded -- confirm against the users of this macro
#define REX_BOUNDARY 0x8
#define R8_REG_ID    0x8
#define R9_REG_ID    0x9
#define R10_REG_ID   0xa
#define R11_REG_ID   0xb
#define R12_REG_ID   0xc
#define R13_REG_ID   0xd
#define R14_REG_ID   0xe
#define R15_REG_ID   0xf

/// Reserved registers
/// (register names as strings; the _32 and _8 variants name the 32-bit and 8-bit
/// views of the same register)
#define STATUS_REGISTER    "r12"
#define STATUS_REGISTER_32 "r12d"
#define STATUS_REGISTER_8  "r12b"

#define HTRACE_REGISTER "r13"
#define MEMORY_BASE_REG "r14"
#define UTIL_BASE_REG   "r15"

#define TMP_REG    "r11" // temporary register for various uses
#define TMP_REG_ID (R11_REG_ID) // numeric ID matching TMP_REG

/// Performance counter registers
/// (names of the registers assigned to counters 0, 1 and 2)
#define PFC0 "r10"
#define PFC1 "r9"
#define PFC2 "r8"

#endif // X86_REGISTERS_H_


================================================
FILE: rvzr/executor_km/x86/special_registers.c
================================================
/// File:
///  - Management of model-specific registers (MSRs)
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#include <asm/msr-index.h>

#include "fault_handler.h"
#include "main.h"
#include "shortcuts.h"
#include "special_registers.h"
#include "test_case_parser.h"

special_registers_t *orig_special_registers_state = NULL; // global

// =================================================================================================
// Local shortcuts to read/write special registers
// =================================================================================================
/// Note: we intentionally don't use the native_read/write_cr0/4 functions here for long-term
/// stability, because their signatures may change between kernel versions

/// @brief Read CR0 with a raw MOV instruction
/// @return Current value of CR0
static inline unsigned long _read_cr0(void)
{
    unsigned long cr0_value = 0;

    asm volatile("mov %%cr0, %0\n" : "=r"(cr0_value));

    return cr0_value;
}

/// @brief Write CR0 with a raw MOV instruction
/// @param val New value of CR0
static inline void _write_cr0(unsigned long val)
{
    asm volatile("mov %0, %%cr0\n" : : "r"(val));
}

/// @brief Read CR4 with a raw MOV instruction
/// @return Current value of CR4
static inline unsigned long _read_cr4(void)
{
    unsigned long cr4_value = 0;

    asm volatile("mov %%cr4, %0\n" : "=r"(cr4_value));

    return cr4_value;
}

/// @brief Write CR4 with a raw MOV instruction
/// @param val New value of CR4
static inline void _write_cr4(unsigned long val)
{
    asm volatile("mov %0, %%cr4\n" : : "r"(val));
}

// =================================================================================================
// Private implementation of special register management
// =================================================================================================

static int store_orig_msr_state(void);

static int set_msrs_for_user_actors(void)
{
#ifdef FORCE_SMAP_OFF
    uint64_t cr4 = _read_cr4();
    cr4 &= ~(X86_CR4_SMAP | X86_CR4_SMEP);
    asm volatile("mov %0, %%cr4" : : "r"(cr4)); // use asm to bypass checks
#endif
    // set default syscall entry point
    wrmsr64(MSR_LSTAR, (uint64_t)fault_handler);

    return 0;
}

/// @brief Configure CR0 and CR4 to enable VMX operation
/// The values are first adjusted to the constraints reported by the
/// IA32_VMX_CRx_FIXED0/FIXED1 MSRs, then CR4.VMXE is set.
/// @param void
/// @return 0 (the function currently has no failure path)
static int set_msrs_for_vmx(void)
{
    uint64_t cr4 = _read_cr4();
    uint64_t cr0 = _read_cr0();

    // Ensure bits in CR0 and CR4 are valid in VMX operation:
    // - Bit X is 1 in _FIXED0: bit X is fixed to 1 in CRx.
    // - Bit X is 0 in _FIXED1: bit X is fixed to 0 in CRx.
    // (source: SDM, 24.8 "restrictions on VMX operation")
    cr0 &= rdmsr64(MSR_IA32_VMX_CR0_FIXED1);
    cr0 |= rdmsr64(MSR_IA32_VMX_CR0_FIXED0);
    cr4 &= rdmsr64(MSR_IA32_VMX_CR4_FIXED1);
    cr4 |= rdmsr64(MSR_IA32_VMX_CR4_FIXED0);
    // CR0 is written first; CR4 is written below, together with the VMXE bit
    _write_cr0(cr0);

    // Enable VMX operation:
    // (source: SDM, 24.7 "Enabling and entering VMX operation")
    // - CR4.VMXE = 1
    cr4 |= X86_CR4_VMXE;
    _write_cr4(cr4);

    return 0;
}

/// @brief Turn on SVM by setting EFER.SVME (if it is not set yet)
/// @param void
/// @return 0 on success; a set bit 4 of MSR_VM_CR is handled by ASSERT
static int set_msrs_for_svm(void)
{
    // Ensure SVM is not disabled in BIOS
    const uint64_t vm_cr = rdmsr64(MSR_VM_CR);
    ASSERT((vm_cr & (1 << 4)) == 0, "set_msrs_for_svm");

    // Enable SVM operation; nothing to write when the bit is already set
    const uint64_t efer = rdmsr64(MSR_EFER);
    if (efer & EFER_SVME)
        return 0;

    const uint64_t efer_with_svme = efer | EFER_SVME;
    wrmsr64(MSR_EFER, efer_with_svme);
    return 0;
}

/// @brief Find the MSR and the bit mask that control the SSBD patch on this CPU
/// The CPU features are probed in a fixed priority order: MSR_SPEC_CTRL, then
/// VIRT_SSBD, then LS_CFG_SSBD (whose bit position depends on the CPU family).
/// @param msr_id   Output: ID of the controlling MSR
/// @param msr_mask Output: mask of the controlling bit(s)
/// @return 0 on success, -1 if no known control exists for this CPU
static int get_ssbp_patch_msr_ctrls(uint64_t *msr_id, uint64_t *msr_mask)
{
    if (cpu_has(cpuinfo, X86_FEATURE_MSR_SPEC_CTRL)) {
        *msr_id = MSR_IA32_SPEC_CTRL;
        *msr_mask = SPEC_CTRL_SSBD;
        return 0;
    }

    if (cpu_has(cpuinfo, X86_FEATURE_VIRT_SSBD)) {
        *msr_id = MSR_AMD64_VIRT_SPEC_CTRL;
        *msr_mask = SPEC_CTRL_SSBD;
        return 0;
    }

    if (!cpu_has(cpuinfo, X86_FEATURE_LS_CFG_SSBD)) {
        PRINT_ERR("ERROR: Unable to patch SSBD on this CPU; no known patch\n");
        return -1;
    }

    // LS_CFG: the position of the control bit differs between CPU families
    *msr_id = MSR_AMD64_LS_CFG;
    switch (cpuinfo->x86) {
    case 0x15:
        *msr_mask = 1ULL << 54;
        return 0;
    case 0x16:
        *msr_mask = 1ULL << 33;
        return 0;
    case 0x17:
        *msr_mask = 1ULL << 10;
        return 0;
    default:
        PRINT_ERR("ERROR: Unable to patch SSBD on this CPU; unexpected CPU model\n");
        return -1;
    }
}

/// @brief Find the MSR and the bit mask that control the hardware prefetchers on this CPU
/// @param msr_id   Output: ID of the prefetcher control MSR
/// @param msr_mask Output: mask of the prefetcher control bits
/// @return 0 on success, -1 if the CPU vendor is not supported (outputs are left untouched)
static int get_prefetcher_msr_ctrls(uint64_t *msr_id, uint64_t *msr_mask)
{
    if (cpuinfo->x86_vendor == X86_VENDOR_INTEL) {
        *msr_id = MSR_MISC_FEATURE_CONTROL;
        switch (cpuinfo->x86_model) {
        case 0x97:
        case 0x9a:
        case 0xba:
        case 0xb7:
        case 0xbf:
            *msr_mask = 0b101111;
            break;
        default:
            *msr_mask = 0b1111;
            break;
        }
        return 0;
    }

    if (cpuinfo->x86_vendor == X86_VENDOR_AMD) {
        switch (cpuinfo->x86) {
        case 0x19:
            *msr_id = 0xc0000108;
            *msr_mask = 0b101111;
            break;
        default:
            *msr_id = MSR_AMD64_DC_CFG;
            *msr_mask = (1 << 13) | (1 << 15);
            break;
        }
        return 0;
    }

    // Unknown vendor: report failure instead of returning success with outputs that were
    // never written, which would make callers read/write whatever MSR ID they held before
    PRINT_ERR("ERROR: Unable to control prefetchers on this CPU; unsupported vendor\n");
    return -1;
}

/// @brief Set or clear a group of bits in an MSR and verify that the write took effect
/// @param msr_id   ID of the MSR to modify
/// @param msr_mask Bits to modify
/// @param enable   true: set the masked bits; false: clear them
/// @return 0 on success, -1 if the MSR does not read back the written value
static int apply_msr_mask(uint64_t msr_id, uint64_t msr_mask, bool enable)
{
    const uint64_t current_value = rdmsr64(msr_id);
    const uint64_t wanted_value = enable ? (current_value | msr_mask) : (current_value & ~msr_mask);

    wrmsr64(msr_id, wanted_value);

    // read back to detect writes that were ignored
    if (rdmsr64(msr_id) == wanted_value)
        return 0;

    PRINT_ERR("ERROR: Not able to set MSR 0x%llx\n", msr_id);
    return -1;
}

// =================================================================================================
// Public interface to special register management
// =================================================================================================

/// @brief Save the original special-register state and apply the configuration
///        required by the current test case
/// Steps: store the original state; (unless VMBUILD) apply the SSBD and prefetcher
/// settings; clear CR0.CD; set CR4.PCE; apply the user-actor and VM-actor specific
/// settings when the test case includes such actors.
/// @return 0 on success; errors of the individual steps are handled by CHECK_ERR
int set_special_registers(void)
{
    int err = 0;
    uint64_t msr_id = 0, msr_mask = 0;

    err = store_orig_msr_state();
    CHECK_ERR("store_orig_msr_state");

#ifndef VMBUILD
    // Speculative Store Bypass (SSBP) patch
    // (the lookup result is checked *before* msr_id is used, so that a failed lookup
    // neither reads an invalid MSR nor records a bogus value for the later restore)
    err = get_ssbp_patch_msr_ctrls(&msr_id, &msr_mask);
    CHECK_ERR("set_enable_ssbp_patch");
    orig_special_registers_state->spec_ctrl = rdmsr64(msr_id);
    err = apply_msr_mask(msr_id, msr_mask, enable_ssbp_patch);
    CHECK_ERR("set_enable_ssbp_patch");

    // Prefetcher control
    err = get_prefetcher_msr_ctrls(&msr_id, &msr_mask);
    CHECK_ERR("set_disable_prefetchers");
    orig_special_registers_state->prefetcher_ctrl = rdmsr64(msr_id);
    // the mask bits are set when prefetchers are to be disabled, hence the negation
    err = apply_msr_mask(msr_id, msr_mask, !enable_prefetchers);
    CHECK_ERR("set_disable_prefetchers");
#endif

    // CR0
    uint64_t cr0 = _read_cr0();
    cr0 &= ~X86_CR0_CD; // enable caching; required for collecting traces
    _write_cr0(cr0);

    // CR4
    uint64_t cr4 = _read_cr4();
    cr4 |= X86_CR4_PCE; // enable performance counters
    _write_cr4(cr4);

    if (test_case->features.includes_user_actors) {
        err = set_msrs_for_user_actors();
        CHECK_ERR("set_msrs_for_user_actors");
    }

    if (test_case->features.includes_vm_actors) {
        if (cpuinfo->x86_vendor == X86_VENDOR_INTEL) {
            err = set_msrs_for_vmx();
        } else if (cpuinfo->x86_vendor == X86_VENDOR_AMD) {
            err = set_msrs_for_svm();
        }
        CHECK_ERR("set_msrs_for_vm_actors");
    }

    return 0;
}

static int store_orig_msr_state(void)
{
    orig_special_registers_state->cr0 = _read_cr0();
    orig_special_registers_state->cr4 = _read_cr4();
    orig_special_registers_state->lstar = rdmsr64(MSR_LSTAR);
    orig_special_registers_state->efer = rdmsr64(MSR_EFER);
    orig_special_registers_state->fs_base = rdmsr64(MSR_FS_BASE);
    orig_special_registers_state->gs_base = rdmsr64(MSR_GS_BASE);

    struct desc_ptr gdtr;
    asm volatile("sgdt %0" : "=m"(gdtr));
    orig_special_registers_state->gdtr_base = gdtr.address;
    orig_special_registers_state->gdtr_limit = gdtr.size;

#if VENDOR_ID == VENDOR_AMD_ // AMD
    orig_special_registers_state->syscfg = rdmsr64(MSR_SYSCFG);
#endif
    return 0;
}

/// @brief Write back the special-register values recorded in orig_special_registers_state
///        and clear the recorded state
/// A recorded value of zero is treated as "not recorded" and is skipped.
/// NOTE(review): as a consequence, a register whose original value really was zero
/// (e.g., a spec_ctrl or prefetcher control MSR with no bits set) is not restored here;
/// confirm whether this matters for the SSBD/prefetcher settings.
/// @return void
void restore_special_registers(void)
{
    uint64_t msr_id = 0, msr_mask = 0;

    // note: the if-zero statements are necessary because the MSR initialization might have failed
    // midway through the process, in which case the MSR state was only partially initialized

    if (orig_special_registers_state->cr0 != 0)
        _write_cr0(orig_special_registers_state->cr0);

    if (orig_special_registers_state->cr4 != 0)
        _write_cr4(orig_special_registers_state->cr4);

    if (orig_special_registers_state->efer != 0)
        wrmsr64(MSR_EFER, orig_special_registers_state->efer);

    if (orig_special_registers_state->lstar != 0)
        wrmsr64(MSR_LSTAR, orig_special_registers_state->lstar);

    if (orig_special_registers_state->spec_ctrl != 0) {
        // write only if the MSR lookup succeeds; on failure msr_id does not name a valid MSR
        if (get_ssbp_patch_msr_ctrls(&msr_id, &msr_mask) == 0)
            wrmsr64(msr_id, orig_special_registers_state->spec_ctrl);
    }

    if (orig_special_registers_state->prefetcher_ctrl != 0) {
        // same guard as above: never write through an MSR ID from a failed lookup
        if (get_prefetcher_msr_ctrls(&msr_id, &msr_mask) == 0)
            wrmsr64(msr_id, orig_special_registers_state->prefetcher_ctrl);
    }

    if (orig_special_registers_state->fs_base != 0) {
        wrmsr64(MSR_FS_BASE, orig_special_registers_state->fs_base);
    }

    if (orig_special_registers_state->gs_base != 0) {
        wrmsr64(MSR_GS_BASE, orig_special_registers_state->gs_base);
    }

    if (orig_special_registers_state->gdtr_base != 0) {
        struct desc_ptr gdtr = {.address = orig_special_registers_state->gdtr_base,
                                .size = orig_special_registers_state->gdtr_limit};
        asm volatile("lgdt %0" : : "m"(gdtr));
    }

#if VENDOR_ID == VENDOR_AMD_ // AMD
    if (orig_special_registers_state->syscfg != 0)
        wrmsr64(MSR_SYSCFG, orig_special_registers_state->syscfg);
#endif

    // mark everything as "not recorded" so that a repeated call becomes a no-op
    memset(orig_special_registers_state, 0, sizeof(special_registers_t));
}

// =================================================================================================
/// @brief Allocate the zero-initialized storage for the original special-register state
/// @return 0 on success; allocation failure is handled inside CHECKED_ZALLOC
///         (presumably by returning an error from this function -- confirm in the macro)
int init_special_register_manager(void)
{
    orig_special_registers_state = CHECKED_ZALLOC(sizeof(special_registers_t));
    return 0;
}

/// @brief Release the storage of the original special-register state
void free_special_register_manager(void) { SAFE_FREE(orig_special_registers_state); }


================================================
FILE: rvzr/executor_km/x86/svm.c
================================================
/// File: Configuration and use of AMD SVM
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#include <linux/types.h>

#include "actor.h"
#include "shortcuts.h"

#include "fault_handler.h"
#include "hardware_desc.h"
#include "main.h"
#include "page_tables_guest.h"
#include "special_registers.h"
#include "svm.h"
#include "svm_constants.h"

bool svm_is_on = false; // global
uint64_t *vmcb_hpas;    // global
uint64_t *vmcb_hvas;    // global

static struct page *host_ssa_page = NULL;
static char *host_ssa_hva = NULL;
static uint64_t orig_host_ssa_hpa = 0;

static struct page *vmcb_pages = NULL;

static void *iopm_hva = NULL;
static uint64_t iopm_hpa = 0;

static void *msrpm_hva = NULL;
static uint64_t msrpm_hpa = 0;

static int set_vmcb_guest_state(vmcb_t *vmcb_hva);
static int set_vmcb_control(vmcb_t *vmcb_hva, uint64_t actor_id);

// =================================================================================================
// Helper functions
// =================================================================================================
#define _BITU(x) (1U << (x))

/// @brief Fill in all four fields of a segment descriptor
/// See arch/x86/svm.c for original implementation
/// @param seg      The segment to initialize
/// @param selector Segment selector
/// @param base     Segment base address
/// @param limit    Segment limit
/// @param attrib   Segment attributes
inline static void init_seg(seg_t *seg, uint16_t selector, uint64_t base, uint32_t limit,
                            uint16_t attrib)
{
    seg->base = base;
    seg->limit = limit;
    seg->attrib = attrib;
    seg->selector = selector;
}

/// @brief Fill in a system segment descriptor: selector 0, base 0, limit 0xffff,
///        and the present bit combined with the given type
/// See arch/x86/svm.c for original implementation
/// @param seg The segment to initialize
/// @param type Segment attributes (OR-ed with SVM_SELECTOR_P_MASK)
static void init_sys_seg(seg_t *seg, uint32_t type)
{
    seg->base = 0;
    seg->limit = 0xffff;
    seg->selector = 0;
    seg->attrib = SVM_SELECTOR_P_MASK | type;
}

// =================================================================================================
// SVM management interface
// (functions exposed to the rest of the executor)
// =================================================================================================

/// @brief Check whether the target CPU is compatible with our implementation of SVM management
/// Requirements checked: SVM feature present; CR0.CD and CR0.NW clear; CR0.PE and CR0.PG
/// set; CR4.PAE set; EFER.LME and EFER.LMA set; bit 24 of MSR_SYSCFG clear.
/// @return 0 if compatible; a failed requirement is handled by ASSERT / ASSERT_MSG
int svm_check_cpu_compatibility(void)
{
    ASSERT_MSG(cpu_has(cpuinfo, X86_FEATURE_SVM), "svm_check_cpu_compatibility",
               "SVM is not supported on this CPU");

    // Control registers
    // (the ASSERT labels name this function, so that a failure is attributed correctly)
    uint64_t cr0 = read_cr0();
    uint64_t cr4 = __read_cr4();
    uint64_t efer = rdmsr64(MSR_EFER);
    ASSERT((cr0 & X86_CR0_CD) == 0, "svm_check_cpu_compatibility");
    ASSERT((cr0 & X86_CR0_NW) == 0, "svm_check_cpu_compatibility");
    ASSERT((cr0 & X86_CR0_PE) != 0, "svm_check_cpu_compatibility");
    ASSERT((cr0 & X86_CR0_PG) != 0, "svm_check_cpu_compatibility");
    ASSERT((cr4 & X86_CR4_PAE) != 0, "svm_check_cpu_compatibility");
    ASSERT((efer & EFER_LME) != 0, "svm_check_cpu_compatibility");
    ASSERT((efer & EFER_LMA) != 0, "svm_check_cpu_compatibility");

    // SNP is not supported
    uint64_t syscfg = rdmsr64(MSR_SYSCFG);
    ASSERT((syscfg & _BITULL(24)) == 0, "svm_check_cpu_compatibility");

    return 0;
}

/// @brief Enable SVM operation
/// @return 0 on success, negative error code on failure
int start_svm_operation(void)
{
    // Note that EFER.SVME is already set in special_registers.c

    // Store the original Host State Save Area
    orig_host_ssa_hpa = rdmsr64(MSR_VM_HSAVE_PA);

    // Prepare Host State Save Area
    memset(host_ssa_hva, 0, PAGE_SIZE);
    wrmsr64(MSR_VM_HSAVE_PA, page_to_pfn(host_ssa_page) << PAGE_SHIFT);
    ((uint64_t *)host_ssa_hva)[0] = 0x42;

    svm_is_on = true;

    return 0;
}

/// @brief Disable SVM operation
/// Writes the MSR_VM_HSAVE_PA value saved by start_svm_operation() back to the MSR
/// and clears the svm_is_on flag.
/// Should never fail as this function can be used in exception handlers.
/// @return void
void stop_svm_operation(void)
{
    // Restore the original Host State Save Area
    wrmsr64(MSR_VM_HSAVE_PA, orig_host_ssa_hpa);

    svm_is_on = false;
}

/// @brief Store the VMCB state that was active when we started
/// Currently a no-op that always reports success.
/// @param void
/// @return 0 always
int store_orig_vmcb_state(void) { return 0; }

/// @brief Restore the VMCB state that was active when we started
/// Currently a no-op.
/// Should never fail as this function can be used in exception handlers.
/// @return void
void restore_orig_vmcb_state(void) {}

/// @brief Configure VMCBs for all guest actors
/// @param void
/// @return 0 on success, negative error code on failure
int set_vmcb_state(void)
{
    int err = 0;

    // initialize VMCBs for all guest actors
    for (int actor_id = 0; actor_id < n_actors; actor_id++) {
        // skip non-guest actors
        actor_metadata_t *actor = &actors[actor_id];
        if (actor->mode != MODE_GUEST)
            continue;

        struct page *vmcb_page = &vmcb_pages[actor_id];
        vmcb_t *vmcb_hva = page_address(vmcb_page);
        vmcb_hvas[actor_id] = (uint64_t)vmcb_hva;
        vmcb_hpas[actor_id] = page_to_pfn(vmcb_page) << PAGE_SHIFT;

        ASSERT(vmcb_hpas[actor_id] != 0, "set_vmcb_state");
        ASSERT((vmcb_hpas[actor_id] & 0xFFF) == 0, "set_vmcb_state");

        // reset VMCB
        memset(vmcb_hva, 0, VMCB_SIZE);

        // set VMCB fields
        err = set_vmcb_guest_state(vmcb_hva);
        CHECK_ERR("set_vmcb_state");

        err = set_vmcb_control(vmcb_hva, actor_id);
        CHECK_ERR("set_vmcb_state");
    }

    return 0;
}

/// @brief Fill in the guest state (save area) of a VMCB
/// Control registers and several MSRs are derived from the current host values; code and
/// stack pointers are addresses inside the guest memory layout.
/// @param vmcb_hva Host-virtual address of the VMCB to fill in
/// @return 0 (err is never modified in this function)
static int set_vmcb_guest_state(vmcb_t *vmcb_hva)
{
    int err = 0;
    vmcb_save_t *save = &vmcb_hva->save;
    // the two pointers below are used for address computation only (no dereference)
    guest_memory_t *guest_v_memory = (guest_memory_t *)(GUEST_V_MEMORY_START);
    guest_memory_t *guest_p_memory = (guest_memory_t *)(GUEST_P_MEMORY_START);

    // - Control registers
    //   (host values adjusted by the must-set / must-clear masks; CR3 is the address of the
    //    guest L4 page table relative to GUEST_P_MEMORY_START)
    save->cr0 = (read_cr0() | MUST_SET_BITS_CR0_SVM_GUEST) & ~MUST_CLEAR_BITS_CR0_SVM_GUEST;
    save->cr3 = (uint64_t)&guest_p_memory->guest_page_tables.l4[0];
    save->cr4 = (__read_cr4() | MUST_SET_BITS_CR4_SVM_GUEST) & ~MUST_CLEAR_BITS_CR4_SVM_GUEST;
    save->efer =
        (rdmsr64(MSR_EFER) | MUST_SET_BITS_EFER_SVM_GUEST) & ~MUST_CLEAR_BITS_EFER_SVM_GUEST;

    // - Debug registers
    save->dr7 = 0x400;
    save->dr6 = 0;

    // - GPRs
    //   (execution starts at the beginning of the guest code section)
    save->rip = (uint64_t)&guest_v_memory->code.section[0];
    save->rsp = (uint64_t)&guest_v_memory->data.main_area[LOCAL_RSP_OFFSET];
    save->rflags = X86_EFLAGS_FIXED;
    save->rax = 0;

    // - Segment registers (values mainly based on https://www.sandpile.org/x86/initial.htm)
    init_seg(&save->cs, 0x10, 0, 0xffffffff, MUST_SET_BITS_CS_SVM_GUEST);
    init_seg(&save->ss, 0x20, 0, 0xffffffff, MUST_SET_BITS_SS_SVM_GUEST);
    init_seg(&save->ds, 0, 0, 0xffffffff, MUST_SET_BITS_DS_SVM_GUEST);
    init_seg(&save->es, 0, 0, 0xffffffff, 0);
    init_seg(&save->fs, 0, 0, 0xffffffff, 0);
    init_seg(&save->gs, 0, 0, 0xffffffff, 0);

    init_sys_seg(&save->ldtr, 2);
    init_sys_seg(&save->tr, 3);

    // - GDTR and IDTR: GDTR points at the GDT inside the guest memory layout; the IDTR
    //   base is left at zero for the time being (attempt to use will cause VM exit)
    save->gdtr.base = (uint64_t)&guest_v_memory->gdt;
    save->gdtr.limit = 0xffff;
    save->idtr.base = 0;
    save->idtr.limit = 0xffff;

    // MSRs
    // (SYSENTER MSRs use fixed guest values rather than the host values)
    save->dbgctl = 0;
    save->sysenter_cs = 0x10;
    // save->sysenter_cs = rdmsr64(MSR_IA32_SYSENTER_CS);
    save->sysenter_esp = (uint64_t)&guest_v_memory->data.main_area[LOCAL_RSP_OFFSET];
    // save->sysenter_esp = rdmsr64(MSR_IA32_SYSENTER_ESP);
    save->sysenter_eip = (uint64_t)&guest_v_memory->code.section[0];
    // save->sysenter_eip = rdmsr64(MSR_IA32_SYSENTER_EIP);

    // (the syscall-related MSRs are copied from the host)
    save->kernel_gs_base = rdmsr64(MSR_KERNEL_GS_BASE);
    save->star = rdmsr64(MSR_STAR);
    save->lstar = rdmsr64(MSR_LSTAR);
    save->cstar = rdmsr64(MSR_CSTAR);
    save->sfmask = rdmsr64(MSR_SYSCALL_MASK);

    // Performance counters
    // (control and counter values of counters 0-3 are copied from the host)
    save->perf_ctl0 = rdmsr64(MSR_F15H_PERF_CTL0);
    save->perf_ctr0 = rdmsr64(MSR_F15H_PERF_CTR0);
    save->perf_ctl1 = rdmsr64(MSR_F15H_PERF_CTL1);
    save->perf_ctr1 = rdmsr64(MSR_F15H_PERF_CTR1);
    save->perf_ctl2 = rdmsr64(MSR_F15H_PERF_CTL2);
    save->perf_ctr2 = rdmsr64(MSR_F15H_PERF_CTR2);
    save->perf_ctl3 = rdmsr64(MSR_F15H_PERF_CTL3);
    save->perf_ctr3 = rdmsr64(MSR_F15H_PERF_CTR3);

    // Privilege level
    save->cpl = 0;

    // PAT
    // (all eight one-byte entries are set to 0x06)
    uint64_t pat = 0;
    for (int i = 0; i < 8; i++) {
        pat |= (uint64_t)0x06 << (i * 8);
    }
    save->g_pat = pat;
    return err;
}

/// @brief Fill in the control area of a VMCB
/// Enables the intercepts listed below, installs the shared I/O and MSR permission maps,
/// assigns the ASID, and enables nested paging with the actor's nested page table.
/// @param vmcb_hva Host-virtual address of the VMCB to fill in
/// @param actor_id ID of the actor that owns the VMCB; used as the ASID and as the index
///                 into ept_ptr
/// @return 0 on success; out-of-range physical addresses are handled by ASSERT
static int set_vmcb_control(vmcb_t *vmcb_hva, uint64_t actor_id)
{
    int err = 0;
    vmcb_control_t *ctrl = &vmcb_hva->control;

    // intercept reads and writes of CR0, CR3, CR4, and CR8
    ctrl->intercept_cr |= _BITU(VMCB_INTERCEPT_CR0_READ);
    ctrl->intercept_cr |= _BITU(VMCB_INTERCEPT_CR3_READ);
    ctrl->intercept_cr |= _BITU(VMCB_INTERCEPT_CR4_READ);
    ctrl->intercept_cr |= _BITU(VMCB_INTERCEPT_CR8_READ);
    ctrl->intercept_cr |= _BITU(VMCB_INTERCEPT_CR0_WRITE);
    ctrl->intercept_cr |= _BITU(VMCB_INTERCEPT_CR3_WRITE);
    ctrl->intercept_cr |= _BITU(VMCB_INTERCEPT_CR4_WRITE);
    ctrl->intercept_cr |= _BITU(VMCB_INTERCEPT_CR8_WRITE);

    // intercept reads and writes of DR0-DR7
    ctrl->intercept_dr |= _BITU(VMCB_INTERCEPT_DR0_READ);
    ctrl->intercept_dr |= _BITU(VMCB_INTERCEPT_DR1_READ);
    ctrl->intercept_dr |= _BITU(VMCB_INTERCEPT_DR2_READ);
    ctrl->intercept_dr |= _BITU(VMCB_INTERCEPT_DR3_READ);
    ctrl->intercept_dr |= _BITU(VMCB_INTERCEPT_DR4_READ);
    ctrl->intercept_dr |= _BITU(VMCB_INTERCEPT_DR5_READ);
    ctrl->intercept_dr |= _BITU(VMCB_INTERCEPT_DR6_READ);
    ctrl->intercept_dr |= _BITU(VMCB_INTERCEPT_DR7_READ);
    ctrl->intercept_dr |= _BITU(VMCB_INTERCEPT_DR0_WRITE);
    ctrl->intercept_dr |= _BITU(VMCB_INTERCEPT_DR1_WRITE);
    ctrl->intercept_dr |= _BITU(VMCB_INTERCEPT_DR2_WRITE);
    ctrl->intercept_dr |= _BITU(VMCB_INTERCEPT_DR3_WRITE);
    ctrl->intercept_dr |= _BITU(VMCB_INTERCEPT_DR4_WRITE);
    ctrl->intercept_dr |= _BITU(VMCB_INTERCEPT_DR5_WRITE);
    ctrl->intercept_dr |= _BITU(VMCB_INTERCEPT_DR6_WRITE);
    ctrl->intercept_dr |= _BITU(VMCB_INTERCEPT_DR7_WRITE);

    // intercept all 32 exception vectors
    ctrl->intercept_exceptions = 0XFFFFFFFF;

    // instruction and event intercepts
    ctrl->intercept |= _BITULL(VMCB_INTERCEPT_INTR);
    ctrl->intercept |= _BITULL(VMCB_INTERCEPT_NMI);
    ctrl->intercept |= _BITULL(VMCB_INTERCEPT_SMI);
    ctrl->intercept |= _BITULL(VMCB_INTERCEPT_INIT);
    ctrl->intercept |= _BITULL(VMCB_INTERCEPT_VINTR);
    ctrl->intercept |= _BITULL(VMCB_INTERCEPT_SELECTIVE_CR0);
    ctrl->intercept |= _BITULL(VMCB_INTERCEPT_STORE_IDTR);
    ctrl->intercept |= _BITULL(VMCB_INTERCEPT_STORE_GDTR);
    ctrl->intercept |= _BITULL(VMCB_INTERCEPT_STORE_LDTR);
    ctrl->intercept |= _BITULL(VMCB_INTERCEPT_STORE_TR);
    ctrl->intercept |= _BITULL(VMCB_INTERCEPT_LOAD_IDTR);
    ctrl->intercept |= _BITULL(VMCB_INTERCEPT_LOAD_GDTR);
    ctrl->intercept |= _BITULL(VMCB_INTERCEPT_LOAD_LDTR);
    ctrl->intercept |= _BITULL(VMCB_INTERCEPT_LOAD_TR);
    ctrl->intercept |= _BITULL(VMCB_INTERCEPT_CPUID);
    ctrl->intercept |= _BITULL(VMCB_INTERCEPT_RSM);
    ctrl->intercept |= _BITULL(VMCB_INTERCEPT_IRET);
    ctrl->intercept |= _BITULL(VMCB_INTERCEPT_INTn);
    ctrl->intercept |= _BITULL(VMCB_INTERCEPT_INVD);
    ctrl->intercept |= _BITULL(VMCB_INTERCEPT_PAUSE);
    ctrl->intercept |= _BITULL(VMCB_INTERCEPT_HLT);
    ctrl->intercept |= _BITULL(VMCB_INTERCEPT_INVLPG);
    ctrl->intercept |= _BITULL(VMCB_INTERCEPT_INVLPGA);
    ctrl->intercept |= _BITULL(VMCB_INTERCEPT_IOIO_PROT);
    ctrl->intercept |= _BITULL(VMCB_INTERCEPT_MSR_PROT);
    ctrl->intercept |= _BITULL(VMCB_INTERCEPT_TASK_SWITCH);
    ctrl->intercept |= _BITULL(VMCB_INTERCEPT_FERR_FREEZE);
    ctrl->intercept |= _BITULL(VMCB_INTERCEPT_SHUTDOWN);
    ctrl->intercept |= _BITULL(VMCB_INTERCEPT_VMRUN);
    ctrl->intercept |= _BITULL(VMCB_INTERCEPT_VMMCALL);
    ctrl->intercept |= _BITULL(VMCB_INTERCEPT_VMLOAD);
    ctrl->intercept |= _BITULL(VMCB_INTERCEPT_VMSAVE);
    ctrl->intercept |= _BITULL(VMCB_INTERCEPT_STGI);
    ctrl->intercept |= _BITULL(VMCB_INTERCEPT_CLGI);
    ctrl->intercept |= _BITULL(VMCB_INTERCEPT_SKINIT);
    ctrl->intercept |= _BITULL(VMCB_INTERCEPT_ICEBP);
    ctrl->intercept |= _BITULL(VMCB_INTERCEPT_WBINVD);
    ctrl->intercept |= _BITULL(VMCB_INTERCEPT_MONITOR);
    ctrl->intercept |= _BITULL(VMCB_INTERCEPT_MWAIT);
    ctrl->intercept |= _BITULL(VMCB_INTERCEPT_MWAIT_COND);
    ctrl->intercept |= _BITULL(VMCB_INTERCEPT_XSETBV);
    ctrl->intercept |= _BITULL(VMCB_INTERCEPT_RDPRU);
    ctrl->intercept |= _BITULL(VMCB_INTERCEPT_EFER_WRITE);
    // DO NOT SET the following bits! Required for htrace collection
    // ctrl->intercept |= _BITULL(VMCB_INTERCEPT_PUSHF);
    // ctrl->intercept |= _BITULL(VMCB_INTERCEPT_POPF);
    // ctrl->intercept |= _BITULL(VMCB_INTERCEPT_RDTSC);
    // ctrl->intercept |= _BITULL(VMCB_INTERCEPT_RDPMC);
    // ctrl->intercept |= _BITULL(VMCB_INTERCEPT_RDTSCP);

    // extended intercepts
    ctrl->intercept_ext |= _BITULL(VMCB_INTERCEPT_ALL_INVLPGB);
    ctrl->intercept_ext |= _BITULL(VMCB_INTERCEPT_INVPCID);
    ctrl->intercept_ext |= _BITULL(VMCB_INTERCEPT_MCOMMIT);
    ctrl->intercept_ext |= _BITULL(VMCB_INTERCEPT_TLBSYNC);
    ctrl->intercept_ext |= _BITULL(VMCB_INTERCEPT_BUS_LOCK);

    ctrl->pause_filter_count = 0;
    ctrl->pause_filter_thresh = 0;

    // I/O and MSR permission maps (shared by all VMCBs)
    ctrl->iopm_base_pa = iopm_hpa;
    ASSERT(ctrl->iopm_base_pa < MAX_PHYSICAL_ADDRESS, "set_vmcb_control");

    ctrl->msrpm_base_pa = msrpm_hpa;
    ASSERT(ctrl->msrpm_base_pa < MAX_PHYSICAL_ADDRESS, "set_vmcb_control");

    ctrl->tsc_offset = 0;

    // the actor ID doubles as the ASID
    // NOTE(review): this presumably relies on actor 0 never being a guest actor, since
    // SVM does not accept ASID 0 for guests -- confirm
    ctrl->asid = (uint32_t)actor_id;

    ctrl->tlb_ctl = 0;
    ctrl->int_ctl = V_INTR_MASKING_MASK;
    ctrl->int_vector = 0;
    ctrl->int_state = 0;

    // nested paging
    ctrl->nested_ctl |= SVM_NESTED_CTL_NP_ENABLE;
    ctrl->nested_ctl |= _BITULL(6); // Read-only guest page tables

    // presumably ept_ptr[].paddr holds a page frame number, hence the shift by 12 -- confirm
    ctrl->nested_cr3 = (((uint64_t)ept_ptr[actor_id].paddr) << 12);
    ASSERT(ctrl->nested_cr3 < MAX_PHYSICAL_ADDRESS, "set_vmcb_control");

    // preset the exit code field with the value 0x42
    ctrl->exit_code = 0x42;

    // no clean bits set
    ctrl->clean = 0;

    return err;
}

/// @brief Print information about the last VM exit
/// @param void
/// @return 0 on success, negative error code on failure
int print_svm_exit_info(void)
{
    int err = 0;

    for (int actor_id = 0; actor_id < n_actors; actor_id++) {
        // skip non-guest actors
        actor_metadata_t *actor = &actors[actor_id];
        if (actor->mode != MODE_GUEST)
            continue;

        struct page *vmcb_page = &vmcb_pages[actor_id];
        vmcb_t *vmcb_hva = page_address(vmcb_page);

        uint64_t exitcode = vmcb_hva->control.exit_code;
        uint64_t exitinfo1 = vmcb_hva->control.exit_info_1;
        uint64_t exitinfo2 = vmcb_hva->control.exit_info_2;
        uint64_t exitintinfo = vmcb_hva->control.exit_int_info;

        // print exit information
        printk(
            KERN_ERR
            "VMCB[%d]: exitcode=0x%llx, exitinfo1=0x%llx, exitinfo2=0x%llx, exitintinfo=0x%llx\n",
            actor_id, exitcode, exitinfo1, exitinfo2, exitintinfo);
        printk(KERN_ERR "insn_len=0x%x, insn_bytes=0x%llx\n", vmcb_hva->control.insn_len,
               *(uint64_t *)(&vmcb_hva->control.insn_bytes[0]));
    }

    return err;
}

// =================================================================================================
int init_svm(void)
{
    int err = 0;

    // VMCBs
    vmcb_pages = CHECKED_ALLOC_PAGES(SVM_MAX_NUM_GUESTS * VMCB_SIZE);
    vmcb_hpas = CHECKED_ZALLOC(SVM_MAX_NUM_GUESTS * sizeof(uint64_t));
    vmcb_hvas = CHECKED_ZALLOC(SVM_MAX_NUM_GUESTS * sizeof(uint64_t));

    // host state save area
    host_ssa_page = alloc_page(GFP_KERNEL);
    if (!host_ssa_page)
        return -ENOMEM;
    host_ssa_hva = page_address(host_ssa_page);

    // IOPM
    struct page *iopm_pages = alloc_pages(GFP_KERNEL, 2);
    if (!iopm_pages)
        return -ENOMEM;
    iopm_hva = page_address(iopm_pages);
    memset(iopm_hva, 0xff, PAGE_SIZE * 4);
    iopm_hpa = page_to_pfn(iopm_pages) << PAGE_SHIFT;

    // MSRPM
    struct page *msrpm_pages = alloc_pages(GFP_KERNEL, 1);
    if (!msrpm_pages)
        return -ENOMEM;
    msrpm_hva = page_address(msrpm_pages);
    memset(msrpm_hva, 0xff, PAGE_SIZE * 2);
    msrpm_hpa = page_to_pfn(msrpm_pages) << PAGE_SHIFT;

    return err;
}

/// @brief Release the memory obtained in init_svm and reset the corresponding globals
/// @return void
void free_svm(void)
{
    // VMCBs and the tables with their addresses
    SAFE_PAGES_FREE(vmcb_pages, SVM_MAX_NUM_GUESTS * VMCB_SIZE);
    SAFE_FREE(vmcb_hpas);
    SAFE_FREE(vmcb_hvas);

    // Host state save area
    if (host_ssa_page != NULL) {
        __free_page(host_ssa_page);
        host_ssa_hva = NULL;
        host_ssa_page = NULL;
    }

    // I/O permission map (order-2 allocation)
    if (iopm_hva != NULL) {
        __free_pages(virt_to_page(iopm_hva), 2);
        iopm_hpa = 0;
        iopm_hva = NULL;
    }

    // MSR permission map (order-1 allocation)
    if (msrpm_hva != NULL) {
        __free_pages(virt_to_page(msrpm_hva), 1);
        msrpm_hpa = 0;
        msrpm_hva = NULL;
    }
}


================================================
FILE: rvzr/executor_km/x86/vmx.c
================================================
/// File: Configuration and use of Intel VMX
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#include <asm/io.h>
#include <asm/msr-index.h>
#include <asm/processor-flags.h>
#include <asm/tlbflush.h>
#include <linux/types.h>

#include "actor.h"
#include "shortcuts.h"

#include "fault_handler.h"
#include "main.h"
#include "page_tables_guest.h"
#include "special_registers.h"
#include "vmx.h"
#include "vmx_config.h"

// NOLINTBEGIN(readability-function-size)
// NOLINTBEGIN(readability-function-cognitive-complexity)
// Justification: these functions directly follow VMX implementation steps as per Intel SDM;
// therefore, they are allowed to be complex

// Assert that the preceding VMX instruction reported neither VMfailInvalid nor VMfailValid.
// Expects `err_inv` and `err_val` to be declared at the expansion site.
// The two assertions are wrapped in braces so that the macro always expands to a single
// statement (e.g., when it is used as the body of an unbraced `if`).
#define CHECK_VMFAIL(src)                                                                          \
    {                                                                                              \
        ASSERT(err_inv == 0, src);                                                                 \
        ASSERT(err_val == 0, src);                                                                 \
    }

// Set by start_vmx_operation and cleared by stop_vmx_operation
bool vmx_is_on = false;     // global
// Host physical address of each actor's VMCS, indexed by actor ID (filled in set_vmcs_state)
uint64_t *vmcs_hpas = NULL; // global

// True if CR4.VMXE was already set in the saved original register state
static bool orig_vmxon_state = false;
// Current-VMCS pointer captured by store_orig_vmcs_state (via VMPTRST)
static uint64_t orig_vmcs_ptr = 0;

// VMXON region: host virtual and host physical address
static void *vmxon_page_hva = NULL;
static uint64_t vmxon_page_hpa = 0;

// Array of VMCSs, indexed by actor ID (allocated in set_vmcs_state)
static vmcs_t *vmcss = NULL;

// Raw values of the VMX capability MSRs, read in vmx_check_cpu_compatibility
static uint64_t supported_vmcs_pin_ctrl = 0;
static uint64_t supported_vmcs_primary_ctrl = 0;
static uint64_t supported_vmcs_secondary_ctrl = 0;

// Forward declarations of the per-VMCS configuration steps used by set_vmcs_state
static int set_vmcs_guest_state(void);
static int set_vmcs_host_state(void);
static int set_vmcs_exec_control(int actor_id);
static int set_vmcs_exit_control(void);
static int set_vmcs_entry_control(void);
static int make_vmcs_launched(int actor_id);
static void print_vmlaunch_error_info(int err_inv, int err_val, int actor_id);

// =================================================================================================
// Error decoding
// =================================================================================================
// Names of the VM-instruction error numbers, indexed by the error number itself.
// The architectural numbering is sparse (14, 21, and 27 are not assigned), so every entry is
// placed with a designated initializer; a densely packed list would shift every name after
// error 13. The unassigned slots carry placeholder strings so that each index below the NULL
// terminator is printable.
static const char *vmx_instruction_error_to_str[] = {
    [0] = "Unknown error: 0",
    [1] = "VMXERR_VMCALL_IN_VMX_ROOT_OPERATION",
    [2] = "VMXERR_VMCLEAR_INVALID_ADDRESS",
    [3] = "VMXERR_VMCLEAR_VMXON_POINTER",
    [4] = "VMXERR_VMLAUNCH_NONCLEAR_VMCS",
    [5] = "VMXERR_VMRESUME_NONLAUNCHED_VMCS",
    [6] = "VMXERR_VMRESUME_AFTER_VMXOFF",
    [7] = "VMXERR_ENTRY_INVALID_CONTROL_FIELD",
    [8] = "VMXERR_ENTRY_INVALID_HOST_STATE_FIELD",
    [9] = "VMXERR_VMPTRLD_INVALID_ADDRESS",
    [10] = "VMXERR_VMPTRLD_VMXON_POINTER",
    [11] = "VMXERR_VMPTRLD_INCORRECT_VMCS_REVISION_ID",
    [12] = "VMXERR_UNSUPPORTED_VMCS_COMPONENT",
    [13] = "VMXERR_VMWRITE_READ_ONLY_VMCS_COMPONENT",
    [14] = "Unknown error: 14",
    [15] = "VMXERR_VMXON_IN_VMX_ROOT_OPERATION",
    [16] = "VMXERR_ENTRY_INVALID_EXECUTIVE_VMCS_POINTER",
    [17] = "VMXERR_ENTRY_NONLAUNCHED_EXECUTIVE_VMCS",
    [18] = "VMXERR_ENTRY_EXECUTIVE_VMCS_POINTER_NOT_VMXON_POINTER",
    [19] = "VMXERR_VMCALL_NONCLEAR_VMCS",
    [20] = "VMXERR_VMCALL_INVALID_VM_EXIT_CONTROL_FIELDS",
    [21] = "Unknown error: 21",
    [22] = "VMXERR_VMCALL_INCORRECT_MSEG_REVISION_ID",
    [23] = "VMXERR_VMXOFF_UNDER_DUAL_MONITOR_TREATMENT_OF_SMIS_AND_SMM",
    [24] = "VMXERR_VMCALL_INVALID_SMM_MONITOR_FEATURES",
    [25] = "VMXERR_ENTRY_INVALID_VM_EXECUTION_CONTROL_FIELDS_IN_EXECUTIVE_VMCS",
    [26] = "VMXERR_ENTRY_EVENTS_BLOCKED_BY_MOV_SS",
    [27] = "Unknown error: 27",
    [28] = "VMXERR_INVALID_OPERAND_TO_INVEPT_INVVPID",
    [29] = NULL};

// Pairs a basic VM exit reason number with its printable name
typedef struct {
    uint16_t basic_exit_reason;
    const char *str;
} vmx_basic_exit_reason_t;

// Lookup table built from VMX_EXIT_REASONS (defined elsewhere);
// terminated by an entry whose `str` is NULL
static vmx_basic_exit_reason_t vmx_basic_exit_reason_to_str[] = {VMX_EXIT_REASONS, {0, NULL}};

// =================================================================================================
// Helper functions
// =================================================================================================
/// @brief Runs VMXON and indicates whether it failed
/// @param phys Physical address of the VMXON region (passed to VMXON as a memory operand)
/// @param err_inv Set if VMXON failed due to VMfailInvalid
/// @param err_val Set if VMXON failed due to VMfailValid
static inline void vmxon(uint64_t phys, uint8_t *err_inv, uint8_t *err_val)
{
    uint8_t inv = 0, val = 0;
    // setc/setz capture CF into `inv` and ZF into `val` right after the instruction
    __asm__ __volatile__("vmxon %[pa]; setc %[inval]; setz %[val]\n"
                         : [val] "=rm"(val), [inval] "=rm"(inv)
                         : [pa] "m"(phys)
                         : "cc", "memory");
    *err_inv = inv;
    *err_val = val;
}

/// @brief Runs VMXOFF and indicates whether it failed
/// @param err_inv Set if VMXOFF failed due to VMfailInvalid
/// @param err_val Set if VMXOFF failed due to VMfailValid
static inline void vmxoff(uint8_t *err_inv, uint8_t *err_val)
{
    uint8_t inv = 0, val = 0;
    // setc/setz capture CF into `inv` and ZF into `val` right after the instruction
    __asm__ __volatile__("vmxoff; setc %[inval]; setz %[val]\n"
                         : [val] "=rm"(val), [inval] "=rm"(inv)
                         :
                         : "cc", "memory");
    *err_inv = inv;
    *err_val = val;
}

/// @brief Runs VMPTRST and indicates whether it failed
/// @param dest Receives the 64-bit value stored by VMPTRST
/// @param err_inv Set to the carry flag observed after the instruction
/// @param err_val Set to the zero flag observed after the instruction
static inline void vmptrst(uint64_t *dest, uint8_t *err_inv, uint8_t *err_val)
{
    uint64_t tmp = 0;
    uint8_t inv = 0, val = 0;
    // the result goes through a local so that the asm gets a plain memory operand
    __asm__ __volatile__("vmptrst %[tmp]; setc %[inval]; setz %[val]\n"
                         : [tmp] "=m"(tmp), [val] "=rm"(val), [inval] "=rm"(inv)
                         :
                         : "cc", "memory");
    *dest = tmp;
    *err_inv = inv;
    *err_val = val;
}

/// @brief Runs VMPTRLD on the given VMCS and indicates whether it failed
/// @param vmcs_hpa Host physical address of the VMCS (passed as a memory operand)
/// @param err_inv Set to the carry flag observed after the instruction
/// @param err_val Set to the zero flag observed after the instruction
static inline void vmptrld(uint64_t vmcs_hpa, uint8_t *err_inv, uint8_t *err_val)
{
    uint8_t inv = 0, val = 0;
    __asm__ __volatile__("vmptrld %[pa]; setc %[inval]; setz %[val]\n"
                         : [val] "=rm"(val), [inval] "=rm"(inv)
                         : [pa] "m"(vmcs_hpa)
                         : "cc", "memory");
    *err_inv = inv;
    *err_val = val;
}

/// @brief Runs VMCLEAR on the given VMCS and indicates whether it failed
/// @param vmcs_hpa Host physical address of the VMCS (passed as a memory operand)
/// @param err_inv Set to the carry flag observed after the instruction
/// @param err_val Set to the zero flag observed after the instruction
static inline void vmclear(uint64_t vmcs_hpa, uint8_t *err_inv, uint8_t *err_val)
{
    uint8_t inv = 0, val = 0;
    __asm__ __volatile__("vmclear %[pa]; setc %[inval]; setz %[val]\n"
                         : [val] "=rm"(val), [inval] "=rm"(inv)
                         : [pa] "m"(vmcs_hpa)
                         : "cc", "memory");
    *err_inv = inv;
    *err_val = val;
}

/// @brief Runs VMREAD on a VMCS field and indicates whether it failed
/// @param field Encoding of the VMCS field to read
/// @param dest Receives the value read; stays 0 if the instruction did not write it
/// @param err_inv Set to the carry flag observed after the instruction
/// @param err_val Set to the zero flag observed after the instruction
static inline void vmread(uint64_t field, uint64_t *dest, uint8_t *err_inv, uint8_t *err_val)
{
    uint8_t inv = 0, val = 0;
    uint64_t dest_local = 0;
    // AT&T operand order: the field encoding is the source, the value is the destination
    __asm__ __volatile__("vmread %[field], %[dest]; setc %[inval]; setz %[val]\n"
                         : [dest] "=rm"(dest_local), [val] "=rm"(val), [inval] "=rm"(inv)
                         : [field] "r"(field)
                         : "cc", "memory");
    *err_inv = inv;
    *err_val = val;
    *dest = dest_local;
}

/// @brief Runs VMWRITE on a VMCS field and indicates whether it failed
/// @param field Encoding of the VMCS field to write
/// @param value Value to store into the field
/// @param err_inv Set to the carry flag observed after the instruction
/// @param err_val Set to the zero flag observed after the instruction
static inline void vmwrite(uint64_t field, uint64_t value, uint8_t *err_inv, uint8_t *err_val)
{
    uint8_t inv = 0, valid = 0;
    // AT&T operand order: the value is the source, the field encoding is the destination
    __asm__ __volatile__("vmwrite %[value], %[field]; setc %[inval]; setz %[valid]\n"
                         : [valid] "=rm"(valid), [inval] "=rm"(inv)
                         : [field] "r"(field), [value] "rm"(value)
                         : "cc", "memory");
    *err_inv = inv;
    *err_val = valid;
}
// Write a VMCS field and assert (via CHECK_VMFAIL) that the VMWRITE did not fail.
// Expects `err_inv` and `err_val` to be declared at the expansion site.
#define CHECKED_VMWRITE(field, value)                                                              \
    {                                                                                              \
        vmwrite(field, value, &err_inv, &err_val);                                                 \
        CHECK_VMFAIL("CHECKED_VMWRITE");                                                           \
    }

/// @brief Validate a 32-bit VMX control word against a capability MSR
/// @param options Control bits that are about to be written into the VMCS
/// @param msr Capability MSR to check against; its low dword holds the bits that must be 1,
///            its high dword holds the bits that are allowed to be 1
/// @return 0 if `options` satisfies both masks, -1 otherwise (an error message is printed)
static int check_vmx_controls(uint32_t options, uint32_t msr)
{
    const uint64_t caps = rdmsr64(msr);
    const uint32_t mask_low = (uint32_t)(caps & 0xFFFFFFFF);
    const uint32_t mask_high = (uint32_t)(caps >> 32);

    const bool missing_required = (mask_low & ~options) != 0;
    const bool sets_forbidden = (options & ~mask_high) != 0;
    if (!missing_required && !sets_forbidden)
        return 0;

    PRINT_ERR("VMX MSR 0x%x: bits not supported (value 0x%x, mask l-0x%x h-0x%x)\n", msr,
              options, mask_low, mask_high);
    return -1;
}

// Write the four guest-state fields of one segment register (selector, base, limit, and
// access rights). `segment` is pasted into the field names, e.g. CS -> GUEST_CS_SELECTOR.
// Expects `err_inv` and `err_val` to be declared at the expansion site (see CHECKED_VMWRITE).
#define VMWRITE_GUEST_SEGMENT(segment, selector, base, limit, ar)                                  \
    {                                                                                              \
        CHECKED_VMWRITE(GUEST_##segment##_SELECTOR, selector);                                     \
        CHECKED_VMWRITE(GUEST_##segment##_BASE, base);                                             \
        CHECKED_VMWRITE(GUEST_##segment##_LIMIT, limit);                                           \
        CHECKED_VMWRITE(GUEST_##segment##_AR_BYTES, ar);                                           \
    }

// =================================================================================================
// VMX management interface
// (functions exposed to the rest of the executor)
// =================================================================================================

/// @brief Check whether the target CPU is compatible with our implementation of VMX management
///
/// Verifies that VMX is available, that the CPU currently runs in paged long mode, that the
/// "true" capability MSRs are usable, and that none of the control bits we need to keep clear
/// are reported as must-be-one by the capability MSRs.
/// As a side effect, caches the pin-based, primary, and secondary capability MSR values in
/// the supported_vmcs_* globals.
/// @return 0 if compatible; incompatibilities are reported through the ASSERT macros
int vmx_check_cpu_compatibility(void)
{
    uint64_t msr_value = 0;

    // Check if VMX is supported
    ASSERT_MSG(cpu_has(cpuinfo, X86_FEATURE_VMX), "vmx_check_cpu_compatibility",
               "VMX is not supported on this CPU");

    // Control registers: protected mode, paging, PAE, and active long mode are required
    uint64_t cr0 = read_cr0();
    uint64_t cr4 = __read_cr4();
    uint64_t efer = rdmsr64(MSR_EFER);
    ASSERT((cr0 & X86_CR0_PE) != 0, "vmx_check_cpu_compatibility");
    ASSERT((cr0 & X86_CR0_PG) != 0, "vmx_check_cpu_compatibility");
    ASSERT((cr4 & X86_CR4_PAE) != 0, "vmx_check_cpu_compatibility");
    ASSERT((efer & EFER_LME) != 0, "vmx_check_cpu_compatibility");
    ASSERT((efer & EFER_LMA) != 0, "vmx_check_cpu_compatibility");

    // True controls are usable
    msr_value = rdmsr64(MSR_IA32_VMX_BASIC);
    ASSERT((msr_value & VMX_BASIC_TRUE_CTLS) != 0, "vmx_check_cpu_compatibility");

    // Pin-based controls
    supported_vmcs_pin_ctrl = rdmsr64(MSR_IA32_VMX_TRUE_PINBASED_CTLS);
    ASSERT((supported_vmcs_pin_ctrl & MUST_CLEAR_PIN_BASED_VM_EXEC_CONTROL) == 0,
           "vmx_check_cpu_compatibility");

    // Primary processor-based controls
    supported_vmcs_primary_ctrl = rdmsr64(MSR_IA32_VMX_TRUE_PROCBASED_CTLS);
    ASSERT((supported_vmcs_primary_ctrl & MUST_CLEAR_PRIMARY_VM_EXEC_CONTROL) == 0,
           "vmx_check_cpu_compatibility");

    // Secondary
    supported_vmcs_secondary_ctrl = rdmsr64(MSR_IA32_VMX_PROCBASED_CTLS2);
    ASSERT((supported_vmcs_secondary_ctrl & MUST_CLEAR_SECONDARY_VM_EXEC_CONTROL) == 0,
           "vmx_check_cpu_compatibility");

    // Exit/entry
    msr_value = rdmsr64(MSR_IA32_VMX_TRUE_EXIT_CTLS);
    ASSERT((msr_value & MUST_CLEAR_EXIT_CTRL) == 0, "vmx_check_cpu_compatibility");
    msr_value = rdmsr64(MSR_IA32_VMX_TRUE_ENTRY_CTLS);
    ASSERT((msr_value & MUST_CLEAR_ENTRY_CTRL) == 0, "vmx_check_cpu_compatibility");

    return 0;
}

/// @brief Enable VMX operation and do VMXON
///
/// If CR4.VMXE was already set in the saved original register state, VMX is treated as
/// already active and only `vmx_is_on` is updated. Otherwise the function validates CR0/CR4,
/// makes sure IA32_FEATURE_CONTROL permits VMXON, initializes the VMXON region, and
/// executes VMXON.
/// @return 0 on success; failures are reported through the ASSERT macros
int start_vmx_operation(void)
{
    uint8_t err_inv = 0, err_val = 0;

    orig_vmxon_state = ((orig_special_registers_state->cr4 & X86_CR4_VMXE) != 0);
    unsigned long cr4 = __read_cr4();
    unsigned long cr0 = read_cr0();

    if (!orig_vmxon_state) {
        // Note: registers are already configured in special_registers.c:set_msrs_for_vmx

        // Check SDM 24.8 "restrictions on VMX operation" and 24.7 "Enabling and entering VMX"
        ASSERT(((cr0 & rdmsr64(MSR_IA32_VMX_CR0_FIXED1)) | rdmsr64(MSR_IA32_VMX_CR0_FIXED0)) == cr0,
               "start_vmx_operation");
        ASSERT((cr4 | X86_CR4_VMXE) == cr4, "start_vmx_operation");

        // Configure IA32_FEATURE_CONTROL MSR to allow VMXON
        //   Bit 0: Lock bit. If clear, VMXON causes a #GP.
        //   Bit 2: Enables VMXON outside of SMX operation. If clear, VMXON
        //          outside of SMX causes a #GP.
        uint64_t feature_control = rdmsr64(MSR_FEATURE_CONTROL);
        uint64_t required = FEATURE_VMX_ENABLED_OUTSIDE_SMX | FEATURE_CTL_LOCKED;
        if ((feature_control & required) != required) {
            // Once the lock bit is set, the MSR is read-only until reset and WRMSR raises #GP.
            // Hence, if the MSR is locked with VMXON disabled, fail instead of writing.
            ASSERT_MSG((feature_control & FEATURE_CTL_LOCKED) == 0, "start_vmx_operation",
                       "VMXON is disabled and locked in IA32_FEATURE_CONTROL");
            wrmsr64(MSR_FEATURE_CONTROL, feature_control | required);
        }

        // Prepare VMXON region:
        // (source: SDM, 25.11.5 VMXON Region)
        // - Write the revision identifier into bits 30:0, and clear bit 31
        memset(vmxon_page_hva, 0, VMXON_SIZE);
        ((vmxon_region_t *)vmxon_page_hva)->revision_id = rdmsr64(MSR_IA32_VMX_BASIC);
        ((vmxon_region_t *)vmxon_page_hva)->reserved_31 = 0;

        // Run VMXON
        vmxon(vmxon_page_hpa, &err_inv, &err_val);
        CHECK_VMFAIL("start_vmx_operation");
    }

    vmx_is_on = true;
    return 0;
}

/// @brief Leave VMX operation (VMXOFF) if this module was the one that entered it
/// This function may be called from exception handlers, so it never fails;
/// a VMXOFF failure is only reported with a warning.
/// @return void
void stop_vmx_operation(void)
{
    uint8_t fail_invalid = 0, fail_valid = 0;

    // VMXOFF is executed only when VMX is on and it was not already on before we started
    const bool entered_by_us = vmx_is_on && !orig_vmxon_state;
    if (entered_by_us) {
        // Drop all EPT-derived translations first so that no stale entries survive VMXOFF
        uint64_t descriptor[2] = {0, 0};
        asm volatile("invept %0, %1" : : "m"(descriptor), "r"(2ULL) : "cc", "memory");

        vmxoff(&fail_invalid, &fail_valid);
        orig_vmxon_state = false;
    }

    vmx_is_on = false;

    if (!fail_invalid && !fail_valid)
        return;

    PRINT_ERRS("stop_vmx_operation", "Exited with VMfailInvalid=%d, VMfailValid=%d\n",
               fail_invalid, fail_valid);
}

/// @brief Remember the VMCS pointer that was current when we started (via VMPTRST)
/// Does nothing if VMX was not in use originally.
/// @param void
/// @return 0 on success; a VMPTRST failure is reported through CHECK_VMFAIL
int store_orig_vmcs_state(void)
{
    uint8_t err_inv = 0, err_val = 0;

    // there is a VMCS pointer to save only if VMX was already on before we started
    if (orig_vmxon_state) {
        vmptrst(&orig_vmcs_ptr, &err_inv, &err_val);
        CHECK_VMFAIL("store_orig_vmcs_state");
    }

    return 0;
}

/// @brief Make the VMCS saved by store_orig_vmcs_state current again (via VMPTRLD)
/// This function may be called from exception handlers, so it never fails;
/// problems are only reported with error messages.
/// @return void
void restore_orig_vmcs_state(void)
{
    uint8_t fail_invalid = 0, fail_valid = 0;

    // Nothing to restore if VMX was off originally
    if (!orig_vmxon_state)
        return;

    // All-ones pointer: presumably the "no current VMCS" value stored by VMPTRST -- TODO confirm
    if (orig_vmcs_ptr == 0xFFFFFFFFFFFFFFFF)
        return;

    if (!vmx_is_on) {
        PRINT_ERR("ERROR: attempting to restore VMX state while VMX is not on\n");
        return;
    }

    if (orig_vmcs_ptr == 0) {
        PRINT_ERR("ERROR: attempting to restore VMX state but no state was stored\n");
        return;
    }

    vmptrld(orig_vmcs_ptr, &fail_invalid, &fail_valid);
    if (fail_invalid || fail_valid)
        PRINT_ERRS("restore_orig_vmcs_state", "Exited with VMfailInvalid=%d, VMfailValid=%d\n",
                   fail_invalid, fail_valid);
}

/// @brief Create, configure, and launch a VMCS for every guest-mode actor
///
/// For each guest actor: records the VMCS physical address in vmcs_hpas, zeroes the VMCS and
/// writes its revision identifier, makes it current (VMCLEAR + VMPTRLD), fills in the guest,
/// host, execution, exit, and entry fields, and finally performs the initial launch.
/// @return 0 on success; failures are reported through the ASSERT/CHECK_* macros
int set_vmcs_state(void)
{
    int err = 0;
    uint8_t err_inv = 0, err_val = 0;

    // if necessary, allocate additional memory for VMCSs
    // (the buffer is replaced only when the number of actors grew since the previous call)
    ASSERT(n_actors <= MAX_ACTORS, "set_vmcs_state:n_actors exceeds MAX_ACTORS");
    static unsigned old_n_actors = 0;
    if (n_actors > old_n_actors) {
        SAFE_VFREE(vmcss);
        vmcss = CHECKED_VMALLOC(n_actors * VMCS_SIZE);
    }
    old_n_actors = n_actors;

    // initialize VMCSs for all guest actors
    for (int actor_id = 0; actor_id < n_actors; actor_id++) {
        // skip non-guest actors
        actor_metadata_t *actor = &actors[actor_id];
        if (actor->mode != MODE_GUEST)
            continue;

        // the VMCS lives in vmalloc memory, so its physical address has to be looked up
        vmcs_t *vmcs_hva = &vmcss[actor_id];
        uint64_t vmcs_hpa = vmalloc_to_phys(vmcs_hva);
        ASSERT(vmcs_hpa != 0, "set_vmcs_state:vmalloc_to_phys");
        vmcs_hpas[actor_id] = vmcs_hpa;

        // initialize VMCS revision identifier
        memset(vmcs_hva, 0, VMCS_SIZE);
        vmcs_hva->revision_id = rdmsr64(MSR_IA32_VMX_BASIC);
        vmcs_hva->abort_indicator = 0;

        // load VMCS
        vmclear(vmcs_hpa, &err_inv, &err_val);
        CHECK_VMFAIL("set_vmcs_state:vmclear");

        vmptrld(vmcs_hpa, &err_inv, &err_val);
        CHECK_VMFAIL("set_vmcs_state:vmptrld");

        // set VMCS fields
        // (the setters below operate on the VMCS made current by the VMPTRLD above)
        err = set_vmcs_guest_state();
        CHECK_ERR("set_vmcs_guest_state");

        err = set_vmcs_host_state();
        CHECK_ERR("set_vmcs_host_state");

        err = set_vmcs_exec_control(actor_id);
        CHECK_ERR("set_vmcs_exec_control");

        err = set_vmcs_exit_control();
        CHECK_ERR("set_vmcs_exit_control");

        err = set_vmcs_entry_control();
        CHECK_ERR("set_vmcs_entry_control");

        // perform the initial VMLAUNCH and finalize RIP/RSP fields
        err = make_vmcs_launched(actor_id);
        CHECK_ERR("set_vmcs_state:make_vmcs_launched");
    }

    return 0;
}

/// @brief Fill in the guest-state area of the current VMCS
///
/// Guest control registers are derived from the host's CR0/CR4 with the VMX-guest
/// must-set/must-clear masks applied; addresses are taken from the guest memory layout
/// (guest-virtual for RSP/RIP/GDT, guest-physical for CR3).
/// @return 0 on success; failures are reported through the ASSERT/CHECKED_VMWRITE macros
static int set_vmcs_guest_state(void)
{
    uint8_t err_inv = 0, err_val = 0;
    guest_memory_t *guest_v_memory = (guest_memory_t *)(GUEST_V_MEMORY_START);
    guest_memory_t *guest_p_memory = (guest_memory_t *)(GUEST_P_MEMORY_START);

    // SDM 25.4 Guest-State Area
    // - Control registers
    uint64_t cr0 = (read_cr0() | MUST_SET_BITS_CR0_VMX_GUEST) & ~MUST_CLEAR_BITS_CR0_VMX_GUEST;
    uint64_t cr4 = (__read_cr4() | MUST_SET_BITS_CR4_VMX_GUEST) & ~MUST_CLEAR_BITS_CR4_VMX_GUEST;
    CHECKED_VMWRITE(GUEST_CR0, cr0);
    CHECKED_VMWRITE(GUEST_CR3, (uint64_t)&guest_p_memory->guest_page_tables.l4[0]);
    CHECKED_VMWRITE(GUEST_CR4, cr4);

    // - Debug register
    CHECKED_VMWRITE(GUEST_DR7, 0x400);

    // - RSP, RIP, and RFLAGS
    // (see also make_vmcs_launched)
    // RIP initially points to the vmlaunch page; make_vmcs_launched redirects it afterwards
    CHECKED_VMWRITE(GUEST_RSP, (uint64_t)&guest_v_memory->data.main_area[LOCAL_RSP_OFFSET]);
    CHECKED_VMWRITE(GUEST_RIP, (uint64_t)&guest_v_memory->vmlaunch_page[0]);
    CHECKED_VMWRITE(GUEST_RFLAGS, (X86_EFLAGS_FIXED));

    // - Segments (values mainly based on https://www.sandpile.org/x86/initial.htm)
    VMWRITE_GUEST_SEGMENT(CS, 0x10, 0, 0xFFFF, 0xa09B);
    VMWRITE_GUEST_SEGMENT(SS, 0x20, 0, 0xFFFF, 0xc093);
    VMWRITE_GUEST_SEGMENT(DS, 0, 0, 0xFFFF, 0x10000); // 0xc093
    VMWRITE_GUEST_SEGMENT(ES, 0, 0, 0xFFFF, 0x10000);
    VMWRITE_GUEST_SEGMENT(FS, 0, 0, 0xFFFF, 0x10000);
    VMWRITE_GUEST_SEGMENT(GS, 0, 0, 0xFFFF, 0x10000);
    VMWRITE_GUEST_SEGMENT(LDTR, 0, 0, 0xFFFF, 0x10000); // 0xc082);
    VMWRITE_GUEST_SEGMENT(TR, 0, 0, 0xFFFF, 0x8b);

    // - GDTR and IDTR: GDTR points to the GDT in guest memory; the IDTR base is left at 0
    //   for the time being
    CHECKED_VMWRITE(GUEST_GDTR_BASE, (uint64_t)&guest_v_memory->gdt);
    CHECKED_VMWRITE(GUEST_GDTR_LIMIT, 0xFFFF);
    CHECKED_VMWRITE(GUEST_IDTR_BASE, 0);
    CHECKED_VMWRITE(GUEST_IDTR_LIMIT, 0xFFFF);

    // - MSRs
    CHECKED_VMWRITE(GUEST_IA32_DEBUGCTL, 0);
    CHECKED_VMWRITE(GUEST_SYSENTER_CS, 0x10);
    CHECKED_VMWRITE(GUEST_SYSENTER_ESP,
                    (uint64_t)&guest_v_memory->data.main_area[LOCAL_RSP_OFFSET]);
    CHECKED_VMWRITE(GUEST_SYSENTER_EIP, (uint64_t)&guest_v_memory->code.section[0]);

    // The guest PERF_GLOBAL_CTRL/PAT/EFER fields are not written above, so the entry controls
    // that would load them must be among the bits we keep clear
    ASSERT((VM_ENTRY_LOAD_IA32_PERF_GLOBAL_CTRL & MUST_CLEAR_ENTRY_CTRL) != 0,
           "set_vmcs_guest_state");
    ASSERT((VM_ENTRY_LOAD_IA32_PAT & MUST_CLEAR_ENTRY_CTRL) != 0, "set_vmcs_guest_state");
    ASSERT((VM_ENTRY_LOAD_IA32_EFER & MUST_CLEAR_ENTRY_CTRL) != 0, "set_vmcs_guest_state");

    // SDM 25.4.2 Guest Non-Register State
    CHECKED_VMWRITE(GUEST_ACTIVITY_STATE, 0);
    CHECKED_VMWRITE(GUEST_INTERRUPTIBILITY_INFO, 0b1000); // block NMI
    CHECKED_VMWRITE(GUEST_PENDING_DBG_EXCEPTIONS, 0);
    CHECKED_VMWRITE(VMCS_LINK_POINTER, -1LL);
    CHECKED_VMWRITE(VMX_PREEMPTION_TIMER_VALUE, 0xFFFF); // FIXME: make configurable

    return 0;
}

/// @brief Fill in the host-state area of the current VMCS
///
/// Most values are snapshots of the current CPU state (control registers, TR, GDTR, segment
/// bases, SYSENTER MSRs, EFER). The IDTR base is taken from `test_case_idtr`.
/// HOST_RSP and HOST_RIP are not written here; they are set in make_vmcs_launched.
/// @return 0 on success; failures are reported through the ASSERT/CHECKED_VMWRITE macros
static int set_vmcs_host_state(void)
{
    uint8_t err_inv = 0, err_val = 0;

    // get TR, GDTR, IDTR and LDTR bases (will be necessary later, in several places)
    uint64_t tr = 0, ldtr = 0;
    struct desc_ptr gdtr, idtr;
    asm volatile("str %[tr]\n"
                 "sgdt %[gdtr]\n"
                 "sidt %[idtr]\n"
                 "sldt %[ldtr]\n"
                 : [tr] "=r"(tr), [gdtr] "=m"(gdtr), [idtr] "=m"(idtr), [ldtr] "=r"(ldtr)
                 :
                 : "memory");

    // The TSS base is scattered over four fields of the TSS descriptor in the GDT.
    // Every part is widened to 64 bits *before* shifting: otherwise the shift is performed in
    // `int`, and `base2 << 24` turns negative when bit 7 of base2 is set, which sign-extends
    // into (and corrupts) the upper 32 bits of the assembled base.
    struct ldttss_desc *tr_register = (struct ldttss_desc *)(gdtr.address + tr);
    uint64_t tr_base = ((uint64_t)tr_register->base0 | ((uint64_t)tr_register->base1 << 16) |
                        ((uint64_t)tr_register->base2 << 24) |
                        ((uint64_t)tr_register->base3 << 32));

    // SDM 25.5 Host-State Area
    // - Control registers
    CHECKED_VMWRITE(HOST_CR0, read_cr0());
    CHECKED_VMWRITE(HOST_CR3, __read_cr3());
    CHECKED_VMWRITE(HOST_CR4, __read_cr4());

    // - RSP and RIP
    // set later (make_vmcs_launched)

    // - Segment selectors
    CHECKED_VMWRITE(HOST_CS_SELECTOR, __KERNEL_CS);
    CHECKED_VMWRITE(HOST_SS_SELECTOR, __KERNEL_DS);
    CHECKED_VMWRITE(HOST_DS_SELECTOR, 0);
    CHECKED_VMWRITE(HOST_ES_SELECTOR, 0);
    CHECKED_VMWRITE(HOST_FS_SELECTOR, 0);
    CHECKED_VMWRITE(HOST_GS_SELECTOR, 0);
    CHECKED_VMWRITE(HOST_TR_SELECTOR, tr);

    // - Segment bases
    CHECKED_VMWRITE(HOST_FS_BASE, rdmsr64(MSR_FS_BASE));
    CHECKED_VMWRITE(HOST_GS_BASE, rdmsr64(MSR_GS_BASE));
    CHECKED_VMWRITE(HOST_TR_BASE, tr_base);
    CHECKED_VMWRITE(HOST_GDTR_BASE, gdtr.address);
    CHECKED_VMWRITE(HOST_IDTR_BASE, test_case_idtr.address);

    // - MSRs
    CHECKED_VMWRITE(HOST_IA32_SYSENTER_CS, rdmsr64(MSR_IA32_SYSENTER_CS));
    CHECKED_VMWRITE(HOST_IA32_SYSENTER_ESP, rdmsr64(MSR_IA32_SYSENTER_ESP));
    CHECKED_VMWRITE(HOST_IA32_SYSENTER_EIP, rdmsr64(MSR_IA32_SYSENTER_EIP));
    CHECKED_VMWRITE(HOST_IA32_EFER, rdmsr64(MSR_EFER));

    // The host PERF_GLOBAL_CTRL/PAT fields are not written above, so the exit controls that
    // would load them must be among the bits we keep clear
    ASSERT((VM_EXIT_LOAD_IA32_PERF_GLOBAL_CTRL & MUST_CLEAR_EXIT_CTRL) != 0, "set_vmcs_host_state");
    ASSERT((VM_EXIT_LOAD_IA32_PAT & MUST_CLEAR_EXIT_CTRL) != 0, "set_vmcs_host_state");
    return 0;
}

/// @brief Fill in the VM-execution control fields of the current VMCS
///
/// Each control word is built from our must-set bits plus the low dword of the corresponding
/// capability MSR, and is validated with check_vmx_controls before being written.
/// Features that this implementation does not configure are asserted to be disabled.
/// @param actor_id Index of the actor; selects the EPT pointer to install
/// @return 0 on success, -1 if a control word is rejected by check_vmx_controls;
///         other failures are reported through the ASSERT/CHECKED_VMWRITE macros
static int set_vmcs_exec_control(int actor_id)
{
    // int err = 0;
    uint8_t err_inv = 0, err_val = 0;

    // SDM 25.6.1 Pin-Based VM-Execution Controls
    uint32_t pin_based_vm_exec_control = MUST_SET_PIN_BASED_VM_EXEC_CONTROL |
                                         (rdmsr64(MSR_IA32_VMX_TRUE_PINBASED_CTLS) & 0xFFFFFFFFULL);
    if (check_vmx_controls(pin_based_vm_exec_control, MSR_IA32_VMX_TRUE_PINBASED_CTLS))
        return -1;
    CHECKED_VMWRITE(PIN_BASED_VM_EXEC_CONTROL, pin_based_vm_exec_control);

    // SDM 25.6.2 Processor-Based VM-Execution Controls
    // - primary
    uint32_t primary_vm_exec_control = MUST_SET_PRIMARY_VM_EXEC_CONTROL |
                                       (rdmsr64(MSR_IA32_VMX_TRUE_PROCBASED_CTLS) & 0xFFFFFFFFULL);
    if (check_vmx_controls(primary_vm_exec_control, MSR_IA32_VMX_TRUE_PROCBASED_CTLS))
        return -1;
    CHECKED_VMWRITE(CPU_BASED_VM_EXEC_CONTROL, primary_vm_exec_control);

    // - secondary
    uint32_t secondary_vm_exec_control = MUST_SET_SECONDARY_VM_EXEC_CONTROL |
                                         (rdmsr64(MSR_IA32_VMX_PROCBASED_CTLS2) & 0xFFFFFFFFULL);
    if (check_vmx_controls(secondary_vm_exec_control, MSR_IA32_VMX_PROCBASED_CTLS2))
        return -1;
    CHECKED_VMWRITE(SECONDARY_VM_EXEC_CONTROL, secondary_vm_exec_control);

    // SDM 25.6.3 Exception Bitmap
    CHECKED_VMWRITE(EXCEPTION_BITMAP, DEFAULT_EXCEPTION_BITMAP);

    // SDM 25.6.4 I/O-Bitmap Addresses
    // (no bitmap addresses are written, so the feature must be off)
    ASSERT((CPU_BASED_USE_IO_BITMAPS & primary_vm_exec_control) == 0, "set_vmcs_exec_control");

    // SDM 25.6.5 Time-Stamp Counter Offset and Multiplier
    ASSERT((CPU_BASED_USE_TSC_OFFSETTING & primary_vm_exec_control) == 0, "set_vmcs_exec_control");

    // SDM 25.6.6 Guest/Host Masks and Read Shadows for CR0 and CR4
    // (both the masks and the read shadows are set to the current host CR0/CR4 values)
    uint64_t cr0 = read_cr0();
    uint64_t cr4 = __read_cr4();
    CHECKED_VMWRITE(CR0_GUEST_HOST_MASK, cr0);
    CHECKED_VMWRITE(CR4_GUEST_HOST_MASK, cr4);
    CHECKED_VMWRITE(CR0_READ_SHADOW, cr0);
    CHECKED_VMWRITE(CR4_READ_SHADOW, cr4);

    // SDM 25.6.7 CR3-Target Controls
    CHECKED_VMWRITE(CR3_TARGET_COUNT, 0);

    // SDM 25.6.8 Controls for APIC Virtualization
    ASSERT((SECONDARY_EXEC_VIRTUALIZE_APIC_ACCESSES & secondary_vm_exec_control) == 0,
           "set_vmcs_exec_control");

    // SDM 25.6.9 MSR-Bitmap Address
    ASSERT((CPU_BASED_USE_MSR_BITMAPS & primary_vm_exec_control) == 0, "set_vmcs_exec_control");

    // SDM 25.6.10 Executive-VMCS Pointer
    // (no idea, leaving it blank for the time being)

    // SDM 25.6.11 Extended-Page-Table Pointer (EPTP)
    // (the actor's ept_ptr entry is reinterpreted as a raw 64-bit value)
    CHECKED_VMWRITE(EPT_POINTER, ((uint64_t *)ept_ptr)[actor_id]);

    // SDM 25.6.12 Virtual-Processor Identifier (VPID)
    ASSERT((SECONDARY_EXEC_ENABLE_VPID & secondary_vm_exec_control) == 0, "set_vmcs_exec_control");

    // SDM 25.6.13 Controls for PAUSE-Loop Exiting
    // not implemented

    // SDM 25.6.14 VM-Functions
    ASSERT((SECONDARY_EXEC_ENABLE_VMFUNC & secondary_vm_exec_control) == 0,
           "set_vmcs_exec_control");

    // SDM 25.6.15 VMCS Shadowing Bitmap Addresses
    ASSERT((SECONDARY_EXEC_SHADOW_VMCS & secondary_vm_exec_control) == 0, "set_vmcs_exec_control");

    // SDM 25.6.16 ENCLS-Exiting Bitmap
    // (written only when the cached capability value has the ENCLS-exiting bit set)
    if (supported_vmcs_secondary_ctrl & SECONDARY_EXEC_ENCLS_EXITING) {
        ASSERT((SECONDARY_EXEC_ENCLS_EXITING & secondary_vm_exec_control) != 0,
               "set_vmcs_exec_control");
        CHECKED_VMWRITE(ENCLS_EXITING_BITMAP, 0x0FFFFFFFFFFFFFFFULL);
    }

    // Misc. features (25.6.14--23) are disabled
    return 0;
}

/// @brief Fill in the VM-exit control fields of the current VMCS
/// @return 0 on success, -1 if the control word is rejected by check_vmx_controls;
///         VMWRITE failures are reported through CHECKED_VMWRITE
static int set_vmcs_exit_control(void)
{
    uint8_t err_inv = 0, err_val = 0;

    // our must-set bits, plus the low dword of the capability MSR
    uint64_t from_msr = rdmsr64(MSR_IA32_VMX_TRUE_EXIT_CTLS) & 0xFFFFFFFFULL;
    uint64_t controls = MUST_SET_EXIT_CTRL | from_msr;
    if (check_vmx_controls(controls, MSR_IA32_VMX_TRUE_EXIT_CTLS) != 0)
        return -1;
    CHECKED_VMWRITE(VM_EXIT_CONTROLS, controls);

    // SDM 25.7.2 VM-Exit Controls for MSRs: no MSRs are stored or loaded on exit
    CHECKED_VMWRITE(VM_EXIT_MSR_STORE_COUNT, 0);
    CHECKED_VMWRITE(VM_EXIT_MSR_LOAD_COUNT, 0);

    return 0;
}

/// @brief Fill in the VM-entry control fields of the current VMCS
/// @return 0 on success, -1 if the control word is rejected by check_vmx_controls;
///         VMWRITE failures are reported through CHECKED_VMWRITE
static int set_vmcs_entry_control(void)
{
    uint8_t err_inv = 0, err_val = 0;

    // our must-set bits, plus the low dword of the capability MSR
    uint64_t from_msr = rdmsr64(MSR_IA32_VMX_TRUE_ENTRY_CTLS) & 0xFFFFFFFFULL;
    uint64_t controls = MUST_SET_ENTRY_CTRL | from_msr;
    if (check_vmx_controls(controls, MSR_IA32_VMX_TRUE_ENTRY_CTLS) != 0)
        return -1;
    CHECKED_VMWRITE(VM_ENTRY_CONTROLS, controls);

    // SDM 25.8.2 VM-Entry Controls for MSRs: no MSRs are loaded on entry
    CHECKED_VMWRITE(VM_ENTRY_MSR_LOAD_COUNT, 0);

    // SDM 25.8.3 VM-Entry Controls for Event Injection: nothing is injected
    CHECKED_VMWRITE(VM_ENTRY_INTR_INFO_FIELD, 0);

    return 0;
}

/// @brief Perform the initial VMLAUNCH of an actor's VMCS and finalize its RIP/RSP fields
///
/// The VMCS is launched once with HOST_RIP/HOST_RSP pointing back into this function, so that
/// the first VM exit returns here. Afterwards, the guest entry point and the host exit
/// handler/stack are set to the values used for the actual test case execution.
/// @param actor_id Index of the actor whose VMCS is launched
/// @return 0 on success; failures are reported through the ASSERT/CHECK_* macros
static int make_vmcs_launched(int actor_id)
{
    uint8_t err_inv = 0, err_val = 0;

    // 1. Load VMCS
    uint64_t vmcs_hpa = vmcs_hpas[actor_id];
    vmptrld(vmcs_hpa, &err_inv, &err_val);
    CHECK_VMFAIL("make_vmcs_launched:vmptrld");

    // 2. Launch VM
    //
    // Note 1: HOST_RIP and HOST_RSP must be set in assembly to capture the correct
    // return address and stack pointer for VM exit. After VM exit, guest may have
    // modified any general-purpose registers, so we clobber all caller-saved regs.
    //
    // Note 2: If vmlaunch succeeds, it transfers control to guest and the setc/setz
    // instructions are skipped. On VM exit, we return to label 1 with err flags = 0.
    // If vmlaunch fails, setc/setz execute and we jump to label 1 with error flags set.
    //
    // Note 3: The error flags are cleared with `movb $0` rather than `xor`: their "+rm"
    // constraint lets the compiler place them in memory, and an xor with two memory
    // operands cannot be encoded, whereas a byte-sized immediate store works for both
    // register and memory operands.
    asm volatile(""
                 "movb $0, %[inval]\n"
                 "movb $0, %[val]\n"
                 "lea 1f(%%rip), %%rax\n"
                 "mov %[host_rip], %%rcx\n"
                 "vmwrite %%rax, %%rcx\n"
                 "mov %%rsp, %%rax\n"
                 "mov %[host_rsp], %%rcx\n"
                 "vmwrite %%rax, %%rcx\n"
                 "vmlaunch\n"
                 "setc %[inval]\n"
                 "setz %[val]\n"
                 "1:\n"
                 : [val] "+rm"(err_val), [inval] "+rm"(err_inv)
                 : [host_rip] "i"((uint64_t)HOST_RIP), [host_rsp] "i"((uint64_t)HOST_RSP)
                 : "cc", "memory", "rax", "rcx", "rdx", "rsi", "rdi", "r8", "r9", "r10", "r11");

    // 3. If vmlaunch failed, print error info
    if (err_inv || err_val) {
        print_vmlaunch_error_info(err_inv, err_val, actor_id);
    }
    CHECK_VMFAIL("make_vmcs_launched:vmlaunch");

    // 4. Check that the launch was successful (abort indicator check)
    ASSERT(vmcss[actor_id].abort_indicator == 0, "make_vmcs_launched:abort_indicator");
    uint64_t exit_reason = 0;
    vmread(VM_EXIT_REASON, &exit_reason, &err_inv, &err_val);
    CHECK_VMFAIL("make_vmcs_launched:VM_EXIT_REASON");
    // Expected exit reasons after initial vmlaunch: VMCALL (guest code) or timeout
    ASSERT((exit_reason == EXIT_REASON_VMCALL || exit_reason == EXIT_REASON_PREEMPTION_TIMER),
           "make_vmcs_launched:unexpected exit reason");

    // 5. Finalize VMCS fields
    // (guest starts at the code section; VM exits go to fault_handler on the sandbox stack)
    guest_memory_t *guest_v_memory = (guest_memory_t *)(GUEST_V_MEMORY_START);
    CHECKED_VMWRITE(GUEST_RIP, (uint64_t)&guest_v_memory->code.section[0]);
    CHECKED_VMWRITE(GUEST_RSP, (uint64_t)&guest_v_memory->data.main_area[LOCAL_RSP_OFFSET]);
    CHECKED_VMWRITE(HOST_RIP, (uint64_t)fault_handler);
    CHECKED_VMWRITE(HOST_RSP, (uint64_t)&sandbox->data[0].main_area[LOCAL_RSP_OFFSET]);

    return 0;
}

/// @brief Print diagnostics for a failed VMLAUNCH
/// @param err_inv Non-zero if the launch failed with VMfailInvalid
/// @param err_val Non-zero if the launch failed with VMfailValid; in this case the
///                VM-instruction error field is read from the current VMCS and decoded
/// @param actor_id Index of the actor whose VMCS abort indicator is printed
/// @return void
static void print_vmlaunch_error_info(int err_inv, int err_val, int actor_id)
{
    PRINT_ERR("vmlaunch failed: VMfailInvalid=%d, VMfailValid=%d\n", err_inv, err_val);
    if (err_val) {
        uint64_t instr_error = 0;
        uint8_t tmp_inv = 0, tmp_val = 0;
        vmread(VM_INSTRUCTION_ERROR, &instr_error, &tmp_inv, &tmp_val);
        if (tmp_inv || tmp_val) {
            // do not report the zero-initialized value as if it were the real error number
            PRINT_ERR("VM_INSTRUCTION_ERROR: unavailable (vmread failed)\n");
        } else {
            PRINT_ERR("VM_INSTRUCTION_ERROR: %llu\n", instr_error);

            // The bound is derived from the table itself, so that it cannot drift from the
            // table contents; empty (NULL) slots, such as the terminator, are skipped.
            const uint64_t n_entries =
                sizeof(vmx_instruction_error_to_str) / sizeof(vmx_instruction_error_to_str[0]);
            if (instr_error > 0 && instr_error < n_entries &&
                vmx_instruction_error_to_str[instr_error] != NULL) {
                PRINT_ERR("  decoded: %s\n", vmx_instruction_error_to_str[instr_error]);
            }
        }
    }
    PRINT_ERR("VMCS abort indicator: %d\n", vmcss[actor_id].abort_indicator);
}

// Dump VMX diagnostics through PRINT_ERR: the abort indicator of every guest-mode actor,
// followed by the exit-information fields read from the VMCS with vmread.
//
// Returns 0 when the end of the function is reached.
// NOTE(review): CHECK_VMFAIL presumably inspects err_inv/err_val and bails out on a failed
// vmread -- confirm against the macro definition before renaming these locals.
int print_vmx_exit_info(void)
{
    uint8_t err_inv = 0, err_val = 0;
    uint64_t value = 0;

    // Abort reasons
    PRINT_ERR("VMX Abort indicators:\n");
    for (int actor_id = 0; actor_id < n_actors; actor_id++) {
        if (actors[actor_id].mode == MODE_GUEST)
            PRINT_ERR("  actor 0x%x: %d\n", actor_id, vmcss[actor_id].abort_indicator);
    }

    // VM exit reason
    PRINT_ERR("VMXC exit info:\n");
    vmread(VM_EXIT_REASON, &value, &err_inv, &err_val);
    CHECK_VMFAIL("print_vmx_exit_info:VM_EXIT_REASON");
    PRINT_ERR("  VM exit reason: 0x%llx\n", value);
    if (value != 0) {
        // the low 16 bits hold the basic reason; bit 31 selects the "entry" label below
        uint16_t basic_reason = value & 0xFFFF;
        char *exit_type = NULL;
        if (value & (1ULL << 31))
            exit_type = "entry";
        else
            exit_type = "exit";

        // linear search through the table; the table is terminated by an entry with str == NULL
        for (int i = 0; vmx_basic_exit_reason_to_str[i].str != NULL; i++) {
            if (basic_reason == vmx_basic_exit_reason_to_str[i].basic_exit_reason) {
                PRINT_ERR("    decoded: %s [%s]\n", vmx_basic_exit_reason_to_str[i].str, exit_type);
                break;
            }
        }
    }

    // The remaining fields are printed as raw hexadecimal values
    vmread(EXIT_QUALIFICATION, &value, &err_inv, &err_val);
    CHECK_VMFAIL("print_vmx_exit_info:EXIT_QUALIFICATION");
    PRINT_ERR("  Exit qualification: 0x%llx\n", value);

    vmread(GUEST_LINEAR_ADDRESS, &value, &err_inv, &err_val);
    CHECK_VMFAIL("print_vmx_exit_info:GUEST_LINEAR_ADDRESS");
    PRINT_ERR("  Guest linear address: 0x%llx\n", value);

    vmread(GUEST_PHYSICAL_ADDRESS, &value, &err_inv, &err_val);
    CHECK_VMFAIL("print_vmx_exit_info:GUEST_PHYSICAL_ADDRESS");
    PRINT_ERR("  Guest physical address: 0x%llx\n", value);

    vmread(VM_EXIT_INTR_INFO, &value, &err_inv, &err_val);
    CHECK_VMFAIL("print_vmx_exit_info:VM_EXIT_INTR_INFO");
    PRINT_ERR("  VM exit interrupt info: 0x%llx\n", value);

    vmread(VM_EXIT_INTR_ERROR_CODE, &value, &err_inv, &err_val);
    CHECK_VMFAIL("print_vmx_exit_info:VM_EXIT_INTR_ERROR_CODE");
    PRINT_ERR("  VM exit interrupt error code: 0x%llx\n", value);

    vmread(IDT_VECTORING_INFO_FIELD, &value, &err_inv, &err_val);
    CHECK_VMFAIL("print_vmx_exit_info:IDT_VECTORING_INFO_FIELD");
    PRINT_ERR("  IDT vectoring info field: 0x%llx\n", value);

    vmread(IDT_VECTORING_ERROR_CODE, &value, &err_inv, &err_val);
    CHECK_VMFAIL("print_vmx_exit_info:IDT_VECTORING_ERROR_CODE");
    PRINT_ERR("  IDT vectoring error code: 0x%llx\n", value);

    vmread(VM_EXIT_INSTRUCTION_LEN, &value, &err_inv, &err_val);
    CHECK_VMFAIL("print_vmx_exit_info:VM_EXIT_INSTRUCTION_LEN");
    PRINT_ERR("  VM exit instruction length: 0x%llx\n", value);

    vmread(VMX_INSTRUCTION_INFO, &value, &err_inv, &err_val);
    CHECK_VMFAIL("print_vmx_exit_info:VMX_INSTRUCTION_INFO");
    PRINT_ERR("  VM exit instruction info: 0x%llx\n", value);

    vmread(VM_INSTRUCTION_ERROR, &value, &err_inv, &err_val);
    CHECK_VMFAIL("print_vmx_exit_info:VM_INSTRUCTION_ERROR");
    PRINT_ERR("  VM exit instruction error: 0x%llx\n", value);
    // NOTE(review): only error numbers 1..21 are decoded here, while
    // print_vmlaunch_error_info decodes 1..25 from the same table -- confirm which bound
    // matches the size of vmx_instruction_error_to_str
    if (value > 0 && value < 22)
        PRINT_ERR("    decoded: %s\n", vmx_instruction_error_to_str[value]);

    return 0;
}

// =================================================================================================
// Allocate the host-side VMX data structures: the VMXON region, the VMCS storage,
// and the table of VMCS physical addresses (one uint64_t per possible actor).
//
// Returns the value of `err`, which this function itself never changes from 0.
// NOTE(review): the CHECKED_* and ASSERT macros presumably bail out of the function
// on failure -- confirm against their definitions.
int init_vmx(void)
{
    int err = 0;

    // check that the hw-specific region sizes match our constants.
    // IA32_VMX_BASIC reports the VMXON/VMCS region size in bits 44:32, which is a 13-bit
    // field: a size of exactly 4096 is encoded with bit 44 set and bits 43:32 clear, so
    // a 12-bit mask would read it as 0 and make the check below pass vacuously
    size_t vmxon_size = (rdmsr64(MSR_IA32_VMX_BASIC) >> 32) & 0x1FFF;
    ASSERT(vmxon_size <= VMXON_SIZE, "init_vmx");

    // VMX host data structures
    vmxon_page_hva = CHECKED_ZALLOC(VMXON_SIZE);
    vmxon_page_hpa = virt_to_phys(vmxon_page_hva);
    ASSERT((vmxon_page_hpa & 0xFFF) == 0, "init_vmx"); // VMXON region must be 4KB-aligned

    // VMCS
    vmcss = CHECKED_VMALLOC(VMCS_SIZE);
    vmcs_hpas = CHECKED_ZALLOC(sizeof(uint64_t) * MAX_ACTORS);

    return err;
}

// Release the three buffers assigned in init_vmx: the VMXON page, the VMCS storage,
// and the table of VMCS physical addresses.
void free_vmx(void)
{
    SAFE_FREE(vmxon_page_hva);
    // vmcss is obtained through CHECKED_VMALLOC in init_vmx, hence the VFREE variant
    SAFE_VFREE(vmcss);
    SAFE_FREE(vmcs_hpas);
}

// NOLINTEND(readability-function-cognitive-complexity)
// NOLINTEND(readability-function-size)


================================================
FILE: rvzr/factory.py
================================================
"""
File: Configuration factory; constructs objects based on the configuration options.

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from __future__ import annotations
from typing import Dict, Type, List, TYPE_CHECKING, Any, Optional, Union

from . import data_generator, analyser, executor, fuzzer, model, elf_parser
from .model_unicorn import tracer, speculator_abc, speculators_basic, \
    speculators_fault, speculators_vs, interpreter, model as uc_model
from .model_dynamorio import model as dr_model
from .postprocessing.minimizer import Minimizer

from .arch.x86 import asm_parser as x86_asm_parser, \
    executor as x86_executor, fuzzer as x86_fuzzer, generator as x86_generator, \
    target_desc as x86_target_desc, get_spec as x86_get_spec
from .arch.arm64 import asm_parser as arm64_asm_parser, \
    executor as arm64_executor, fuzzer as arm64_fuzzer, generator as arm64_generator, \
    target_desc as arm64_target_desc, get_spec as arm64_get_spec
from .config import CONF, ConfigException

if TYPE_CHECKING:
    from .isa_spec import InstructionSet
    from .target_desc import TargetDesc
    from .code_generator import CodeGenerator
    from .asm_parser import AsmParser
    from .sandbox import BaseAddrTuple


class FactoryException(SystemExit):
    """
    Error raised by the factory functions when a configuration option holds a value
    that has no matching entry in the corresponding lookup table.
    """

    def __init__(self, options: Dict[str, Type[Any]], key: str, conf_option_name: str) -> None:
        # the exit message names the offending value and lists every key of the lookup table
        headline = f"ERROR: unknown value `{key}` of `{conf_option_name}` configuration option.\n"
        listing = "  Available options are:\n  - " + "\n  - ".join(options)
        super().__init__(headline + listing)


# ==================================================================================================
# Common enumerations
# ==================================================================================================
# Target description classes, keyed by the value of the `instruction_set` configuration option;
# the factory functions in this file instantiate the selected class without arguments
_TARGET_DESC: Dict[str, Type[TargetDesc]] = {
    "x86-64": x86_target_desc.X86TargetDesc,
    "arm64": arm64_target_desc.ARM64TargetDesc,
}


# ==================================================================================================
# Fuzzer Construction
# ==================================================================================================
def get_fuzzer(instruction_set_path: str, working_directory: str, existing_test_case: str,
               input_paths: Optional[List[str]]) -> fuzzer.Fuzzer:
    """
    Build the fuzzer selected by the `fuzzer` and `instruction_set` options of CONF.

    All four arguments are forwarded unchanged to the constructor of the selected class.

    :raises ConfigException: if `fuzzer` is unknown, or if `fuzzer` is known but
        `instruction_set` is not (the `fuzzer` option is checked first)
    """
    # fuzzer flavour -> instruction set -> concrete fuzzer class
    fuzzer_classes: Dict[str, Dict[str, Type[fuzzer.Fuzzer]]] = {
        "architectural": {
            "x86-64": x86_fuzzer.X86ArchitecturalFuzzer,
            "arm64": arm64_fuzzer.ARM64ArchitecturalFuzzer,
        },
        "archdiff": {
            "x86-64": x86_fuzzer.X86ArchDiffFuzzer,
            "arm64": arm64_fuzzer.ARM64ArchDiffFuzzer,
        },
        "basic": {
            "x86-64": x86_fuzzer.X86Fuzzer,
            "arm64": arm64_fuzzer.ARM64Fuzzer,
        },
    }

    classes_per_isa = fuzzer_classes.get(CONF.fuzzer)
    if classes_per_isa is None:
        raise ConfigException("ERROR: unknown value of `fuzzer` configuration option")

    fuzzer_cls = classes_per_isa.get(CONF.instruction_set)
    if fuzzer_cls is None:
        raise ConfigException("ERROR: unknown value of `instruction_set` configuration option")

    return fuzzer_cls(instruction_set_path, working_directory, existing_test_case, input_paths)


# ==================================================================================================
# Executor Construction
# ==================================================================================================
# Executor classes, keyed by the value of the `executor` configuration option
_EXECUTORS = {
    'x86-64-intel': x86_executor.X86IntelExecutor,
    'x86-64-amd': x86_executor.X86AMDExecutor,
    'arm64': arm64_executor.ARM64Executor,
}


def get_executor(enable_mismatch_check_mode: bool = False) -> executor.Executor:
    """
    Build the executor selected by the `executor` option of CONF.

    :param enable_mismatch_check_mode: forwarded to the executor constructor
    :raises FactoryException: if the option value has no entry in `_EXECUTORS`
    """
    requested: str = CONF.executor
    executor_cls = _EXECUTORS.get(requested)
    if executor_cls is None:
        raise FactoryException(_EXECUTORS, requested, "executor")
    return executor_cls(enable_mismatch_check_mode)


# ==================================================================================================
# Model Construction
# ==================================================================================================
# Unicorn tracer classes, keyed by the observation clause name
# (the value of the `contract_observation_clause` configuration option).
# `ct` and `loads+stores+pc` are two names for the same tracer.
_TRACERS: Dict[str, Type[tracer.UnicornTracer]] = {
    "none": tracer.NoneTracer,
    "l1d": tracer.L1DTracer,
    "pc": tracer.PCTracer,
    "memory": tracer.MemoryTracer,
    "ct": tracer.CTTracer,
    "loads+stores+pc": tracer.CTTracer,
    "ct-nonspecstore": tracer.CTNonSpecStoreTracer,
    "arch": tracer.ArchTracer,
    "tct": tracer.TruncatedCTTracer,
    "tcto": tracer.TruncatedCTWithOverflowsTracer,
    "ct-ni": tracer.ActorNITracer,
}

# Unicorn speculator classes shared by the x86 and ARM64 tables below, keyed by the
# execution clause name. `seq` and `no_speculation` are two names for the same speculator.
# NOTE(review): `cond-bpas` maps to an X86-named class, yet it is also inherited by the
# ARM64 table -- confirm that this is intended.
_SPECULATORS_GENERIC: Dict[str, Type[speculator_abc.UnicornSpeculator]] = {
    "seq": speculators_basic.SeqSpeculator,
    "no_speculation": speculators_basic.SeqSpeculator,
    "bpas": speculators_basic.StoreBpasSpeculator,
    "cond-bpas": speculators_basic.X86CondBpasSpeculator,
    "seq-assist": speculators_fault.SequentialAssistSpeculator,
}

# Execution clause name -> speculator class for the x86 Unicorn model:
# the generic entries plus the x86-specific ones.
# `cond` and `conditional_br_misprediction` are two names for the same speculator.
_SPECULATORS_X86: Dict[str, Type[speculator_abc.UnicornSpeculator]] = {
    **_SPECULATORS_GENERIC,
    "cond": speculators_basic.X86CondSpeculator,
    "conditional_br_misprediction": speculators_basic.X86CondSpeculator,
    "delayed-exception-handling": speculators_fault.X86UnicornDEH,
    "nullinj-fault": speculators_fault.X86UnicornNull,
    "nullinj-assist": speculators_fault.X86UnicornNullAssist,
    "meltdown": speculators_fault.X86Meltdown,
    "noncanonical": speculators_fault.X86NonCanonicalAddress,
    "vspec-ops-div": speculators_vs.VspecDIVSpeculator,
    "vspec-ops-memory-faults": speculators_vs.VspecMemoryFaultsSpeculator,
    "vspec-ops-memory-assists": speculators_vs.VspecMemoryAssistsSpeculator,
    "vspec-ops-gp": speculators_vs.VspecGPSpeculator,
    "vspec-all-div": speculators_vs.VspecAllDIVSpeculator,
    "vspec-all-memory-faults": speculators_vs.VspecAllMemoryFaultsSpeculator,
    "vspec-all-memory-assists": speculators_vs.VspecAllMemoryAssistsSpeculator,
}

# Execution clause name -> speculator class for the ARM64 Unicorn model:
# the generic entries plus the ARM64-specific ones.
# `cond` and `conditional_br_misprediction` are two names for the same speculator.
_SPECULATORS_ARM64: Dict[str, Type[speculator_abc.UnicornSpeculator]] = {
    **_SPECULATORS_GENERIC,
    "cond": speculators_basic.ARM64CondSpeculator,
    "conditional_br_misprediction": speculators_basic.ARM64CondSpeculator,
    "delayed-exception-handling": speculators_fault.ARMUnicornDEH,
}


def _get_exec_clause_name() -> str:
    """
    Collapse the `contract_execution_clause` option of CONF into a single clause name.

    Two combinations are recognised and checked in this order: `cond` together with `bpas`,
    then `conditional_br_misprediction` together with `nullinj-fault`. Otherwise the option
    must hold exactly one entry, which is returned as is.

    :raises ConfigException: if none of the above applies
    """
    clauses = CONF.contract_execution_clause

    if "cond" in clauses and "bpas" in clauses:
        return "cond-bpas"
    if "conditional_br_misprediction" in clauses and "nullinj-fault" in clauses:
        return "cond-nullinj-fault"
    if len(clauses) == 1:
        return clauses[0]

    raise ConfigException(
        "ERROR: unknown value of `contract_execution_clause` configuration option")


def _get_x86_unicorn_model(bases: BaseAddrTuple, obs_clause_name: str, exec_clause_name: str,
                           enable_mismatch_check_mode: bool) -> model.Model:
    """
    Build the Unicorn-based contract model for x86-64.

    :param bases: forwarded to the model constructor
    :param obs_clause_name: key into `_TRACERS`
    :param exec_clause_name: key into `_SPECULATORS_X86`
    :param enable_mismatch_check_mode: forwarded to the model constructor
    :raises FactoryException: if either clause name has no entry in its table
    """
    # Report unsupported clauses as a configuration error that lists the valid options,
    # rather than letting the table lookups below fail with a bare KeyError
    # (e.g., `_get_exec_clause_name` can produce a combined name that has no speculator)
    if obs_clause_name not in _TRACERS:
        raise FactoryException(_TRACERS, obs_clause_name, "contract_observation_clause")
    if exec_clause_name not in _SPECULATORS_X86:
        raise FactoryException(_SPECULATORS_X86, exec_clause_name, "contract_execution_clause")

    target_desc = _TARGET_DESC[CONF.instruction_set]()
    tracer_cls = _TRACERS[obs_clause_name]
    speculator_cls = _SPECULATORS_X86[exec_clause_name]
    interpreter_cls = interpreter.X86ExtraInterpreter
    model_ = uc_model.X86UnicornModel(bases, target_desc, speculator_cls, tracer_cls,
                                      interpreter_cls, enable_mismatch_check_mode)
    return model_


def _get_arm64_unicorn_model(bases: BaseAddrTuple, obs_clause_name: str, exec_clause_name: str,
                             enable_mismatch_check_mode: bool) -> model.Model:
    """
    Build the Unicorn-based contract model for ARM64.

    :param bases: forwarded to the model constructor
    :param obs_clause_name: key into `_TRACERS`
    :param exec_clause_name: key into `_SPECULATORS_ARM64`
    :param enable_mismatch_check_mode: forwarded to the model constructor
    :raises FactoryException: if either clause name has no entry in its table
    """
    # Report unsupported clauses as a configuration error that lists the valid options,
    # rather than letting the table lookups below fail with a bare KeyError
    # (e.g., clauses that exist only in the x86 speculator table)
    if obs_clause_name not in _TRACERS:
        raise FactoryException(_TRACERS, obs_clause_name, "contract_observation_clause")
    if exec_clause_name not in _SPECULATORS_ARM64:
        raise FactoryException(_SPECULATORS_ARM64, exec_clause_name, "contract_execution_clause")

    target_desc = _TARGET_DESC[CONF.instruction_set]()
    tracer_cls = _TRACERS[obs_clause_name]
    speculator_cls = _SPECULATORS_ARM64[exec_clause_name]
    interpreter_cls = interpreter.ARMExtraInterpreter
    model_ = uc_model.ARM64UnicornModel(bases, target_desc, speculator_cls, tracer_cls,
                                        interpreter_cls, enable_mismatch_check_mode)
    return model_


def _get_dr_model(bases: BaseAddrTuple, obs_clause_name: str, exec_clause_name: str,
                  enable_mismatch_check_mode: bool) -> model.Model:
    """
    Build the DynamoRIO-based contract model and configure it with the given clauses.

    :raises ConfigException: if the backend does not list the observation clause or
        the execution clause as supported (the observation clause is checked first)
    """
    # The DR backend is not implemented in python, so the supported contracts
    # have to be queried through its API
    supported_obs = dr_model.DynamoRIOModel.get_supported_obs_clauses()
    supported_exec = dr_model.DynamoRIOModel.get_supported_exec_clauses()
    options_header = "  Available options are:\n  - "

    if obs_clause_name not in supported_obs:
        listing = options_header + "\n  - ".join(supported_obs)
        raise ConfigException(
            f"ERROR: unsupported observation clause `{obs_clause_name}`.\n" + listing)

    if exec_clause_name not in supported_exec:
        listing = options_header + "\n  - ".join(supported_exec)
        raise ConfigException(
            f"ERROR: unsupported execution clause `{exec_clause_name}`.\n" + listing)

    dr_instance = dr_model.DynamoRIOModel(
        bases, enable_mismatch_check_mode=enable_mismatch_check_mode)
    dr_instance.configure_clauses(obs_clause_name, exec_clause_name)
    return dr_instance


def get_model(bases: BaseAddrTuple, enable_mismatch_check_mode: bool = False) -> model.Model:
    """
    Build the contract model selected by the `instruction_set`, `model_backend` and
    contract clause options of CONF.

    :param bases: forwarded to the selected model
    :param enable_mismatch_check_mode: forwarded to the selected model
    :raises ConfigException: on an unknown instruction set, an unknown backend,
        or the DynamoRIO backend combined with ARM64
    """
    obs_clause_name = CONF.contract_observation_clause
    exec_clause_name = _get_exec_clause_name()

    # the instruction set is validated before the backend
    isa = CONF.instruction_set
    if isa not in ("x86-64", "arm64"):
        raise ConfigException("ERROR: unknown value of `instruction_set` configuration option")

    backend = CONF.model_backend
    if backend == "unicorn":
        build_unicorn = _get_x86_unicorn_model if isa == "x86-64" else _get_arm64_unicorn_model
        return build_unicorn(bases, obs_clause_name, exec_clause_name,
                             enable_mismatch_check_mode)

    if backend == "dynamorio":
        if isa == "arm64":
            raise ConfigException("ERROR: DynamoRIO backend is not supported for ARM64")
        return _get_dr_model(bases, obs_clause_name, exec_clause_name,
                             enable_mismatch_check_mode)

    if backend == "dummy":
        return model.DummyModel(bases, enable_mismatch_check_mode)

    raise ConfigException("ERROR: unknown value of `model_backend` configuration option")


# ==================================================================================================
# Program Generator Construction and Related Classes
# ==================================================================================================
# Code generator classes, keyed by the value of the `instruction_set` configuration option
_GENERATORS: Dict[str, Type[CodeGenerator]] = {
    "x86-64": x86_generator.X86Generator,
    "arm64": arm64_generator.ARM64Generator,
}

# Assembly parser classes, keyed by the value of the `instruction_set` configuration option
_ASM_PARSERS: Dict[str, Type[AsmParser]] = {
    'x86-64': x86_asm_parser.X86AsmParser,
    'arm64': arm64_asm_parser.ARM64AsmParser,
}

# ELF parser classes, keyed by the value of the `instruction_set` configuration option;
# both instruction sets currently map to the same parser class
_ELF_PARSERS: Dict[str, Type[elf_parser.ELFParser]] = {
    'x86-64': elf_parser.ELFParser,
    'arm64': elf_parser.ELFParser,
}


def get_program_generator(seed: int, instruction_set: InstructionSet) -> CodeGenerator:
    """
    Build the code generator for the instruction set named by CONF.instruction_set,
    together with the target description, ELF parser and assembly parser it is given.

    :param seed: forwarded to the generator constructor
    :param instruction_set: forwarded to the assembly parser and the generator
    """
    isa: str = CONF.instruction_set

    # a single target description instance is shared by the parsers and the generator
    shared_target_desc = _TARGET_DESC[isa]()
    elf_reader = _ELF_PARSERS[isa](shared_target_desc)
    asm_reader = _ASM_PARSERS[isa](instruction_set, shared_target_desc)

    return _GENERATORS[isa](seed, instruction_set, shared_target_desc, asm_reader, elf_reader)


def get_asm_parser(instruction_set: InstructionSet) -> AsmParser:
    """
    Build the assembly parser for the instruction set named by CONF.instruction_set.

    :param instruction_set: forwarded to the parser constructor
    """
    isa: str = CONF.instruction_set
    fresh_target_desc = _TARGET_DESC[isa]()
    return _ASM_PARSERS[isa](instruction_set, fresh_target_desc)


def get_elf_parser() -> elf_parser.ELFParser:
    """ Build the ELF parser for the instruction set named by CONF.instruction_set. """
    isa: str = CONF.instruction_set
    fresh_target_desc = _TARGET_DESC[isa]()
    return _ELF_PARSERS[isa](fresh_target_desc)


# ==================================================================================================
# Input Data Generator Construction
# ==================================================================================================
# Input data generator classes, keyed by the value of the `data_generator` configuration option
_DATA_GENERATORS: Dict[str, Type[data_generator.DataGenerator]] = {
    'random': data_generator.DataGenerator,
}


def get_data_generator(seed: int) -> data_generator.DataGenerator:
    """
    Build the input data generator selected by the `data_generator` option of CONF.

    :param seed: forwarded to the generator constructor
    :raises FactoryException: if the option value has no entry in `_DATA_GENERATORS`
    """
    requested: str = CONF.data_generator
    generator_cls = _DATA_GENERATORS.get(requested)
    if generator_cls is None:
        raise FactoryException(_DATA_GENERATORS, requested, "data_generator")
    return generator_cls(seed)


# ==================================================================================================
# Analyser Construction
# ==================================================================================================
# Analyser classes, keyed by the value of the `analyser` configuration option
_ANALYZERS: Dict[str, Type[analyser.Analyser]] = {
    'bitmaps': analyser.MergedBitmapAnalyser,
    'sets': analyser.SetAnalyser,
    'mwu': analyser.MWUAnalyser,
    'chi2': analyser.ChiSquaredAnalyser,
}


def get_analyser() -> analyser.Analyser:
    """
    Build the analyser selected by the `analyser` option of CONF.

    :raises FactoryException: if the option value has no entry in `_ANALYZERS`
    """
    requested: str = CONF.analyser
    analyser_cls = _ANALYZERS.get(requested)
    if analyser_cls is None:
        raise FactoryException(_ANALYZERS, requested, "analyser")
    return analyser_cls()


# ==================================================================================================
# Minimizer Construction
# ==================================================================================================
# Minimizer classes, keyed by minimizer name; `get_minimizer` currently always selects `violation`
_MINIMIZERS: Dict[str, Type[Minimizer]] = {
    'violation': Minimizer,
}


def get_minimizer(fuzzer_: fuzzer.Fuzzer, instruction_set: InstructionSet) -> Minimizer:
    """
    Build a minimizer; both arguments are forwarded to its constructor.

    The minimizer kind is not configurable yet, so the lookup key is fixed.

    :raises FactoryException: if the fixed key has no entry in `_MINIMIZERS`
    """
    requested: str = "violation"  # expansion point for future; currently hardcoded
    minimizer_cls = _MINIMIZERS.get(requested)
    if minimizer_cls is None:
        raise FactoryException(_MINIMIZERS, requested, "minimizer")
    return minimizer_cls(fuzzer_, instruction_set)


# ==================================================================================================
# Spec Downloader Construction
# ==================================================================================================
# Common type alias covering the per-architecture ISA spec downloader classes
Downloader = Union[x86_get_spec.Downloader, arm64_get_spec.Downloader]

# ISA spec downloader classes, keyed by the architecture name passed to `get_downloader`
_SPEC_DOWNLOADERS: Dict[str, Type[Downloader]] = {
    'x86-64': x86_get_spec.Downloader,
    'arm64': arm64_get_spec.Downloader,
}


def get_downloader(arch: str, extensions: List[str], out_file: str) -> Downloader:
    """
    Build the ISA spec downloader for the given architecture.

    :param arch: key into `_SPEC_DOWNLOADERS`
    :param extensions: forwarded to the downloader constructor
    :param out_file: forwarded to the downloader constructor
    :raises FactoryException: if `arch` has no entry in `_SPEC_DOWNLOADERS`
    """
    downloader_cls = _SPEC_DOWNLOADERS.get(arch)
    if downloader_cls is None:
        raise FactoryException(_SPEC_DOWNLOADERS, arch, "downloader")
    return downloader_cls(extensions, out_file)


================================================
FILE: rvzr/fuzzer.py
================================================
"""
File: Fuzzing Orchestration

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
# pylint: disable=too-many-instance-attributes

from __future__ import annotations

import shutil
import os
import tempfile
from pathlib import Path
from datetime import datetime
from typing import TYPE_CHECKING, Optional, List, Callable, Literal, Final
from typing_extensions import assert_never
import numpy as np

from . import factory

from .traces import HTrace, CTrace, Violation, RawHTraceSample, ArrayOfSamples, CTraceEntry, \
    TraceBundle
from .tc_components.actor import ActorMode
from .tc_components.test_case_code import TestCaseProgram
from .tc_components.test_case_data import InputData
from .isa_spec import InstructionSet
from .analyser import Analyser
from .config import CONF
from .stats import FuzzingStats
from .logs import FuzzLogger, warning, update_logging_after_config_change

if TYPE_CHECKING:
    from .code_generator import CodeGenerator
    from .data_generator import DataGenerator
    from .asm_parser import AsmParser
    from .elf_parser import ELFParser
    from .model import Model
    from .executor import Executor

# Closed set of names accepted wherever a `FuzzingMode` is expected
FuzzingMode = Literal["random", "template", "asm"]
# Names of the round stages dispatched by `_RoundManager.execute_stage`
RoundStage = Literal["fast", "nesting", "taint_mistake", "priming", "noise", "arch_mismatch",
                     "priming_large"]

# Module-level statistics object
STAT = FuzzingStats()


# ==================================================================================================
# Private: Round Manager
# ==================================================================================================
class _RoundState:
    """
    Mutable per-round settings of the Revizor modules taking part in a fuzzing round.
    The values start from the global configuration and are adjusted as the round
    moves from stage to stage.
    """
    executor_n_reps: int
    """ How many repetitions the executor is asked to perform """

    _start_nesting: int
    max_nesting: int
    model_nesting: int
    """ Nesting level passed to the model when tracing """

    enable_fast_contract_tracing: bool
    """ If set, the contract traces of the original inputs are reused for their boosted copies """

    enable_priming: bool
    """ If set, the priming stages of the round are executed """

    record_stats: bool = True
    """ If set, the analyser is asked to record statistics """

    update_ignore_list: bool = False
    """ If set, non-violating inputs are added to the ignore list of the executor """

    reuse_boosts: bool = False
    """ If set, boosted inputs produced by the previous stage of the round can be reused """

    reuse_ctraces: bool = False
    """ If set, contract traces produced by the previous stage of the round are reused """

    extend_htraces: bool = False
    """ If set, newly collected htraces are merged into
    the existing ones rather than replacing them """

    is_initial: bool = True
    """ True until the first (fast) stage of the round has been executed """

    def __init__(self, is_speculative: bool) -> None:
        self.executor_n_reps = CONF.executor_sample_sizes[0]

        # non-speculative models always use a nesting of 1;
        # speculative ones take the bounds from the configuration
        if is_speculative:
            self._start_nesting = CONF.model_min_nesting
            self.max_nesting = CONF.model_max_nesting
        else:
            self._start_nesting = 1
            self.max_nesting = 1
        assert self._start_nesting <= self.max_nesting
        self.model_nesting = self._start_nesting

        self.enable_priming = CONF.enable_priming
        self.enable_fast_contract_tracing = CONF.enable_fast_path_model


class _RoundManager:
    """
    A helper class responsible for maintaining a consistent configuration throughout
    a fuzzing round, as well as for dispatching the test case to the model and executor.
    """
    test_case: TestCaseProgram
    org_inputs: List[InputData]
    boosted_inputs: List[InputData]

    htraces: List[HTrace]
    _reference_htraces: List[HTrace]

    ctraces: List[CTrace]
    _non_boosted_ctraces: List[CTrace]

    violations: List[Violation]
    arch_violations: List[Violation]

    fuzzer: Final[Fuzzer]
    conf: Final[_RoundState]

    def __init__(self, fuzzer: Fuzzer, test_case: TestCaseProgram, inputs: List[InputData]) -> None:
        """
        Set up the state of a fuzzing round and load the test case into the model
        and the executor of the given fuzzer.

        :param fuzzer: fuzzer that owns the model, executor, analyser and logger used in the round
        :param test_case: test case to be loaded and traced
        :param inputs: original (non-boosted) inputs of the round
        """
        self.test_case = test_case
        self.org_inputs = inputs
        self.boosted_inputs = []

        self.htraces = []
        self.ctraces = []
        self.violations = []
        self.arch_violations = []

        # These two are normally assigned by the stages; start them empty so that methods
        # reading them (e.g., `finalize`) do not fail with AttributeError when the stage
        # that assigns them has not been executed
        self._reference_htraces = []
        self._non_boosted_ctraces = []

        self.fuzzer = fuzzer
        self.conf = _RoundState(fuzzer.model.is_speculative)

        self.fuzzer.model.load_test_case(self.test_case)
        self.fuzzer.executor.load_test_case(self.test_case)

    def execute_stage(self, stage: RoundStage) -> None:
        """
        Execute one stage of the fuzzing round and update the round state accordingly.

        :param stage: name of the stage to run; a name that matches none of the
            branches below is silently ignored
        """
        # pylint: disable=too-many-branches
        # NOTE: This is a selector function, so the large number of branches is justified
        state = self.conf

        if stage == "fast":
            assert state.is_initial, "Fast path can be run only in the first round"
            self._normal_stage()
            state.is_initial = False  # the fast path must not be executed again
            state.record_stats = False  # stats are recorded only in the fast path
            self._reference_htraces = self.htraces  # fast path traces serve as a reference

        elif stage == "nesting":
            # re-run only if the model has not been tracing at the maximum nesting already
            if state.model_nesting != state.max_nesting:
                state.model_nesting = state.max_nesting
                self._normal_stage()

            # from now on the list of boosted inputs is stable: it can be reused, and
            # the executor can start ignoring non-violating inputs
            state.reuse_boosts = True
            state.update_ignore_list = True

        elif stage == "taint_mistake":
            # re-run only if the traces so far were produced by fast contract tracing
            if state.enable_fast_contract_tracing:
                state.enable_fast_contract_tracing = False
                self._normal_stage()

            # once both `nesting` and `taint_mistake` are done, the contract traces
            # are trusted and can be reused
            assert state.model_nesting == state.max_nesting, "Invalid stage order"
            state.reuse_ctraces = True

        elif stage == "priming":
            if state.enable_priming:
                self._priming_check()

        elif stage == "noise":
            if len(CONF.executor_sample_sizes) != 1:
                state.extend_htraces = True

                # grow the sample step by step; stop as soon as the violations disappear
                for sample_size in CONF.executor_sample_sizes[1:]:
                    self.fuzzer.log.sample_size_increase(sample_size)
                    # collect only the samples missing to reach the new size
                    state.executor_n_reps = sample_size - len(self.htraces[0])
                    self._normal_stage()
                    if not self.violations:
                        break

        elif stage == "priming_large":
            if state.enable_priming and len(CONF.executor_sample_sizes) != 1:
                state.executor_n_reps = CONF.executor_sample_sizes[-1]
                self._priming_check()

        elif stage == "arch_mismatch":
            self._check_for_architectural_mismatch()

    def finalize(self) -> None:
        """ Finalize the fuzzing round """
        self.fuzzer.log.dbg_dump_traces(self.boosted_inputs, self.htraces, self._reference_htraces,
                                        self.ctraces)

    def _normal_stage(self) -> None:
        """ Run a single stage of the fuzzing round """
        self._boost_inputs()
        self._collect_ctraces()
        try:
            self._collect_htraces()
        except IOError:
            self.violations = []
            return
        if len(self.org_inputs) > 0:
            self._check_violations()
            if not self.violations:
                return
            self._update_ignore_list()

    def _boost_inputs(self) -> None:
        """
        Trace the test case on the model with the original inputs and derive the boosted
        inputs from the collected taints. The contract traces of the original inputs are
        stored in `_non_boosted_ctraces`.
        """
        contract_model = self.fuzzer.model
        nesting = self.conf.model_nesting

        # with a single input per class there is nothing to boost,
        # so the taint tracking is skipped and the original inputs are used as is
        if CONF.inputs_per_class == 1:
            self._non_boosted_ctraces = contract_model.trace_test_case(self.org_inputs, nesting)
            self.boosted_inputs = self.org_inputs
            return

        # normal case: trace with taints and generate the boosted inputs from them
        org_ctraces, taints = contract_model.trace_test_case_with_taints(self.org_inputs, nesting)
        self._non_boosted_ctraces = org_ctraces
        self.boosted_inputs = self.fuzzer.data_gen.generate_boosted(
            self.org_inputs, taints, CONF.inputs_per_class)

    def _collect_ctraces(self) -> None:
        """ Collect contract traces for the boosted inputs """
        # contract traces are already collected
        if self.conf.reuse_ctraces:
            assert len(self.ctraces) == len(self.boosted_inputs), "No ctraces to reuse"
            return

        # records same ctrace for all members of the same input class
        if self.conf.enable_fast_contract_tracing:
            self.ctraces = self._non_boosted_ctraces * CONF.inputs_per_class
            return

        # compute ctraces separately for every boosted input
        self.ctraces = \
            self.fuzzer.model.trace_test_case(self.boosted_inputs, self.conf.model_nesting)

    def _collect_htraces(self) -> None:
        """ Collect hardware traces for the boosted inputs """
        new_htraces = self.fuzzer.executor.trace_test_case(self.boosted_inputs,
                                                           self.conf.executor_n_reps)
        if not self.conf.extend_htraces:
            self.htraces = new_htraces
            return

        # Merge new htraces with the existing ones
        assert len(self.htraces) == len(new_htraces), "Number of htraces does not match"
        for i, htrace in enumerate(new_htraces):
            self.htraces[i] = htrace.merge(self.htraces[i])

    def _check_violations(self) -> None:
        """ Check the collected traces for contract violations """
        assert self.ctraces and len(self.ctraces) == len(self.htraces), \
            f"Invalid number of c- or htraces: {len(self.ctraces)} vs {len(self.htraces)}"
        self.violations = self.fuzzer.analyser.filter_violations(
            ctraces=self.ctraces,
            htraces=self.htraces,
            test_case_code=self.test_case,
            inputs=self.boosted_inputs,
            stats_=self.conf.record_stats)

    def _update_ignore_list(self) -> None:
        """
        Label all non-violating inputs as ignored by executor, so that we don't trigger
        a chain reaction of false positives when the measurement results are non-deterministic
        """
        if self.conf.update_ignore_list:
            violating_ids = [m.input_id for v in self.violations for m in v.measurements]
            ignored_input_ids = [
                i for i in range(len(self.boosted_inputs)) if i not in violating_ids
            ]
            self.fuzzer.executor.extend_ignore_list(ignored_input_ids)

    def _priming_check(self) -> None:
        """
        Run the priming check on one of the detected violations.

        Purpose: tell apart violations caused by the input data itself from those caused by
        the microarchitectural state left behind by the preceding inputs (cross-talk).

        Procedure: a single violation is popped from `self.violations`, and one representative
        measurement is taken from each of its hardware classes. For every ordered pair of
        representatives (target, donor), the donor input is copied into the target's position
        in the boosted input sequence, the modified sequence is executed again, and the trace
        observed at the target's position is compared with the target's original trace.

        Example: for a sequence (i1, i2, i1', i2') where i2 and i2' violate the contract,
        the check executes (i1, i2', i1', i2') and (i1, i2, i1', i2).

        Outcome:
        * if every swapped-in input reproduces the original trace of the position it was
          placed in, the traces do not depend on the input data; the violation is treated as
          a false positive and `self.violations` is emptied;
        * as soon as one swapped-in input yields a non-equivalent trace, the violation is
          considered genuine and becomes the only entry of `self.violations`;
        * if a re-measured trace is empty, corrupted or ignored, the check is abandoned and
          `self.violations` is emptied.

        Only one violation is examined per call; any other pending violations are dropped.
        """
        # every path below returns after examining a single violation
        if not self.violations:
            return

        fuzzer = self.fuzzer
        fuzzer.log.priming(len(self.violations))

        candidate: Violation = self.violations.pop()
        sample_size = candidate.measurements[0].htrace.sample_size()
        representatives = [hw_class[0] for hw_class in candidate.get_hw_classes()]

        for target in representatives:
            target_id = target.input_id
            expected_htrace = target.htrace

            # IDs of the representatives that belong to the other hardware classes
            donor_ids: List[int] = [m.input_id for m in representatives if m != target]

            for donor_id in donor_ids:
                fuzzer.log.dbg_priming_progress(donor_id, target_id)

                # build a sequence where the donor input takes over the target's position
                primer = list(self.boosted_inputs)
                primer[target_id] = self.boosted_inputs[donor_id]

                # re-measure the modified sequence and pick the trace at the target's position
                remeasured: List[HTrace] = fuzzer.executor.trace_test_case(primer, sample_size)
                swapped_htrace = remeasured[target_id]

                # tracing error: give up on this test case
                if swapped_htrace.is_empty() or swapped_htrace.is_corrupted_or_ignored():
                    warning("fuzzer", "Tracing error during priming. "
                            "Skipping this test case")
                    self.violations = []
                    return

                if not fuzzer.analyser.htraces_are_equivalent(swapped_htrace, expected_htrace):
                    # the donor input changed the trace, so the violation is genuine
                    fuzzer.log.dbg_priming_fail(donor_id, target_id, expected_htrace,
                                                swapped_htrace)
                    self.violations = [candidate]
                    return

        # every swap reproduced the original trace, so it's a false positive
        self.violations = []

    def _check_for_architectural_mismatch(self) -> None:
        """
        Compare the architectural results of the model and of the executor for the current
        test case, e.g., to catch cases where the emulator executes an instruction incorrectly.

        The test case is run on the architectural executor (one repetition) and on the
        architectural model. For every input, the single raw hardware reading is compared with
        the first six values of the untyped contract trace, taken modulo 2**64. The first
        mismatching input is stored as the only entry of `self.arch_violations`; when all
        inputs match, `self.arch_violations` is left untouched. A tracing IOError empties
        `self.arch_violations` and skips the test case.
        """
        arch_model = self.fuzzer.arch_model
        arch_model.load_test_case(self.test_case)
        arch_executor = self.fuzzer.arch_executor
        arch_executor.load_test_case(self.test_case)

        # When invoked stand-alone (see ArchitecturalFuzzer), boosting has not happened yet,
        # so fall back to the original inputs
        if not self.boosted_inputs:
            self.boosted_inputs = self.org_inputs

        # Hardware side
        try:
            htraces = arch_executor.trace_test_case(self.boosted_inputs, n_reps=1)
        except IOError:
            warning("fuzz", "Error during architectural mismatch check. Skipping this test case")
            self.arch_violations = []  # skip test case in case of a tracing error
            return

        hardware_regs: List[List[int]] = []
        for htrace_obj in htraces:
            readings = htrace_obj.get_raw_readings()
            assert len(readings) == 1, "Expected only one hardware trace"
            hardware_regs.append([int(v) for v in readings[0]])

        # Model side
        ctraces = arch_model.trace_test_case(self.boosted_inputs, CONF.model_max_nesting)
        model_regs: List[List[int]] = [
            [v % (2**64) for v in ctrace.get_untyped()[:6]] for ctrace in ctraces
        ]

        # Debug outputs
        self.fuzzer.log.dbg_dump_architectural_traces(hardware_regs, model_regs)

        # A plain equality test is sufficient here, hence the analyser is not involved
        for i, input_ in enumerate(self.boosted_inputs):
            if model_regs[i] != hardware_regs[i]:
                bundle = TraceBundle(i, input_, ctraces[i], htraces[i])
                mismatch = Violation([bundle], self.boosted_inputs, self.test_case)
                mismatch.set_trivial_hw_classes()
                self.arch_violations = [mismatch]
                return


# ==================================================================================================
# Public: Fuzzer
# ==================================================================================================
class Fuzzer:
    """
    The main class that orchestrates the fuzzing process. It creates all necessary modules
    and takes care of invoking them in the right order and passing the data between them.

    The main interface to start fuzzing is the `start` method, which implements a multi-stage
    algorithm to detect contract violations. The method implements the core fuzzing loop, which
    is to generate a test case, prepare inputs, collect their traces, and check for violations.

    The class also provides a set of stand-alone interfaces for generating test cases, analyzing
    traces from files, and filtering out non-useful test cases.
    """

    model: Model
    executor: Executor
    asm_parser: AsmParser
    code_gen: CodeGenerator
    data_gen: DataGenerator
    analyser: Analyser
    elf_parser: ELFParser

    arch_executor: Executor
    arch_model: Model
    log: FuzzLogger

    _isa_spec: InstructionSet
    _existing_test_case: str
    _work_dir: str
    _input_paths: List[str]
    _generation_function: Callable[[str], TestCaseProgram]

    def __init__(self,
                 instruction_set_spec: str,
                 work_dir: str,
                 existing_test_case: str = "",
                 input_paths: Optional[List[str]] = None):
        """
        Create the fuzzer and instantiate all of its modules.

        :param instruction_set_spec: ISA specification handed to the InstructionSet constructor
               (presumably a path to the JSON spec file -- confirm against InstructionSet)
        :param work_dir: directory where the fuzzer stores generated test cases, violation
               artifacts and bug reports
        :param existing_test_case: value passed to the generation function on every round;
               it is also given to the _adjust_config hook
        :param input_paths: paths of pre-generated inputs; when non-empty, `start` loads
               the inputs from them instead of generating new ones
        """
        # let subclasses patch the configuration before any module is built
        self._adjust_config(existing_test_case)

        self._existing_test_case = existing_test_case
        self._input_paths = input_paths if input_paths is not None else []
        self._work_dir = work_dir

        # Create all main modules
        self.log = FuzzLogger()
        self._isa_spec = InstructionSet(instruction_set_spec, CONF.instruction_categories)
        self.code_gen = factory.get_program_generator(CONF.program_generator_seed, self._isa_spec)
        self.data_gen = factory.get_data_generator(CONF.data_generator_seed)
        self.executor = factory.get_executor()
        # the model is configured with the base addresses reported by the executor
        self.model = factory.get_model(self.executor.read_base_addresses())
        self.analyser = factory.get_analyser()
        self.asm_parser = factory.get_asm_parser(self._isa_spec)
        self.elf_parser = factory.get_elf_parser()

        # A second executor/model pair, created in mismatch-check mode; it is used by
        # the architectural mismatch check and by the architectural fuzzers
        self.arch_executor = factory.get_executor(enable_mismatch_check_mode=True)
        self.arch_model = factory.get_model(
            self.arch_executor.read_base_addresses(), enable_mismatch_check_mode=True)

    # ==============================================================================================
    # Fuzzing Interface
    def start(self, num_test_cases: int, num_inputs: int, timeout: int, nonstop: bool,
              save_violations: bool, type_: FuzzingMode) -> bool:
        """
        Start the fuzzing process with the given parameters.

        Each round generates a test case, prepares its inputs, and (unless the filter rejects
        the test case) runs a fuzzing round on them. The timeout is checked at the end of every
        round, including the rounds whose test case was filtered out.

        :param num_test_cases: the number of test cases to be generated
        :param num_inputs: the number of inputs to be generated for each test case
        :param timeout: the maximum time (in seconds) to run the fuzzer; 0 disables the timeout
        :param nonstop: whether to continue the fuzzing process after the first violation
        :param save_violations: whether to store the violation artifacts
        :param type_: the type of fuzzing to be performed (random, template, asm)
        :return: True if at least one violation was detected, False otherwise
        """
        # Print header
        start_time = datetime.today()
        self.log.start(num_test_cases, start_time)

        # Find an appropriate generation function
        self._set_generation_function(type_)

        # Start the fuzzing loop
        for i in range(num_test_cases):
            self.log.start_round(i)

            # Generate a test case
            test_case: TestCaseProgram = self._generation_function(self._existing_test_case)
            STAT.test_cases += 1

            # Prepare inputs
            inputs: List[InputData]
            if self._input_paths:
                inputs = self.data_gen.load(self._input_paths)
            else:
                inputs = self.data_gen.generate(num_inputs, n_actors=test_case.n_actors())
            STAT.num_inputs += len(inputs) * CONF.inputs_per_class

            # Fuzz the test case, unless the filter marks it as not useful
            if not self._filter(test_case, inputs):
                violation = self.fuzzing_round(test_case, inputs, [])
                if violation:
                    self.log.report_violations(violation)
                    self.log.dbg_violation(violation, self.model)
                    if save_violations:
                        self._store_violation_artifact(violation, self._work_dir)
                    STAT.violations += 1
                    if not nonstop:
                        break

            # Terminate the fuzzer if the timeout has expired. The check must also run for
            # filtered test cases; otherwise a long run of filtered rounds overruns the timeout
            if timeout:
                elapsed = (datetime.today() - start_time).total_seconds()
                if elapsed > timeout:
                    self.log.timeout()
                    break

        self.log.finish()
        self.log.report_model_coverage(self.model)
        return STAT.violations > 0

    def fuzzing_round(self, test_case: TestCaseProgram, inputs: List[InputData],
                      starting_ignore_list: List[int]) -> Optional[Violation]:
        """
        Run a single fuzzing round: collect contract and hardware traces for the given test
        case and inputs, and check for contract violations.

        The function is typically used as a part of the fuzzing loop
        (invoked by .start), but can be also used stand-alone by other classes.

        The function implements a multi-stage approach to testing, with the first measurement being
        fast but with a chance of false positives, and the later stages filtering out various
        types of potential false positives. The exact number of stages depends on
        the configuration.

        The round manager is finalized on every exit path, no matter at which stage
        the round ends.

        :param test_case: the test case to be executed
        :param inputs: the inputs to be tested
        :param starting_ignore_list: a list of input IDs to be ignored by the executor
        :return: the first detected violation or None if no violations were found
        """
        # pylint: disable=too-many-return-statements

        # Initialize the round manager and load the test case
        round_manager = _RoundManager(self, test_case, inputs)

        # If a list of ignored inputs is provided, set it in the executor
        if starting_ignore_list:
            self.executor.set_ignore_list(starting_ignore_list)

        # 1. Fast path: Collect traces with minimal nesting and repetitions
        round_manager.execute_stage("fast")
        if not round_manager.violations:
            STAT.fast_path += 1
            round_manager.finalize()
            return None

        # 2. Slow path: Go through potential sources of false violations in the fast path,
        #    and check them one at a time, starting with the most likely ones
        self.log.slow_path()

        # 2.1 FP might appear because the model did not go deep enough into nested speculation.
        #     To remove such FPs, we re-run the model tracing with max nesting. As taints depend on
        #     contract traces, we also have to re-boost the inputs, and re-collect hardware traces
        #     for the new inputs
        round_manager.execute_stage("nesting")
        if not round_manager.violations:
            STAT.fp_nesting += 1
            round_manager.finalize()
            return None

        # 2.2 FP might appear because of imperfect tainting (e.g., due to a bug in taint tracker).
        #     To remove such FPs, we collect contract traces for all boosted inputs, and check if
        #     the violation is still present
        prev_ctraces = list(round_manager.ctraces)
        round_manager.execute_stage("taint_mistake")
        if not round_manager.violations:
            if round_manager.ctraces != prev_ctraces:  # this should not normally happen
                self._report_bug_tainting(round_manager)
            STAT.fp_taint_mistakes += 1
            round_manager.finalize()
            return None

        # 2.3 FP might appear because of interference between inputs. To remove such FPs, we
        #     use the priming test where we swap inputs that caused the violation with each other
        round_manager.execute_stage("priming")
        if not round_manager.violations:
            STAT.fp_priming += 1
            round_manager.finalize()
            return None

        # 2.4 FP might appear because we experienced noise. Retry the experiment with a larger
        #     sample size to reduce the impact of noise
        round_manager.execute_stage("noise")
        if not round_manager.violations:
            STAT.fp_large_sample += 1
            # finalize here as well, so that this exit behaves like all the other ones
            round_manager.finalize()
            return None

        # 2.5 Priming might have failed because the sample size was too small, causing
        #     non-deterministic results. Retry the priming test with the largest sample size
        round_manager.execute_stage("priming_large")
        if not round_manager.violations:
            STAT.fp_priming += 1
            round_manager.finalize()
            return None

        # 2.6 FP might appear because of a mismatch between the model and the executor.
        # Such cases are rare, hence we check for them last.
        # To remove such FPs, we check if the violation is caused by an architectural mismatch
        round_manager.execute_stage("arch_mismatch")
        if round_manager.arch_violations:
            self._report_bug_arch(round_manager)
            round_manager.finalize()
            return None

        # Violation survived all checks. Report it
        round_manager.finalize()
        return round_manager.violations[0]

    # ==============================================================================================
    # Single-stage Interfaces
    def standalone_filter(self, test_case: TestCaseProgram, inputs: List[InputData]) -> bool:
        """ Check if the given test case should be filtered out """
        return self._filter(test_case, inputs)

    def standalone_generate(self, program_generator_seed: int, num_test_cases: int, num_inputs: int,
                            permit_overwrite: bool) -> None:
        """
        Run a standalone test case generation and store the generated test case programs
        and their inputs in the work directory.

        Every test case gets its own subdirectory `tc<i>` that holds `program.asm` and
        the inputs `input<j>.bin`.

        :param program_generator_seed: seed for the program generator; it is also written
               into CONF.program_generator_seed
        :param num_test_cases: the number of test cases to generate
        :param num_inputs: the number of inputs to generate for each test case
        :param permit_overwrite: if False, an already existing test case directory is an error
        :raises FileExistsError: if a test case directory exists and overwriting is not permitted
        """
        self.log.start(0, datetime.today())

        # prepare for generation; fresh generators are created so that the new seed is used
        STAT.test_cases = num_test_cases
        CONF.program_generator_seed = program_generator_seed
        program_gen = factory.get_program_generator(CONF.program_generator_seed, self._isa_spec)
        data_gen = factory.get_data_generator(CONF.data_generator_seed)

        # generate test cases
        Path(self._work_dir).mkdir(exist_ok=True)
        for i in range(num_test_cases):
            test_case_dir = f"{self._work_dir}/tc{i}"
            try:
                Path(test_case_dir).mkdir(exist_ok=permit_overwrite)
            except FileExistsError as err:
                # chain explicitly so the traceback shows the original error as the cause
                raise FileExistsError(
                    f"Directory '{test_case_dir}' already exists\n"
                    "       Use --permit-overwrite to overwrite the test case") from err

            program_gen.create_test_case(f"{test_case_dir}/program.asm", True)
            inputs = data_gen.generate(num_inputs, n_actors=1)
            for j, input_ in enumerate(inputs):
                input_.save(f"{test_case_dir}/input{j}.bin")

        self.log.finish()

    def standalone_analyse(self, ctrace_file: str, htrace_file: str) -> None:
        """
        Check the contract and hardware traces in the given files for contract violations.

        Both files are read line by line, with one integer trace per line; blank lines are
        skipped. The i-th contract trace is paired with the i-th hardware trace, and the first
        violation reported by the analyser (if any) is logged.

        :param ctrace_file: path to the file with contract traces
        :param htrace_file: path to the file with hardware traces
        """
        # the dbg_violation mode is switched off for this run
        if "dbg_violation" in CONF.logging_modes:
            CONF.logging_modes.remove("dbg_violation")
            update_logging_after_config_change()

        self.log.start(0, datetime.today())
        STAT.test_cases = 1

        # read traces
        ctraces: List[CTrace] = []
        htraces: List[HTrace] = []

        with open(ctrace_file, 'r') as f:
            for line in f:
                if not line.strip():
                    continue  # tolerate blank lines, e.g., a trailing newline
                ctraces.append(CTrace([CTraceEntry("val", int(line))]))
        with open(htrace_file, 'r') as f:
            for line in f:
                if not line.strip():
                    continue  # tolerate blank lines, e.g., a trailing newline
                # Zero-initialise the sample: only the 'trace' field is assigned below, and
                # a bare np.ndarray(...) would leave any remaining fields uninitialised
                sample: ArrayOfSamples = np.zeros(1, dtype=RawHTraceSample)
                sample[0]['trace'] = int(line)
                htraces.append(HTrace(sample))

        assert len(ctraces) == len(htraces), \
            "The number of hardware traces does not match the number of contract traces"

        # the analyser also expects inputs and a test case, so provide placeholders
        dummy_inputs = factory.get_data_generator(0).generate(len(ctraces), n_actors=1)
        dummy_tc = TestCaseProgram("generated.asm", 0)

        # check for violations
        analyser = factory.get_analyser()
        violations = analyser.filter_violations(ctraces, htraces, dummy_tc, dummy_inputs, True)

        # print results
        if violations:
            self.log.report_violations(violations[0])

        self.log.finish()

    # ==============================================================================================
    # Private Methods
    def _set_generation_function(self, type_: FuzzingMode) -> None:
        """ Set the generation function based on the fuzzing mode """
        if type_ == "random":
            self._generation_function = self.code_gen.create_test_case
        elif type_ == "template":
            self._generation_function = self.code_gen.create_test_case_from_template
        elif type_ == "asm":
            self._generation_function = self._asm_parser_adapter
        else:
            assert_never(f"Unknown fuzzing mode: {type_}")

    @staticmethod
    def _create_timestamped_dir(path: str) -> str:
        timestamp = datetime.today().strftime('%y%m%d-%H%M%S')
        violation_dir = f"{path}/violation-{timestamp}"
        Path(path).mkdir(exist_ok=True)
        Path(violation_dir).mkdir()
        return violation_dir

    def _store_violation_artifact(self, violation: Violation, path: str) -> None:
        """
        Store a violation artifact into the given directory.

        A violation artifact consists of:
        - the test case that caused the violation (program.asm)
        - the inputs that caused the violation (input_*.bin)
        - the original configuration file (org-config.yaml)
        - the configuration file for reproducing violation from artifact (reproduce.yaml)
        - the configuration file for minimization (minimize.yaml)
        - the human-readable violation report (report.txt)

        Colored output is disabled while the report is written; the previous setting is
        restored afterwards, even if writing the report fails.

        :param violation: the violation to be stored
        :param path: the path to the directory where the artifact should be stored;
                    if empty, the artifact is stored in the current directory
        """
        # if the path is empty, store the artifact in the current directory
        if not path:
            path = "."

        # create a subdirectory for the violation artifact
        violation_dir = self._create_timestamped_dir(path)

        # store violation
        test_case = violation.test_case_code
        test_case.save(f"{violation_dir}/program.asm")
        for i, input_ in enumerate(violation.input_sequence):
            input_.save(f"{violation_dir}/input_{i:04}.bin")

        # store the original configuration file
        if CONF._config_path:
            shutil.copy2(CONF._config_path, f"{violation_dir}/org-config.yaml")
        else:
            with open(f"{violation_dir}/org-config.yaml", "w") as f:
                f.write("# Original violation used a default config, hence this file is empty\n")

        # create patched configs for reproducing and minimizing the violation
        shutil.copy2(f"{violation_dir}/org-config.yaml", f"{violation_dir}/reproduce.yaml")
        with open(f"{violation_dir}/reproduce.yaml", "a") as f:
            f.write("\n# Overwrite some of the configuration options to reproduce the violation\n")
            f.write(f"data_generator_seed: {violation.input_sequence[0].seed}\n")
            f.write("inputs_per_class: 1\n")
        shutil.copy2(f"{violation_dir}/org-config.yaml", f"{violation_dir}/minimize.yaml")
        with open(f"{violation_dir}/minimize.yaml", "a") as f:
            f.write("\n# Overwrite some of the configuration options to reproduce the violation\n")
            f.write(f"data_generator_seed: {violation.input_sequence[0].seed}\n")

        # we're about to store stats into a file - disable colors
        color_on = CONF.color
        CONF.color = False

        try:
            # store the violation report
            with open(f"{violation_dir}/report.txt", "w") as f:
                f.write("# Violation Report\n\n")
                f.write(f"* Test Case ID: {STAT.test_cases - 1}\n")
                f.write(f"* Detected: {datetime.today().strftime('%d.%m.%y at %H:%M:%S')}\n\n")
                f.write("* Time to detection:"
                        f" {(datetime.today() - self.log.start_time).total_seconds()}\n")
                f.write("* Statistics:\n")
                f.write(str(STAT) + "\n")

                f.write("\n## Generation Properties\n")
                f.write(f"* Program seed: {test_case.generator_seed}\n")
                f.write(f"* Input seed: {violation.input_sequence[0].seed}\n")
                f.write("* Faulty page properties:\n")
                target_desc = self.code_gen._target_desc
                for actor in test_case.get_actors(sorted_=True):
                    actor_id = actor.get_id()
                    f.write(f"  - Actor {actor_id}:\n")

                    # list only the PTE bits whose value differs from the default
                    pte_fields = []
                    for field in target_desc.pte_bits:
                        offset, default = target_desc.pte_bits[field]
                        value = bool(actor.data_properties & (1 << offset))
                        if value != default:
                            pte_fields.append(f"{field}={value}")
                    f.write(f"    * PTE: {'; '.join(pte_fields)}\n")

                    # the EPTE line is written only for guest actors
                    if actor.mode != ActorMode.GUEST:
                        continue
                    vm_pte_fields = []
                    for field in target_desc.vm_pte_bits:
                        offset, default = target_desc.vm_pte_bits[field]
                        value = bool(actor.data_ept_properties & (1 << offset))
                        if value != default:
                            vm_pte_fields.append(f"{field}={value}")
                    f.write(f"    * EPTE: {'; '.join(vm_pte_fields)}\n")

                f.write("\n## Counterexample Inputs\n")
                for m in violation.measurements:
                    f.write(f"\nInput #{m.input_id}\n")
                    f.write(f"* Hardware trace:\n {m.htrace.full_str()}\n")
                    f.write(f"* Contract trace (hash): {m.ctrace}\n")
                    f.write(f"* Contract trace (detailed): {m.ctrace.full_str()}\n")
        finally:
            # restore the previous color setting, even if writing the report failed
            CONF.color = color_on

    def _report_bug_tainting(self, round_manager: _RoundManager) -> None:
        """
        Warn that the fast-path contract traces differ from the full traces and, if a work
        directory is set and generation is enabled, store the test case and its original
        inputs under `<work_dir>/bugs/`.

        :param round_manager: the round manager holding the offending test case and inputs
        """
        warning("fuzzer", "Fast path contract traces do not match the full traces")
        if not (self._work_dir and CONF.is_generation_enabled()):
            return

        warning("fuzzer", f"Storing the bug into {self._work_dir}/bugs/")

        # _store_violation_artifact is not applicable here: there is no actual violation,
        # only a test case and inputs worth keeping
        bug_dir = self._create_timestamped_dir(f"{self._work_dir}/bugs/")
        round_manager.test_case.save(f"{bug_dir}/program.asm")
        for idx, org_input in enumerate(round_manager.org_inputs):
            org_input.save(f"{bug_dir}/input_{idx:04}.bin")

    def _report_bug_arch(self, round_manager: _RoundManager) -> None:
        """
        Warn about an architectural mismatch between the model and the executor and, if
        a work directory is set and generation is enabled, store the first violation of
        the round as an artifact under `<work_dir>/bugs/`.

        :param round_manager: the round manager of the round that exposed the mismatch
        """
        warning("fuzzer", "Architectural mismatch between model and executor detected")
        if not (self._work_dir and CONF.is_generation_enabled()):
            return

        warning("fuzzer", f"Storing the bug into {self._work_dir}/bugs/")
        first_violation = round_manager.violations[0]
        self._store_violation_artifact(first_violation, f"{self._work_dir}/bugs/")

    # ----------------------------------------------------------------------------------------------
    # Private: Subclass hooks for ISA-specific customization
    def _filter(self, test_case: TestCaseProgram, inputs: List[InputData]) -> bool:
        """
        A filter function that can be used to check if a test case is not useful.

        The function is typically used as a part of the fuzzing loop (invoked by self.start),
        but it is also exposed to other classes through standalone_filter.

        The base implementation never filters anything out.

        :param test_case: The test case to be checked
        :param inputs: The inputs to be used with the test case
        :return: True if the test case should be filtered out (not useful), False otherwise (useful)
        """
        return False  # implemented by architecture-specific subclasses

    def _adjust_config(self, _: str) -> None:
        """
        Adjust the configuration based on the given test case.

        Called at the very beginning of __init__, before any module is created.
        The base implementation does nothing.

        :param _: the existing test case passed to the constructor (unused here)
        """

    def _asm_parser_adapter(self, asm: str) -> TestCaseProgram:
        # FIXME: this is a hack to fit the interface; refactor this
        return self.asm_parser.parse_file(asm, self.code_gen, self.elf_parser)


class ArchitecturalFuzzer(Fuzzer):
    """
    A reduced fuzzer that only looks for architectural mismatches between the model and
    the executor. It helps to find bugs in Revizor itself, but it is unable to detect
    contract violations.

    Every round runs nothing but the "arch_mismatch" stage of the round manager.
    """

    def __init__(self,
                 instruction_set_spec: str,
                 work_dir: str,
                 existing_test_case: str = "",
                 inputs: Optional[List[str]] = None):
        """
        Build a regular Fuzzer and warn that contract violations will not be detected.

        :param instruction_set_spec: forwarded to Fuzzer.__init__
        :param work_dir: forwarded to Fuzzer.__init__
        :param existing_test_case: forwarded to Fuzzer.__init__
        :param inputs: forwarded to Fuzzer.__init__ as its fourth argument (input paths)
        """
        super().__init__(instruction_set_spec, work_dir, existing_test_case, inputs)
        warning("fuzzer", "Running in architectural mode. "
                "Contract violations can't be detected!")

    def fuzzing_round(self, test_case: TestCaseProgram, inputs: List[InputData],
                      _: List[int]) -> Optional[Violation]:
        """
        Run a single round that only checks for architectural mismatches.

        :param test_case: the test case to be executed
        :param inputs: the inputs to be tested
        :param _: unused; kept for compatibility with Fuzzer.fuzzing_round
        :return: the first architectural violation, or None if there was no mismatch
        """
        round_manager = _RoundManager(self, test_case, inputs)
        round_manager.execute_stage("arch_mismatch")
        if round_manager.arch_violations:
            return round_manager.arch_violations[0]
        return None


class ArchDiffFuzzer(Fuzzer):
    """
    Fuzzer that compares the execution of a test case with and without speculation fences.
    If the results differ, it reports a violation.

    Used to detect architectural bugs caused by speculative execution.
    """

    def fuzzing_round(self, test_case: TestCaseProgram, inputs: List[InputData],
                      _: List[int]) -> Optional[Violation]:
        """
        Execute the test case twice on the architectural executor, once as is and once with
        speculation fences, and compare the raw readings of each input.

        :param test_case: the test case to be executed
        :param inputs: the inputs to be tested
        :param _: unused; kept for compatibility with Fuzzer.fuzzing_round
        :return: a pseudo-violation for the first input whose fenced and non-fenced readings
                 differ; None if all readings match or if tracing failed with an IOError
        """
        # collect non-fenced traces
        self.arch_executor.load_test_case(test_case)
        try:
            htraces: List[HTrace] = self.arch_executor.trace_test_case(inputs, 1)
        except IOError:
            return None
        reg_values: List[List[int]] = [h.get_raw_readings()[0].tolist() for h in htraces]

        # collect fenced traces; the fenced program lives in a temporary file
        with tempfile.NamedTemporaryFile(delete=False) as fenced:
            fenced_name = fenced.name
        try:
            fenced_test_case = self._create_fenced_test_case(test_case.asm_path(), fenced_name,
                                                             self.asm_parser, self.code_gen,
                                                             self.elf_parser)
            self.arch_executor.load_test_case(fenced_test_case)
            try:
                htraces = self.arch_executor.trace_test_case(inputs, 1)
            except IOError:
                return None
        finally:
            # remove the temporary file on every path, including failures above
            os.remove(fenced_name)
        fenced_reg_values: List[List[int]] = [
            h.get_raw_readings()[0].tolist() for h in htraces
        ]

        # compare the two executions input by input
        for i, input_ in enumerate(inputs):
            if fenced_reg_values[i] == reg_values[i]:
                if "dbg_dump_htraces" in CONF.logging_modes:
                    self._print_reg_values(i, fenced_reg_values[i], reg_values[i])
                continue

            if "dbg_violation" in CONF.logging_modes:
                self._print_reg_values(i, fenced_reg_values[i], reg_values[i])

            return Violation.pseudo_violation_from_inputs([input_], test_case)
        return None

    @staticmethod
    def _print_reg_values(input_id: int, fenced: List[int], non_fenced: List[int]) -> None:
        """ Print the fenced and non-fenced readings of one input (debug output) """
        print(f"Input #{input_id}")
        print(f"Fenced:       {list(fenced)}")
        print(f"Non-fenced:   {list(non_fenced)}")

    @staticmethod
    def _create_fenced_test_case(original_asm: str, fenced_asm: str, asm_parser: AsmParser,
                                 generator: CodeGenerator,
                                 elf_parser: ELFParser) -> TestCaseProgram:
        """
        Hook function to create a test case with speculation fences.
        Must be implemented by ISA-specific subclasses that know what a fence looks like for
        their architecture.

        :param original_asm: path to the assembly file of the original test case
        :param fenced_asm: path of the file that receives the fenced test case
        :param asm_parser: the assembly parser of the fuzzer
        :param generator: the code generator of the fuzzer
        :param elf_parser: the ELF parser of the fuzzer
        :return: the fenced test case
        :raises NotImplementedError: always, in this base implementation
        """

        raise NotImplementedError("This method should be implemented by the subclass")


================================================
FILE: rvzr/instruction_spec.py
================================================
"""
File: Collection of classes that represent instruction specifications.
The specifications typically originate from a JSON ISA spec file.

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from dataclasses import dataclass
from enum import Enum
from typing import List, Final, Tuple, Literal, Optional


class OT(Enum):
    """
    Operand Type (OT): enumeration of the kinds of operands an instruction can have.
    The string form of a member is its bare name (e.g., "REG").
    """
    REG = 1  # Register Operand
    MEM = 2  # Memory Operand
    IMM = 3  # Immediate Operand
    LABEL = 4  # Label Operand
    AGEN = 5  # Memory address in LEA instructions
    FLAGS = 6  # Flags Operand
    COND = 7  # Condition Operand

    def __str__(self) -> str:
        # the public `name` property exposes the member name without the class prefix
        member_name = self.name
        return str(member_name)


# Closed set of strings accepted as the `xtype` of an operand;
# `typing.get_args(XOT)` returns them as a tuple, which allows validating values at run time.
XOT = Literal["f64", "f32", "f16", "2f16", "bf16", "int", "i64", "i32", "i16", "i8", "u256", "u128",
              "u64", "u32", "u16", "u8"]
""" Extended Operand Type (XOT) provides extra information (sign, type) about the operand. """


@dataclass
class OperandSpec:
    """
    Description of a single operand slot of an instruction.
    Instances are normally owned by an InstructionSpec.

    The constructor is hand-written (the dataclass decorator does not replace it),
    so that the operand values can be passed as a list and stored as an immutable tuple.
    """

    values: Final[Tuple[str, ...]]
    """ Values the operand may take (e.g., register names, immediate values). """

    type: Final[OT]
    """ Kind of the operand (e.g., register, memory, immediate). """

    xtype: Final[Optional[XOT]]
    """ Extended type of a SIMD register operand (e.g., f64 for packed double-precision FP). """

    width: Final[int]
    """ Operand width in bits, if applicable (e.g., 64 for a 64-bit register). """

    src: bool
    """ True if the instruction reads the operand. """

    dest: bool
    """ True if the instruction writes the operand. """

    is_signed: Final[bool]
    """ True if the operand is signed. """

    has_magic_value: Final[bool]
    """ True if the operand has a special value that requires unique handling
    (e.g., separate opcode when RAX is a destination).
    """

    def __init__(self,
                 values: List[str],
                 type_: OT,
                 src: bool,
                 dest: bool,
                 width: int = 0,
                 is_signed: bool = True,
                 has_magic_value: bool = False,
                 xtype: Optional[XOT] = None):
        # what the operand is
        self.type = type_
        self.xtype = xtype
        self.width = width
        self.is_signed = is_signed

        # which values it can take (frozen into a tuple)
        self.values = tuple(values)
        self.has_magic_value = has_magic_value

        # how the instruction uses it
        self.src = src
        self.dest = dest

    def __str__(self) -> str:
        listed = ", ".join(self.values)
        return "(" + listed + ")"


@dataclass
class InstructionSpec:
    """
    Description of one instruction form.
    Typically created from an entry of a JSON specification file (base.json).

    The constructor is hand-written (the dataclass decorator does not replace it);
    operand lists start empty and are filled by whoever builds the spec.
    Hashing is based on the textual form (name and explicit operands).
    """

    name: Final[str]
    """ Instruction name. """

    category: Final[str]
    """ Instruction category, as given in the JSON specification file. """

    is_control_flow: Final[bool]
    """ True if the instruction alters control flow (e.g., jumps, calls). """

    operands: List[OperandSpec]
    """ Explicit operands of the instruction. """

    implicit_operands: List[OperandSpec]
    """ Implicit operands of the instruction. """

    has_mem_operand: bool = False
    """ True if the instruction has a memory operand. """

    has_write: bool = False
    """ True if the instruction writes to a destination operand. """

    has_magic_value: bool = False
    """ True if the instruction has a special value that requires unique handling. """

    def __init__(self, name: str, category: str, is_control_flow: bool = False):
        self.operands = []
        self.implicit_operands = []

        self.name = name
        self.category = category
        self.is_control_flow = is_control_flow

    def __str__(self) -> str:
        # every explicit operand is followed by a single space (including the last one)
        rendered_operands = "".join(str(operand) + " " for operand in self.operands)
        return f"{self.name} {rendered_operands}"

    def __hash__(self) -> int:
        text_form = str(self)
        return hash(text_form)


================================================
FILE: rvzr/isa_spec.py
================================================
"""
File: Loading of the JSON ISA specification and post-processing of the resulting instruction set.

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from __future__ import annotations
import json
from copy import deepcopy
from typing import Dict, List, Optional, Any, get_args

from .instruction_spec import OT, XOT, OperandSpec, InstructionSpec
from .config import CONF
from .logs import ISALogger

# Translation of the operand type strings found in the JSON spec (field "type_")
# into the corresponding OT enumeration members
_OT_STR_TO_ENUM = {
    "REG": OT.REG,
    "MEM": OT.MEM,
    "IMM": OT.IMM,
    "LABEL": OT.LABEL,
    "AGEN": OT.AGEN,
    "FLAGS": OT.FLAGS,
    "COND": OT.COND,
}

# Extended operand types (see XOT) that cause an instruction to be filtered out as
# "unsupported FP/SIMD" when they appear on one of its register operands
_FP_XOT = ["f64", "f32", "f16", "2f16"]
_BFP_XOT = ["bf16"]


class InstructionSet:
    """
    Instruction set of a given architecture, loaded from a JSON specification file.

    Holds the filtered list of InstructionSpec objects, an unfiltered copy of it,
    a few summary flags, and per-type lists of instructions.
    """

    instructions: List[InstructionSpec]
    instructions_unfiltered: List[InstructionSpec]
    logger: ISALogger

    has_unconditional_branch: bool = False
    has_conditional_branch: bool = False
    has_indirect_branch: bool = False
    has_reads: bool = False
    has_writes: bool = False

    control_flow_specs: List[InstructionSpec]
    non_control_flow_specs: List[InstructionSpec]
    non_memory_access_specs: List[InstructionSpec]
    load_instruction: List[InstructionSpec]
    store_instructions: List[InstructionSpec]
    cond_branches: List[InstructionSpec]

    def __init__(self, filename: str, include_categories: Optional[List[str]] = None):
        # load everything the spec file offers ...
        self.instructions = []
        _read_json_spec(self, filename)

        # ... and keep a snapshot taken before any filtering
        self.instructions_unfiltered = deepcopy(self.instructions)

        # post-processing pipeline; the steps run in this exact order
        _reduce(self, include_categories)
        _set_isa_properties(self)
        _dedup(self)
        _set_categories(self)

    def get_return_spec(self) -> InstructionSpec:
        """ Build the spec of the RET instruction for the configured architecture """
        arch = CONF.instruction_set
        if arch == "x86-64":
            category = "BASE-RET"
        elif arch == "arm64":
            category = "general-ret"
        else:
            raise NotImplementedError(f"Unsupported instruction set: {CONF.instruction_set}")
        return InstructionSpec("ret", category, is_control_flow=True)

    def get_unconditional_jump_spec(self) -> InstructionSpec:
        """
        Build the spec of the unconditional jump instruction for the configured architecture.
        The spec has a single 64-bit label operand, which is a source operand.
        """
        arch = CONF.instruction_set
        if arch == "x86-64":
            name, category = "jmp", "BASE-UNCOND_BR"
        elif arch == "arm64":
            name, category = "b", "general-uncond_branch"
        else:
            raise NotImplementedError(f"Unsupported instruction set: {CONF.instruction_set}")

        jump_spec = InstructionSpec(name, category, is_control_flow=True)
        target = OperandSpec([], OT.LABEL, src=True, dest=False, width=64)
        jump_spec.operands.append(target)
        return jump_spec


# ==================================================================================================
# Local service functions that post-process the instruction set
# ==================================================================================================
def _read_json_spec(isa: InstructionSet, filename: str) -> None:
    """
    Load the JSON ISA specification and append the parsed instructions to `isa.instructions`.

    The file is expected to hold a list of instruction nodes, each providing the keys
    "name", "category", "is_control_flow", "operands" and "implicit_operands".

    :param isa: instruction set to populate; its `instructions` list is extended in place
    :param filename: path to the JSON specification file
    :raises OSError: if the file cannot be opened
    :raises json.JSONDecodeError: if the file does not contain valid JSON
    :raises KeyError: if an instruction node lacks one of the mandatory keys
    """
    # JSON is exchanged as UTF-8; decode it explicitly rather than with the locale's default
    # encoding, which differs between platforms
    with open(filename, "r", encoding="utf-8") as f:
        root = json.load(f)

    for instruction_node in root:
        instruction = InstructionSpec(instruction_node["name"], instruction_node["category"],
                                      instruction_node["is_control_flow"])

        # explicit operands; a magic value on any of them marks the whole instruction
        for op_node in instruction_node["operands"]:
            op = _parse_json_operand(op_node, instruction)
            instruction.operands.append(op)
            if op.has_magic_value:
                instruction.has_magic_value = True

        # implicit operands (no magic-value propagation here)
        for op_node in instruction_node["implicit_operands"]:
            op = _parse_json_operand(op_node, instruction)
            instruction.implicit_operands.append(op)

        isa.instructions.append(instruction)


def _parse_json_operand(op: Dict[str, Any], parent: InstructionSpec) -> OperandSpec:
    """
    Convert one operand node of the JSON spec into an OperandSpec.

    As a side effect, a memory operand marks `parent` as having a memory operand, and a
    memory operand that is a destination also marks `parent` as writing to memory.

    :param op: operand node; "type_", "src", "dest" and "width" are mandatory,
           "values", "is_signed" and "xtype" are optional
    :param parent: the instruction spec that owns the operand
    :return: the parsed operand spec
    """
    kind = _OT_STR_TO_ENUM[op["type_"]]

    # register names are stored in sorted order; other value lists keep the order of the file
    raw_values = op.get("values", [])
    values = sorted(raw_values) if kind == OT.REG else raw_values

    spec = OperandSpec(
        values,
        kind,
        op["src"],
        op["dest"],
        op["width"],
        op.get("is_signed", True),
        xtype=op.get("xtype", None),
    )

    if kind != OT.MEM:
        return spec

    # memory operands are summarized on the owning instruction
    parent.has_mem_operand = True
    if spec.dest:
        parent.has_write = True
    return spec


def _reduce(isa: InstructionSet, include_categories: Optional[List[str]]) -> None:
    """
    Remove unsupported instructions and operand values from `isa.instructions` (in place).

    The reduction is done in two passes:
      1. every instruction rejected by `is_supported` is removed;
      2. for the remaining instructions, blocked registers are stripped from the value lists
         of the explicit register operands; an instruction is removed when one of these
         operands is left without any usable value.

    :param isa: instruction set whose `instructions` list is filtered
    :param include_categories: if non-empty, instructions of other categories are removed
           (unless their name is in CONF.instruction_allowlist)
    """

    def is_supported(spec: InstructionSpec) -> bool:
        # pylint: disable=too-many-return-statements
        # This is justified as it is a filtering function

        # NOTE: `logger` and `register_blocklist` are locals of the enclosing function that are
        # assigned further below; they are bound by the time this closure is called

        if not CONF.is_generation_enabled():
            # if we use an existing test case, then instruction filtering is irrelevant
            return True

        # allowlist has priority over blocklist
        # (an allowlisted name also bypasses all the remaining checks of this function)
        if spec.name in CONF.instruction_allowlist:
            return True

        if include_categories and spec.category not in include_categories:
            logger.dbg_dump_filtering_reason(spec, "category not in include_categories")
            return False

        if spec.name in CONF.instruction_blocklist:
            logger.dbg_dump_filtering_reason(spec, "in instruction_blocklist")
            return False

        # explicit memory operands: only the first listed value is checked against the blocklist
        for operand in spec.operands:
            if operand.type == OT.MEM and operand.values \
                    and operand.values[0] in register_blocklist:
                logger.dbg_dump_filtering_reason(spec, "mem operand uses blocked register")
                return False

        # FP SIMD is not supported
        for operand in spec.operands:
            if operand.type != OT.REG or operand.xtype is None:
                continue
            assert operand.xtype in get_args(XOT), f"Unknown xtype value: {operand.xtype}"
            if operand.xtype in _FP_XOT or operand.xtype in _BFP_XOT:
                logger.dbg_dump_filtering_reason(spec, "uses unsupported FP/SIMD registers")
                return False

        # implicit operands: unlike for explicit operands, `values` is indexed without
        # an emptiness check, i.e., implicit MEM/REG operands are expected to list a value
        for implicit_operand in spec.implicit_operands:
            assert implicit_operand.type != OT.LABEL  # I know no such instructions
            if implicit_operand.type == OT.MEM \
                    and implicit_operand.values[0] in register_blocklist:
                logger.dbg_dump_filtering_reason(spec, "implicit mem operand uses blocked register")
                return False

            if implicit_operand.type == OT.REG \
                    and implicit_operand.values[0] in register_blocklist:
                assert len(implicit_operand.values) == 1
                logger.dbg_dump_filtering_reason(spec, "implicit reg operand uses blocked register")
                return False
        return True

    logger = ISALogger()

    # Identify which registers should not be used
    # (a register listed in both config lists stays usable)
    register_blocklist = set(CONF.register_blocklist) - set(CONF.register_allowlist)

    # Remove unsupported instructions
    # (collected first and removed afterwards, so the list is not modified while iterating;
    # note that list.remove() drops the first element that compares equal to `s`)
    skip_list = []
    for s in isa.instructions:
        if not is_supported(s):
            skip_list.append(s)
    for s in skip_list:
        isa.instructions.remove(s)

    # Remove unsupported operand values from operand specs;
    # If all operand values are unsupported, remove the instruction
    skip_list = []
    for s in isa.instructions:
        operands = list(s.operands)  # make a copy
        for op_id, op in enumerate(operands):
            # filtering applies only to registers
            if op.type != OT.REG:
                continue

            # identify supported registers
            op_values = sorted(list(set(op.values) - register_blocklist))

            # FIXME: temporary disabled generation of higher reg. bytes for x86
            # (in a name that ends with 'h', every 'h' is replaced with 'l', e.g., 'ah' -> 'al';
            # the result is neither re-checked against the blocklist nor de-duplicated)
            for i, reg in enumerate(op_values):
                if reg[-1] == 'h':
                    op_values[i] = reg.replace('h', 'l')

            # no supported values -> skip this instruction
            if not op_values:
                skip_list.append(s)
                break

            # otherwise, update the operand
            # (a new OperandSpec is built because the `values` field is declared Final)
            s.operands[op_id] = OperandSpec(op_values, op.type, op.src, op.dest, op.width,
                                            op.is_signed, op.has_magic_value, op.xtype)
    for s in skip_list:
        isa.instructions.remove(s)


def _set_isa_properties(isa: InstructionSet) -> None:
    """
    Derive the summary flags of the instruction set that are used in the generation process.

    Each instruction raises at most one flag:
      - a control-flow instruction raises `has_unconditional_branch` if its category is one of
        the unconditional-branch categories, and `has_conditional_branch` otherwise;
      - any other instruction with a memory operand raises `has_writes` if it writes,
        and `has_reads` otherwise.
    Flags are only ever raised here, never cleared.
    """
    unconditional_categories = ("BASE-UNCOND_BR", "general-uncond_branch")

    for spec in isa.instructions:
        if spec.is_control_flow:
            is_unconditional = spec.category in unconditional_categories
            flag = "has_unconditional_branch" if is_unconditional else "has_conditional_branch"
        elif spec.has_mem_operand:
            flag = "has_writes" if spec.has_write else "has_reads"
        else:
            continue  # nothing to record for this instruction
        setattr(isa, flag, True)


def _dedup(isa: InstructionSet) -> None:
    """
    Instruction set spec may contain several copies of the same instruction.
    Remove them, keeping only the last copy of each instruction; `isa.instructions` is
    modified in place and the relative order of the surviving instructions is preserved.

    Two instructions are considered copies of each other when they have the same name and
    the same number of explicit operands, and when each pair of corresponding operands agrees
    on the type, on the values and, except for immediates, on the width.
    (The category, the implicit operands and the src/dest flags are not compared.)
    """
    instructions = isa.instructions
    n_instructions = len(instructions)

    # Duplicates are tracked by position rather than by object: instruction specs that are
    # identical compare (and hash) as equal, so a set of specs would collapse several copies
    # into a single entry and leave all but one of them in the list
    duplicate_ids = set()
    for i in range(n_instructions):
        inst1 = instructions[i]
        for j in range(i + 1, n_instructions):
            inst2 = instructions[j]
            if inst1.name != inst2.name or len(inst1.operands) != len(inst2.operands):
                continue

            # all() stops at the first operand pair that differs
            is_copy = all(
                op1.type == op2.type and op1.values == op2.values and
                (op1.width == op2.width or op1.type == OT.IMM)
                for op1, op2 in zip(inst1.operands, inst2.operands))
            if is_copy:
                # a later copy exists -> drop this one; no need to look any further
                duplicate_ids.add(i)
                break

    if duplicate_ids:
        isa.instructions[:] = [
            inst for i, inst in enumerate(instructions) if i not in duplicate_ids
        ]


def _set_categories(isa: InstructionSet) -> None:
    """
    Sort the instructions of the ISA into the per-type lists used by the generator
    (control flow / non control flow / no memory access / loads / stores / conditional branches).

    Side effect: when the ISA has no control-flow instructions, the config is adjusted so that
    every basic block has exactly one successor.
    """
    control_flow = [spec for spec in isa.instructions if spec.is_control_flow]
    isa.control_flow_specs = control_flow
    # adjust the config to the available instruction set
    if not control_flow:
        CONF.min_successors_per_bb = 1
        CONF.max_successors_per_bb = 1

    straight_line = [spec for spec in isa.instructions if not spec.is_control_flow]
    isa.non_control_flow_specs = straight_line
    assert isa.non_control_flow_specs, \
        "The instruction set is insufficient to generate a test case"

    isa.non_memory_access_specs = [spec for spec in straight_line if not spec.has_mem_operand]

    if CONF.avg_mem_accesses == 0:
        # memory accesses are disabled -> nothing to pick loads and stores from
        isa.load_instruction = []
        isa.store_instructions = []
    else:
        with_memory = [spec for spec in straight_line if spec.has_mem_operand]
        isa.load_instruction = [spec for spec in with_memory if not spec.has_write]
        isa.store_instructions = [spec for spec in with_memory if spec.has_write]
        assert isa.load_instruction or isa.store_instructions, \
               "The instruction set does not have memory accesses while `avg_mem_accesses > 0`"

    # every control-flow instruction other than the unconditional jump counts as conditional
    uncond_name = isa.get_unconditional_jump_spec().name.lower()
    isa.cond_branches = [spec for spec in control_flow if spec.name.lower() != uncond_name]


================================================
FILE: rvzr/logs.py
================================================
"""
File: Global classes that provide service to all Revizor modules

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from __future__ import annotations
import sys
from datetime import datetime
from typing import TYPE_CHECKING, NoReturn, Dict, List, Optional, Set, Any, Final, Tuple
from pprint import pformat
from traceback import print_stack

from .config import CONF
from .stats import FuzzingStats

if TYPE_CHECKING:
    from .model import Model
    from .sandbox import SandboxLayout
    from .model_unicorn.execution_context import ModelExecutionState
    from .model_unicorn.speculator_abc import UnicornSpeculator
    from .model_unicorn.model import UnicornModel
    from .instruction_spec import InstructionSpec
    from .traces import HTrace, Violation, CTrace
    from .tc_components.test_case_data import InputData

# NOTE(review): both constants equal 2**64; despite its name, MASK_64BIT is not the all-ones
# value 2**64 - 1 - confirm the intended use at the call sites
MASK_64BIT = pow(2, 64)
POW2_64 = pow(2, 64)

# ANSI escape sequences for colored terminal output; COL_RESET restores the default style
RED = '\033[33;31m'
GREEN = '\033[33;32m'
YELLOW = '\033[33;33m'
BLUE = '\033[33;34m'
PURPLE = '\033[33;35m'
CYAN = '\033[33;36m'
GRAY = '\033[33;37m'
COL_RESET = "\033[0m"

# colors passed to CTrace.full_str() when contract traces are dumped
M_COL = PURPLE
PC_COL = COL_RESET
VAL_COL = CYAN

# colors passed to HTrace.full_str() when hardware traces are dumped
HTRACE_R1_COL = CYAN
HTRACE_R2_COL = YELLOW

# module-level statistics object; read by the progress and summary messages of the fuzzer log
STAT = FuzzingStats()


# ==================================================================================================
# Private: Logging configuration
# ==================================================================================================
class _LoggingConfig:  # pylint: disable=too-few-public-methods  # because this is a data class
    """
    A global object responsible for keeping track of how stuff should be printed.
    This object is shared among all modules (via Borg pattern)
    and is used to determine the logging behavior.

    All instances share a single attribute dictionary, hence a change made through one
    instance is visible through every other one. The shared state is initialized from CONF
    when the first instance is created.
    """
    _borg_shared_state: Dict[Any, Any] = {}

    redraw_mode: bool = True
    line_ending: str = ""

    # info modes
    info: bool = False
    stat: bool = False
    debug: bool = False

    # debugging specific modules
    dbg_timestamp: bool = False
    dbg_violation: bool = False
    dbg_dump_htraces: bool = False
    dbg_dump_ctraces: bool = False
    dbg_dump_traces_unlimited: bool = False
    dbg_executor_raw: bool = False
    dbg_model: bool = False
    dbg_coverage: bool = False
    dbg_generator: bool = False
    dbg_priming: bool = False
    dbg_isa_filter: bool = False

    # internal switch (not a config option): controls printing of the per-input header
    # in the model debug trace
    dbg_model_print_id: bool = True

    # names accepted in the `logging_modes` config option; each maps to the attribute
    # of the same name
    _all_modes: List[str] = [
        "info", "stat", "dbg_timestamp", "dbg_violation", "dbg_dump_htraces", "dbg_dump_ctraces",
        "dbg_dump_traces_unlimited", "dbg_executor_raw", "dbg_model", "dbg_coverage",
        "dbg_generator", "dbg_priming", "dbg_isa_filter"
    ]

    def __init__(self) -> None:
        # Borg pattern: every instance uses the same attribute dictionary
        self.__dict__ = self._borg_shared_state
        if not self._borg_shared_state:
            # first instance -> initialize the shared state from the config
            self.update_logging_modes()
            self.line_ending = '\n' if CONF.multiline_output else ''
            self.redraw_mode = not CONF.multiline_output

    def update_logging_modes(self) -> None:
        """
        Adjust the logging configuration after a change has been made to the CONF object.

        Terminates the program (via `error`) if `CONF.logging_modes` contains an unknown mode.
        Prints a warning if a requested debug mode cannot work because Python runs in
        optimized mode.
        """
        # Check that all entries in the config are valid
        for mode in CONF.logging_modes:
            if not mode:  # skip empty values
                continue
            if mode not in self._all_modes:
                error(f"Unknown value '{mode}' of config variable 'logging_modes'")

        # Set the logging modes; `debug` is on if at least one of the dbg_* modes is on
        self.debug = False
        for mode in self._all_modes:
            val = mode in CONF.logging_modes
            setattr(self, mode, val)
            if "dbg" in mode:
                self.debug |= val

        # Check if Python is not running in optimized mode if debugging is required
        # (otherwise, the debug messages won't be printed)
        if not __debug__:
            # dbg_violation is part of the check because the detailed violation report
            # is likewise skipped when __debug__ is False
            dbg_required = any([
                self.dbg_timestamp, self.dbg_violation, self.dbg_model, self.dbg_coverage,
                self.dbg_dump_htraces, self.dbg_dump_ctraces, self.dbg_generator,
                self.dbg_priming, self.dbg_executor_raw, self.dbg_isa_filter
            ])
            if dbg_required:
                warning(
                    "", "Current value of `logging_modes` requires debugging mode!\n"
                    "Remove '-O' from python arguments")


# ==================================================================================================
# Public interface to logging configuration
# ==================================================================================================
# create an initial instance of the logging configuration
# to be used by functions in this module
# (all _LoggingConfig instances share their state, so this one reflects later updates as well)
_LOG_CONF = _LoggingConfig()


def update_logging_after_config_change() -> None:
    """
    Update the logging configuration after a change has been made to the CONF object.

    Re-reads `CONF.logging_modes` into the shared logging configuration. The line ending
    and the redraw mode are not refreshed by this call.
    """
    _LOG_CONF.update_logging_modes()


# ==================================================================================================
# Public: Simple logging functions
# ==================================================================================================
# FIXME: deprecated; use exceptions instead
def error(msg: str, print_tb: bool = False, print_last_tb: bool = False) -> NoReturn:
    """
    Print an error message and terminate the program with exit code 1.

    :param msg: text of the error message
    :param print_tb: if set, print the complete call stack before the message
    :param print_last_tb: if set (and `print_tb` is not), print only the last 3 stack entries
    """
    # when the progress line is redrawn in place, move to a fresh line first
    if _LOG_CONF.redraw_mode:
        print("")

    if print_tb or print_last_tb:
        print("Encountered an unrecoverable error\nTraceback:")
        # print_tb takes precedence: no limit on the stack depth
        print_stack(limit=None if print_tb else 3)
        print("\n")

    text = f"{RED}ERROR:{COL_RESET} {msg}" if CONF.color else f"ERROR: {msg}"
    print(text)
    sys.exit(1)


def warning(src: str, msg: str) -> None:
    """
    Print a warning message.

    :param src: name of the component that issues the warning (printed in brackets)
    :param msg: text of the warning
    """
    # when the progress line is redrawn in place, move to a fresh line first
    if _LOG_CONF.redraw_mode:
        print("")

    text = f"{RED}WARNING:{COL_RESET} [{src}] {msg}" if CONF.color else f"WARNING: [{src}] {msg}"
    print(text)


def inform(src: str, msg: str, end: str = "\n") -> None:
    """
    Print a general information message; does nothing unless the `info` mode is enabled.

    :param src: name of the component that issues the message (printed in brackets)
    :param msg: text of the message
    :param end: string appended after the message
    """
    if not _LOG_CONF.info:
        return

    # when the progress line is redrawn in place, move to a fresh line first
    if _LOG_CONF.redraw_mode:
        print("")
    print(f"INFO: [{src}] {msg}", end=end, flush=True)


def dbg(src: str, msg: str) -> None:
    """
    Print a debug message; does nothing when Python runs in optimized mode
    or when no debug mode is enabled.

    :param src: name of the component that issues the message (printed in brackets)
    :param msg: text of the message
    """
    if not (__debug__ and _LOG_CONF.debug):
        return

    # when the progress line is redrawn in place, move to a fresh line first
    if _LOG_CONF.redraw_mode:
        print("")
    print(f"DBG: [{src}] {msg}")


# ==================================================================================================
# Public: Module-specific logging
# ==================================================================================================
class FuzzLogger:
    """
    A class that provides logging services for the Fuzzer module.

    The progress messages are printed only in the `info` logging mode; the `dbg_*` methods
    are additionally disabled when Python runs in optimized mode (`__debug__` is False).
    """

    one_percent_progress: float = 0.0
    progress: float = 0.0
    progress_percent: int = 0
    msg: str = ""
    _msg_width: int = 0
    start_time: datetime
    _conf: Final[_LoggingConfig]

    def __init__(self) -> None:
        self._conf = _LoggingConfig()

    def _print_progress_event(self, event: str) -> None:
        """
        Print the current progress line followed by `event`, and remember the width of the
        widest line printed so far (used to pad the progress line when it is redrawn)
        """
        msg = self.msg + event
        self._msg_width = max(self._msg_width, len(msg))
        print(msg, end=self._conf.line_ending, flush=True)

    # ----------------------------------------------------------------------------------------------
    # Phases of the fuzzer

    def reset(self, max_iterations: int, start_time: datetime) -> None:
        """ Reset the progress tracking for a campaign of `max_iterations` test cases """
        self.one_percent_progress = max_iterations / 100
        self.progress = 0
        self.progress_percent = 0
        self.msg = ""
        self.start_time = start_time

    def start(self, iterations: int, start_time: datetime) -> None:
        """ Print the start message of the fuzzer (namely, the start time) """
        self.reset(iterations, start_time)
        if not self._conf.info:
            return
        inform("fuzzer", start_time.strftime('Starting at %H:%M:%S'))

    def start_round(self, round_id: int) -> None:
        """ Update the progress bar for the next fuzzing round """
        if not self._conf.info:
            return

        # Update the progress state
        if STAT.test_cases > self.progress:
            self.progress += self.one_percent_progress
            self.progress_percent += 1
        if STAT.test_cases == 0:
            msg = ""
        else:
            msg = f"\r{STAT.test_cases:<6}({self.progress_percent:>2}%)| Stats: "
            msg += STAT.get_brief()
        self.msg = msg

        # Print the progress bar
        # (padded to the widest line printed so far, so that leftovers are overwritten)
        if STAT.test_cases > 0:
            print(f"{self.msg:<{self._msg_width}}", end=self._conf.line_ending, flush=True)
        if self._conf.dbg_timestamp and round_id and round_id % 1000 == 0:
            dbg(
                "fuzzer", f"Time: {datetime.today()} | "
                f" Duration: {(datetime.today() - self.start_time).total_seconds()} seconds")

    def priming(self, num_violations: int) -> None:
        """ Print a message indicating that the fuzzer is in the priming phase """
        if not self._conf.info:
            return
        self._print_progress_event(f"> Priming  {num_violations}             ")

    def nesting_increased(self) -> None:
        """ Print a message indicating that the model's nesting level has been increased """
        if not self._conf.info:
            return
        self._print_progress_event(f"> Nest   {CONF.model_max_nesting}         ")

    def slow_path(self) -> None:
        """ Print a message indicating that the fuzzer has entered the slow path """
        if not self._conf.info:
            return
        self._print_progress_event(">" + " Entering slow path...")

    def timeout(self) -> None:
        """ Print a message indicating that the fuzzer has timed out """
        if not self._conf.info:
            return
        inform("fuzzer", "\nTimeout expired")

    def sample_size_increase(self, sample_size: int) -> None:
        """ Print a message indicating that the sample size has been increased """
        if not self._conf.info:
            return
        self._print_progress_event(">" + " Increasing sample size... to " + str(sample_size))

    def report_violations(self, violation: Violation) -> None:
        """ Print the detected violations (printed regardless of the logging modes) """
        print("\n\n================================ Violations detected ==========================")
        print(violation.full_str())

    def finish(self) -> None:
        """ Print the finish message of the fuzzer (namely, the finish
        time and the duration of the fuzzer) """
        if not self._conf.info:
            return
        now = datetime.today()
        print("")  # new line after the progress bar
        if self._conf.stat:
            print("================================ Statistics ================================"
                  "===\n")
            print(STAT)
        # the duration and the finish time are derived from the same timestamp
        print(f"Duration: {(now - self.start_time).total_seconds():.1f}")
        print(now.strftime('Finished at %H:%M:%S'))

    def report_model_coverage(self, model: Model) -> None:
        """ Save model coverage into `coverage.txt` (only in the `dbg_coverage` mode) """
        if not __debug__:
            return
        if not self._conf.dbg_coverage:
            return
        model.report_coverage("coverage.txt")

    # ----------------------------------------------------------------------------------------------
    # Debugging
    def dbg_dump_traces(self, inputs: List[InputData], htraces: List[HTrace],
                        reference_htraces: List[HTrace], ctraces: List[CTrace]) -> None:
        """
        Print the collected traces (in the `dbg_dump_htraces`/`dbg_dump_ctraces` modes).

        At most 100 inputs are printed unless `dbg_dump_traces_unlimited` is set.
        A corrupted or ignored hardware trace is printed as its reference trace, if that one is
        usable. The lists passed by the caller are not modified.

        :param inputs: inputs the traces were collected for
        :param htraces: hardware traces, one per input
        :param reference_htraces: reference hardware traces, one per element of `htraces`
        :param ctraces: contract traces, one per input
        """
        if not __debug__:
            return
        if not self._conf.dbg_dump_htraces and not self._conf.dbg_dump_ctraces:
            return
        if not htraces:  # might be empty due to tracing errors
            return

        # Optionally trim the output
        if len(inputs) > 100 and not self._conf.dbg_dump_traces_unlimited:
            warning("fuzzer", "Trace output will be limited to 100 traces")
            inputs = inputs[:100]

        # Replace corrupted traces with the reference traces;
        # done on a private copy, so that printing never alters the caller's data
        shown_htraces = list(htraces)
        for i, htrace in enumerate(shown_htraces):
            if htrace.is_corrupted_or_ignored() \
               and not reference_htraces[i].is_corrupted_or_ignored():
                shown_htraces[i] = reference_htraces[i]

        print("\n================================ Collected Traces =============================")
        # model debugging is switched off while the traces are printed;
        # the flag is shared by all loggers, so it is restored even if printing fails
        org_debug_state = self._conf.dbg_model
        self._conf.dbg_model = False
        try:
            for i, _ in enumerate(inputs):
                print(f"- Input {i}:")
                colors: Tuple[str, ...]
                if self._conf.dbg_dump_ctraces:
                    colors = (M_COL, PC_COL, VAL_COL, COL_RESET) if CONF.color else ()
                    ctrace_str = ctraces[i].full_str(*colors)
                    print(f"  CTr: {ctrace_str} | Hash: {ctraces[i]}")
                if self._conf.dbg_dump_htraces:
                    colors = (HTRACE_R1_COL, HTRACE_R2_COL, COL_RESET) if CONF.color else ()
                    htrace_str = shown_htraces[i].full_str('    ', *colors)
                    print(f"  HTr:\n{htrace_str}")
                # the feedback is highlighted when its first element exceeds the second one
                max_pfc = shown_htraces[i].get_max_pfc()
                if CONF.color and max_pfc[0] > max_pfc[1]:
                    print(f"  Feedback: {YELLOW}{max_pfc}{COL_RESET}")
                else:
                    print(f"  Feedback: {max_pfc}")
        finally:
            self._conf.dbg_model = org_debug_state

    def dbg_dump_architectural_traces(self, hardware_regs: List[List[int]],
                                      model_regs: List[List[int]]) -> None:
        """
        Print the architectural traces (only for the "architectural" fuzzer and only in the
        `dbg_dump_htraces`/`dbg_dump_ctraces` modes).

        At most 100 inputs are printed unless `dbg_dump_traces_unlimited` is set.

        :param hardware_regs: register values observed on the hardware, one list per input
        :param model_regs: register values produced by the model, one list per input
        """
        if not __debug__:
            return
        if CONF.fuzzer != "architectural":
            return
        if not self._conf.dbg_dump_htraces and not self._conf.dbg_dump_ctraces:
            return

        print("\n========================== Architectural Traces ==============================")
        for i, _ in enumerate(hardware_regs):
            # stop before the 101st trace (i is zero-based)
            if i >= 100 and not self._conf.dbg_dump_traces_unlimited:
                warning("fuzzer", "Trace output is limited to 100 traces")
                break
            print(f"Input {i}:")
            if self._conf.dbg_dump_ctraces:
                print(f"  Model Registers: {[hex(v) for v in model_regs[i]]}")
            if self._conf.dbg_dump_htraces:
                print(f"  HW Registers:    {[hex(v) for v in hardware_regs[i]]}")

    def dbg_violation(self, violation: Violation, model: Model) -> None:
        """
        Print a detailed report of the violation (only in the `dbg_violation` mode):
        the test case is re-executed on the model with model debugging enabled, once for the
        first measurement of every hardware class of the violation.
        """
        if not __debug__:
            return

        if self._conf.dbg_violation:
            print("================================ Violation Traces =============================")
            hw_classes = violation.get_hw_classes()
            model.load_test_case(violation.test_case_code)
            for hw_class in hw_classes:
                measurement = hw_class.measurements[0]
                print(f"                      ##### Input {measurement.input_id} #####")
                # temporarily force the model debug trace (without its own input header);
                # the flags are shared by all loggers, so they are restored even on failure
                model_debug_state = self._conf.dbg_model, self._conf.dbg_model_print_id
                self._conf.dbg_model = True
                self._conf.dbg_model_print_id = False
                try:
                    model.trace_test_case([measurement.input_], CONF.model_max_nesting)
                finally:
                    self._conf.dbg_model, self._conf.dbg_model_print_id = model_debug_state
                print("\n\n")

    def dbg_priming_progress(self, input_id: int, current_input_id: int) -> None:
        """ Print a message indicating the progress of the priming phase """
        if not __debug__:
            return
        if not self._conf.dbg_priming:
            return
        print(f"\nPriming #{input_id} in place of #{current_input_id}")

    def dbg_priming_fail(self, input_id: int, current_input_id: int, htrace_to_reproduce: HTrace,
                         new_htrace: HTrace) -> None:
        """ Print a message indicating that the priming phase has failed,
        followed by a side-by-side view of the expected and the new hardware trace """
        if not __debug__:
            return
        if not self._conf.dbg_priming:
            return

        print(f"\nPriming failed for input {input_id} in place of {current_input_id}")
        print(f"{'HTrace':64} Original|New")
        print(htrace_to_reproduce.full_pair_str(new_htrace))


class ModelLogger:
    """
    Logging services for the Model modules.

    The main job of this class is to print the debug trace of the model
    (printed when dbg_model or dbg_violation is set in the config file).
    """

    model_layout: Optional[SandboxLayout] = None

    def __init__(self) -> None:
        self._conf = _LoggingConfig()

    def set_model_layout(self, layout: SandboxLayout) -> None:
        """ Remember the layout of the model being debugged (read by `dbg_rollback`) """
        self.model_layout = layout

    def dbg_header(self, input_id: int) -> None:
        """ Print a banner with the ID of the input whose trace follows """
        if not __debug__:
            return
        if self._conf.dbg_model and self._conf.dbg_model_print_id:
            print(f"\n                     ##### Input {input_id} #####")

    def dbg_mem_access(self, is_store: bool, value: int, address: int, size: int,
                       model: UnicornModel, layout: SandboxLayout) -> None:
        """
        Report a single memory access performed by the model, if debugging is enabled.
        The printed line contains:
            - Type of access (load or store)
            - Memory address, converted to an offset with `layout.data_addr_to_offset`
            - Value being read or written

        :param is_store: True if the access is a store, False if it is a load
        :param value: The value being written; for loads, this argument is ignored and
                      the value is read from the emulator memory instead
        :param address: The address being accessed
        :param size: The size of the memory access
        :param model: The model being debugged
        :param layout: The layout of the model being debugged
        :return: None
        """
        if not __debug__:
            return
        if not self._conf.dbg_model:
            return

        offset = layout.data_addr_to_offset(address)

        if is_store:
            accessed = value
            kind = "store to"
        else:
            raw_bytes = model.emulator.mem_read(address, size)
            accessed = int.from_bytes(raw_bytes, byteorder='little')
            kind = "load from"

        if CONF.color:
            line = f"    > {CYAN}{kind}{COL_RESET} +0x{offset:x} " \
                   f"{CYAN}value {COL_RESET}0x{accessed:x}"
        else:
            line = f"    > {kind} +0x{offset:x} value 0x{accessed:x}"
        print(line)

    def dbg_instruction(self, pc: int, model: UnicornModel, state: ModelExecutionState,
                        speculator: UnicornSpeculator) -> None:
        """
        Report the instruction at `pc`, if debugging is enabled.
        The report contains:
          - The code offset of the instruction and its textual form
          - A marker for transient (speculative) instructions with the nesting level
          - A marker for the test case exit address
          - The current register values (printed by the model on a separate line)
        """
        if not __debug__:
            return
        if not self._conf.dbg_model:
            return

        # Gather everything that goes into the report
        text = str(state.current_instruction)
        offset = model.layout.code_addr_to_offset(pc)
        at_exit = state.is_exit_addr(pc)
        transient = speculator.in_speculation()
        depth = speculator.nesting()

        # Assemble the line: "<offset>: [transient marker] <instruction> [exit marker]"
        if CONF.color:
            text = (YELLOW if transient else GREEN) + text + COL_RESET
        marker = f"[transient, nesting = {depth}] " if transient else ""
        suffix = " [test_case_exit]" if at_exit else ""
        print(f"0x{offset:<2x}: {marker}{text}{suffix}")

        # The register dump is delegated to the model
        model.print_registers(oneline=True)

    def dbg_rollback(self, address: int) -> None:
        """
        Report that the model has rolled back to `address`; the address is printed
        relative to the code start of the layout stored via `set_model_layout`.
        """
        if not __debug__:
            return
        if not self._conf.dbg_model:
            return

        layout = self.model_layout
        assert layout is not None
        text = f"ROLLBACK to 0x{address - layout.code_start():x}"
        print(YELLOW + text + COL_RESET if CONF.color else text)

    def dbg_exception(self, errno: int, descr: str) -> None:
        """ Report that an exception with the given number and description has occurred """
        if not __debug__:
            return
        if not self._conf.dbg_model:
            return

        text = f"EXCEPTION #{errno}: {descr}"
        print(RED + text + COL_RESET if CONF.color else text)


class GeneratorLogger:
    """ Logging services for the Program Generator module """

    def __init__(self) -> None:
        self._conf = _LoggingConfig()

    def dbg_dump_instruction_pool(self, instructions: List[InstructionSpec]) -> None:
        """
        Dump the instruction pool of the Program Generator, if debugging is enabled.
        Instruction names are de-duplicated, grouped by category (in the order in which
        the categories first appear), and printed sorted within each category.
        """
        if not __debug__:
            return
        if not (self._conf.dbg_generator and CONF.is_generation_enabled()):
            return

        # category -> unique instruction names
        pool: Dict[str, Set[str]] = {}
        for spec in instructions:
            pool.setdefault(spec.category, set()).add(spec.name)
        total = sum(map(len, pool.values()))

        dbg("generator", f"Instructions under test {total}:")
        for category, names in pool.items():
            print("  - " + category + ": " + pformat(sorted(names), indent=4, compact=True))
        print("")


class ExecutorLogger:
    """ Logging services for the Executor module """

    def __init__(self) -> None:
        self._conf = _LoggingConfig()

    def dbg_dump_raw_traces(self, htraces: List[HTrace]) -> None:
        """
        Dump the raw traces collected by the executor, one after another, each
        prefixed with the zero-padded position of the trace in `htraces`.
        Nothing is printed unless dbg_executor_raw is set in the logging configuration.
        """
        if not (__debug__ and self._conf.dbg_executor_raw):
            return

        print("Collected raw traces:")
        for position, trace in enumerate(htraces):
            print(trace.full_str(f"{position:03}, "))


class ISALogger:
    """ Logging services for the isa_spec module """

    def __init__(self) -> None:
        self._conf = _LoggingConfig()

    def dbg_dump_filtering_reason(self, instruction: InstructionSpec, reason: str) -> None:
        """
        Report why the ISA module filtered out the given instruction.
        The message is emitted only when dbg_isa_filter is set and generation is enabled.
        """
        if not __debug__:
            return
        if not (self._conf.dbg_isa_filter and CONF.is_generation_enabled()):
            return

        message = f"{instruction.name} ({instruction.category}) filtered out: {reason}"
        dbg("isa_spec", message)


================================================
FILE: rvzr/model.py
================================================
"""
File: Model Interface (Backend- and ISA-independent)
      A model is a module that can execute a test case according to a contract
      and collect contract traces.

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from __future__ import annotations
from abc import ABC, abstractmethod
from typing import List, Tuple, TYPE_CHECKING, Any

from .traces import CTrace
from .tc_components.test_case_data import InputData, InputTaint

if TYPE_CHECKING:
    from .sandbox import SandboxLayout, BaseAddrTuple
    from .tc_components.test_case_code import TestCaseProgram


class Model(ABC):
    """
    Common abstract interface of all contract models.
    Concrete implementations are specific to the selected backend and the target ISA.
    """

    layout: SandboxLayout
    """ Memory layout, within the model, of the test case that was loaded last """

    is_speculative: bool
    """ True if the model implements some form of speculative execution """

    _enable_mismatch_check_mode: bool = False
    """ When True, the model returns GPR values in place of contract traces;
    this mode is used to check for mismatches between the model and the executor """

    @abstractmethod
    def __init__(self,
                 bases: BaseAddrTuple,
                 *args: Any,
                 enable_mismatch_check_mode: bool = False) -> None:
        pass

    @abstractmethod
    def load_test_case(self, test_case: TestCaseProgram) -> None:
        """
        Load the given test case into the model. This implies allocating memory for
        the code and data, initializing permissions, and doing other necessary setup.

        `trace_test_case` *must not* be called before this method.
        """

    @abstractmethod
    def trace_test_case(self, inputs: List[InputData], nesting: int) -> List[CTrace]:
        """
        Run the previously loaded test case in the model once per given input and
        return the collected traces (i.e., one trace per input).
        """

    @abstractmethod
    def trace_test_case_with_taints(self, inputs: List[InputData],
                                    nesting: int) -> Tuple[List[CTrace], List[InputTaint]]:
        """
        Run the previously loaded test case in the model once per given input and
        return the collected traces (i.e., one trace per input) together with
        the taints collected for each input during the execution.
        """

    @abstractmethod
    def report_coverage(self, path: str) -> None:
        """
        Produce a report of the coverage of the fuzzing campaign w.r.t. the model,
        and store it in the file at the given path.
        """


class DummyModel(Model):
    """
    A no-op implementation of the Model interface. Every trace it produces is empty,
    hence all inputs end up in the same equivalence class.

    Use it for testing, or when the fuzzer has to run without a model
    (e.g., for standalone hardware tracing).
    """
    is_speculative: bool = False

    def __init__(self,
                 bases: BaseAddrTuple,
                 *args: Any,
                 enable_mismatch_check_mode: bool = False) -> None:
        # Intentionally empty: the dummy model keeps no state
        pass

    def load_test_case(self, test_case: TestCaseProgram) -> None:
        # Intentionally empty: there is nothing to load
        pass

    def trace_test_case(self, inputs: List[InputData], nesting: int) -> List[CTrace]:
        empty_traces: List[CTrace] = []
        for _ in inputs:
            empty_traces.append(CTrace.empty_trace())
        return empty_traces

    def trace_test_case_with_taints(self, inputs: List[InputData],
                                    nesting: int) -> Tuple[List[CTrace], List[InputTaint]]:
        # One default-constructed taint and one empty trace per input
        empty_taints: List[InputTaint] = []
        for _ in inputs:
            empty_taints.append(InputTaint())
        empty_traces: List[CTrace] = []
        for _ in inputs:
            empty_traces.append(CTrace.empty_trace())
        return empty_traces, empty_taints

    def report_coverage(self, path: str) -> None:
        # Intentionally empty: the dummy model does not track coverage
        pass


================================================
FILE: rvzr/model_dynamorio/Makefile
================================================
# Build and installation of the DynamoRIO model backend:
#   download_dr - fetch the pinned DynamoRIO release and generate a `drrun` wrapper script
#   backend     - build the DynamoRIO client (libdr_model.so) and copy it next to the wrapper
#   adapter     - build and install the test case adapter
mkfile_path = $(abspath $(lastword $(MAKEFILE_LIST)))
current_dir = $(dir $(mkfile_path))

dr_path := $(HOME)/.local/dynamorio/
model_path := $(HOME)/.local/dynamorio/model/

release := 11.2.0

CMAKE_FLAGS := -DCMAKE_EXPORT_COMPILE_COMMANDS=ON

.PHONY: all download_dr backend adapter clean-backend clean-adapter clean

all: download_dr backend adapter

download_dr: $(dr_path)/drrun
	@echo "DynamoRIO is downloaded and ready to use."

# The wrapper script is written last, so its presence marks a completed download.
# "$$@" (i.e., "$@" in the generated script) forwards the arguments to the real drrun
# verbatim; an unquoted $@ would re-split arguments that contain whitespace.
$(dr_path)/drrun:
	mkdir -p $(dr_path)
	wget https://github.com/DynamoRIO/dynamorio/releases/download/release_$(release)/DynamoRIO-Linux-$(release).tar.gz -O $(dr_path)/DynamoRIO-Linux-$(release).tar.gz
	tar xf $(dr_path)/DynamoRIO-Linux-$(release).tar.gz -C $(dr_path)
	rm $(dr_path)/DynamoRIO-Linux-$(release).tar.gz
	echo "#!/usr/bin/env bash" > $(dr_path)/drrun
	echo '$(dr_path)/DynamoRIO-Linux-$(release)/bin64/drrun -disable_traces "$$@"' >> $(dr_path)/drrun
	chmod +x $(dr_path)/drrun

# Recursive builds go through $(MAKE) so that command-line flags (-j, -n, ...) and
# the jobserver are propagated to the sub-make.
backend:
	mkdir -p $(current_dir)/backend/build
	cd $(current_dir)/backend/build && cmake $(CMAKE_FLAGS) -DDynamoRIO_DIR=$(dr_path)/DynamoRIO-Linux-$(release)/cmake -D CMAKE_BUILD_TYPE=Debug  $(current_dir)/backend
	$(MAKE) -C $(current_dir)/backend/build
	cp $(current_dir)/backend/build/libdr_model.so $(dr_path)

adapter:
	mkdir -p $(current_dir)/adapter/build
	cd $(current_dir)/adapter/build && cmake $(CMAKE_FLAGS) $(current_dir)/adapter
	$(MAKE) -C $(current_dir)/adapter/build
	$(MAKE) -C $(current_dir)/adapter/build install

clean-backend:
	rm -rf $(current_dir)/backend/build

clean-adapter:
	rm -rf $(current_dir)/adapter/build

clean:  clean-backend clean-adapter

# * build dr_model

# ```
# cd adapters
# make example
# drrun -c ~/.local/dr_model/libdr_model.so --tracer ct --disable-normalization -- ./example 2
# ```


================================================
FILE: rvzr/model_dynamorio/__init__.py
================================================


================================================
FILE: rvzr/model_dynamorio/adapter/.clang-format
================================================
ColumnLimit: 100
IndentWidth: 4
BreakBeforeBraces: Linux
AllowShortIfStatementsOnASingleLine: false
AlignConsecutiveMacros:
  Enabled: true
  AcrossEmptyLines: false
  AcrossComments: false


================================================
FILE: rvzr/model_dynamorio/adapter/.clang-tidy
================================================
Checks: >
    -*,
    bugprone-*,
    cert-*,
    clang-analyzer-*,
    llvm-*,
    misc-*,
    modernize-*,
    performance-*,
    portability-*,
    readability-*,
    -clang-analyzer-security.insecureAPI.DeprecatedOrUnsafeBufferHandling,
    -misc-include-cleaner,
    -cert-err33-c,
    -llvm-header-guard,
    -clang-analyzer-unix.StdCLibraryFunctions,
    -clang-analyzer-optin.taint.TaintedAlloc,
    -clang-analyzer-security.MmapWriteExec

# Turn all the warnings from the checks above into errors.
WarningsAsErrors: "*"


================================================
FILE: rvzr/model_dynamorio/adapter/CMakeLists.txt
================================================
cmake_minimum_required(VERSION 3.10)
project(adapter C ASM)

# Always build with GDB-friendly debug information
set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -ggdb")

# C sources of the adapter
set(SRC_FILES main.c parser.c sandbox.c)

# Assembly sources of the adapter
set(SRC_FILES_ASM test_case_entry.S)

# The adapter executable; headers are looked up next to the sources
add_executable(adapter ${SRC_FILES} ${SRC_FILES_ASM})
target_include_directories(adapter PRIVATE ${CMAKE_CURRENT_SOURCE_DIR})
target_link_libraries(adapter rt)

# `make install` places the executable into the per-user DynamoRIO directory
install(TARGETS adapter DESTINATION $ENV{HOME}/.local/dynamorio)


================================================
FILE: rvzr/model_dynamorio/adapter/main.c
================================================
///
/// File: Module responsible for loading binary test cases produced by
///       the Revizor generator, and executing them in a sandboxed environment
///       that mirrors the one used by x86 executor.
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#include <assert.h>
#include <stdint.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <unistd.h>

#include "parser.h"
#include "rcbf.h"
#include "rdbf.h"
#include "sandbox.h"

static const char *rcbf_file = NULL;
static const char *rdbf_file = NULL;
static const char *bases_file = NULL;

// Defined in test_case_entry.S
void test_case_entry_outer(uint8_t *main_area_base, uint8_t *code_base);

/// @brief Parse the command line and store the three file paths in the module-level
///        variables rcbf_file, rdbf_file, and bases_file
/// @param argc Number of command-line arguments (must be 4, including the program name)
/// @param argv Command-line arguments: <RCBF file> <RDBF file> <bases_file>
/// @return 0 on success, -1 if the argument count is wrong or any of the files is missing
static int parse_args(int argc, char const *argv[])
{
    // Exactly three positional arguments are expected after the program name
    if (argc != 4) {
        printf("Usage: %s <RCBF file> <RDBF file> <bases_file>\n", argv[0]);
        return -1;
    }

    rcbf_file = argv[1];
    rdbf_file = argv[2];
    bases_file = argv[3];

    // All three files must already exist, including the (output) bases file
    if (access(rcbf_file, F_OK) != 0) {
        fprintf(stderr, "ERROR: RCBF file %s does not exist\n", rcbf_file);
        return -1;
    }

    if (access(rdbf_file, F_OK) != 0) {
        fprintf(stderr, "ERROR: RDBF file %s does not exist\n", rdbf_file);
        return -1;
    }

    if (access(bases_file, F_OK) != 0) {
        fprintf(stderr, "ERROR: Bases file %s does not exist\n", bases_file);
        return -1;
    }

    return 0;
}

/// @brief Release the parsed test case representations owned by main()
/// @param rcbf Parsed RCBF structure (test case code), as returned by parse_rcbf
/// @param rdbf Parsed RDBF structure (test case inputs), as returned by parse_rdbf
/// @return void
static void cleanup(rcbf_t *rcbf, rdbf_t *rdbf)
{
    // The two structures are independent; each one is released by its own parser routine
    free_rcbf(rcbf);
    free_rdbf(rdbf);
}

/// @brief Entry point of the adapter: load a test case (RCBF) and its inputs (RDBF) into
///        the sandbox, write the sandbox base addresses into the bases file, and execute
///        the test case once per input
/// @param argc Number of command-line arguments
/// @param argv Command-line arguments: <RCBF file> <RDBF file> <bases_file>
/// @return 0 on success, -1 on any failure
int main(int argc, char const *argv[])
{
    // Parse CLI arguments
    if (parse_args(argc, argv) != 0) {
        return -1;
    }

    // Parse input files (the parsers terminate the process on malformed files)
    rcbf_t *rcbf_data = parse_rcbf(rcbf_file);
    rdbf_t *rdbf_data = parse_rdbf(rdbf_file);
    if (rcbf_data->header.n_actors != rdbf_data->header.n_actors) {
        fprintf(stderr, "ERROR: RCBF and RDBF files have different number of actors\n");
        cleanup(rcbf_data, rdbf_data);
        return -1;
    }

    // Allocate memory for the sandbox and load code
    if (allocate_sandbox(rcbf_data->header.n_actors) != 0) {
        fprintf(stderr, "ERROR: Failed to allocate memory for the sandbox\n");
        cleanup(rcbf_data, rdbf_data);
        return -1;
    }
    if (load_code_in_sandbox(rcbf_data) != 0) {
        fprintf(stderr, "ERROR: Failed to load code into the sandbox\n");
        cleanup(rcbf_data, rdbf_data);
        return -1;
    }

    // Communicate sandbox base addresses to the python model, in binary format:
    // the code base pointer followed by the data base pointer
    sandbox_t *sandbox = get_sandbox();
    FILE *bases_fp = fopen(bases_file, "wb");
    if (bases_fp == NULL) {
        perror("fopen:bases_file");
        cleanup(rcbf_data, rdbf_data);
        return -1;
    }
    size_t n_written = fwrite((const void *)&sandbox->code, sizeof(uint8_t *), 1, bases_fp);
    n_written += fwrite((const void *)&sandbox->data, sizeof(uint8_t *), 1, bases_fp);
    // fclose flushes the stream; a failure here means the reader could see a truncated file
    const int close_status = fclose(bases_fp);
    if (n_written != 2 || close_status != 0) {
        fprintf(stderr, "ERROR: Failed to write sandbox base addresses to %s\n", bases_file);
        cleanup(rcbf_data, rdbf_data);
        return -1;
    }

    // load_data_in_sandbox takes the input index as an int; reject counts that do not fit
    const uint64_t n_inputs = rdbf_data->header.n_inputs;
    if (n_inputs > (uint64_t)INT32_MAX) {
        fprintf(stderr, "ERROR: Too many inputs in the RDBF file\n");
        cleanup(rcbf_data, rdbf_data);
        return -1;
    }

    // Load data into the sandbox and execute the test case
    for (uint64_t input_id = 0; input_id < n_inputs; input_id++) {
        if (load_data_in_sandbox(rdbf_data, (int)input_id) != 0) {
            fprintf(stderr, "ERROR: Failed to load data into the sandbox\n");
            cleanup(rcbf_data, rdbf_data);
            return -1;
        }
        test_case_entry_outer(&sandbox->data->main_area[0], &sandbox->code->code[0]);
    }

    cleanup(rcbf_data, rdbf_data);
    return 0;
}


================================================
FILE: rvzr/model_dynamorio/adapter/parser.c
================================================
///
/// File: RCBF and RDBF parsing functions for the DynamoRIO backend adapter
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#include <stdio.h>
#include <stdlib.h>

#include "rcbf.h"
#include "rdbf.h"
#include "sandbox_const.h"

/// @brief Parse the file in RCBF format and return
///        pointer to the parsed data
/// @param filename The name of the file to parse
/// @return Pointer to the parsed data
rcbf_t *parse_rcbf(const char *filename)
{
    // Open the file in binary mode
    FILE *rdbf_fp = fopen(filename, "rb");
    if (rdbf_fp == NULL) {
        perror("fopen:parse_rcbf");
        exit(EXIT_FAILURE);
    }

    // Allocate memory for the RCBF structure
    rcbf_t *rcbf = (rcbf_t *)malloc(sizeof(rcbf_t));
    if (rcbf == NULL) {
        perror("malloc:rcbf");
        exit(EXIT_FAILURE);
    }

    // Read the header
    if (fread(&rcbf->header, sizeof(rcbf_header_t), 1, rdbf_fp) != 1) {
        perror("fread:rcbf->header");
        exit(EXIT_FAILURE);
    }
    uint64_t n_actors = rcbf->header.n_actors;
    if (n_actors <= 0 || n_actors > MAX_ACTORS) {
        fprintf(stderr, "ERROR: invalid number of actors in the RCBF file\n");
        exit(EXIT_FAILURE);
    }
    uint64_t n_symbols = rcbf->header.n_symbols;
    if (n_symbols <= 0) {
        fprintf(stderr, "ERROR: invalid number of symbols in the RCBF file\n");
        exit(EXIT_FAILURE);
    }

    // Allocate memory for the actor table and read it
    rcbf->actor_table = (actor_metadata_t *)malloc(n_actors * sizeof(actor_metadata_t));
    if (rcbf->actor_table == NULL) {
        perror("malloc:rcbf->actor_table");
        exit(EXIT_FAILURE);
    }
    if (fread(rcbf->actor_table, sizeof(actor_metadata_t), n_actors, rdbf_fp) != n_actors) {
        perror("fread:rcbf->actor_table");
        exit(EXIT_FAILURE);
    }

    // Allocate memory for the symbol table and read it
    rcbf->symbol_table = (symbol_entry_t *)malloc(n_symbols * sizeof(symbol_entry_t));
    if (rcbf->symbol_table == NULL) {
        perror("malloc:rcbf->symbol_table");
        exit(EXIT_FAILURE);
    }
    if (fread(rcbf->symbol_table, sizeof(symbol_entry_t), n_symbols, rdbf_fp) != n_symbols) {
        perror("fread:rcbf->symbol_table");
        exit(EXIT_FAILURE);
    }

    // Allocate memory for the section metadata and read it
    rcbf->section_metadata =
        (code_section_metadata_t *)malloc(n_actors * sizeof(code_section_metadata_t));
    if (rcbf->section_metadata == NULL) {
        perror("malloc:rcbf->section_metadata");
        exit(EXIT_FAILURE);
    }
    if (fread(rcbf->section_metadata, sizeof(code_section_metadata_t), n_actors, rdbf_fp) !=
        n_actors) {
        perror("fread:rcbf->section_metadata");
        exit(EXIT_FAILURE);
    }

    // Allocate memory for the code sections and read it
    rcbf->sections = (rcbf_code_section_t *)malloc(n_actors * sizeof(rcbf_code_section_t));
    if (rcbf->sections == NULL) {
        perror("malloc:rcbf->sections");
        exit(EXIT_FAILURE);
    }
    for (uint64_t i = 0; i < n_actors; i++) {
        if (fread(rcbf->sections[i].code, 1, rcbf->section_metadata[i].size, rdbf_fp) !=
            rcbf->section_metadata[i].size) {
            perror("fread:rcbf->sections");
            exit(EXIT_FAILURE);
        }
    }

    // Close the file
    fclose(rdbf_fp);

    return rcbf;
}

/// @brief Free the memory allocated for the RCBF structure, including
///        all of its tables and code sections
/// @param rcbf The RCBF structure to free; NULL is accepted and ignored, like in free()
void free_rcbf(rcbf_t *rcbf)
{
    if (rcbf == NULL) {
        return;
    }
    free(rcbf->actor_table);
    free(rcbf->symbol_table);
    free(rcbf->section_metadata);
    free(rcbf->sections);
    free(rcbf);
}

/// @brief Parse the file in RDBF format and return pointer to the parsed data
/// @param filename The name of the file to parse
/// @return Pointer to the parsed data
rdbf_t *parse_rdbf(const char *filename)
{
    // Open the file in binary mode
    FILE *rdbf_fp = fopen(filename, "rb");
    if (rdbf_fp == NULL) {
        perror("fopen:parse_rdbf");
        exit(EXIT_FAILURE);
    }

    // Allocate memory for the RDBF structure
    rdbf_t *rdbf = (rdbf_t *)malloc(sizeof(rdbf_t));
    if (rdbf == NULL) {
        perror("malloc:rdbf");
        exit(EXIT_FAILURE);
    }

    // Read the header
    if (fread(&rdbf->header, sizeof(rdbf_header_t), 1, rdbf_fp) != 1) {
        perror("fread:rdbf->header");
        exit(EXIT_FAILURE);
    }
    uint64_t n_actors = rdbf->header.n_actors;
    uint64_t n_inputs = rdbf->header.n_inputs;

    // Allocate memory for the data section metadata and read it
    rdbf->metadata = (data_section_metadata_t *)malloc(n_actors * sizeof(data_section_metadata_t));
    if (rdbf->metadata == NULL) {
        perror("malloc:rdbf->metadata");
        exit(EXIT_FAILURE);
    }
    if (fread(rdbf->metadata, sizeof(data_section_metadata_t), n_actors, rdbf_fp) != n_actors) {
        perror("fread:rdbf->metadata");
        exit(EXIT_FAILURE);
    }

    // Allocate memory for the data sections and read them
    uint64_t data_size = n_inputs * n_actors * sizeof(rdbf_data_section_t);
    rdbf->data = (rdbf_data_section_t *)malloc(data_size);
    if (rdbf->data == NULL) {
        perror("malloc:rdbf->data");
        exit(EXIT_FAILURE);
    }
    if (fread(rdbf->data, 1, data_size, rdbf_fp) != data_size) {
        perror("fread:rdbf->data");
        exit(EXIT_FAILURE);
    }

    // By this point the whole file should be read
    if (fgetc(rdbf_fp) != EOF) {
        fprintf(stderr, "ERROR: unexpected file format of the RDBF file\n");
        exit(EXIT_FAILURE);
    }

    // Close the file
    fclose(rdbf_fp);

    return rdbf;
}

/// @brief Free the memory allocated for the RDBF structure, including
///        its metadata table and data sections
/// @param rdbf The RDBF structure to free; NULL is accepted and ignored, like in free()
void free_rdbf(rdbf_t *rdbf)
{
    if (rdbf == NULL) {
        return;
    }
    free(rdbf->metadata);
    free(rdbf->data);
    free(rdbf);
}


================================================
FILE: rvzr/model_dynamorio/adapter/parser.h
================================================
/// File: Interface to the RCBF/RDBF parser
///
/// Copyright (C) Microsoft Corporation
/// SPDX-License-Identifier: MIT

#ifndef PARSER_H
#define PARSER_H

#include "rcbf.h"
#include "rdbf.h"

/// Parse a file in the RCBF format (test case code); the result is heap-allocated
/// and must be released with free_rcbf
rcbf_t *parse_rcbf(const char *filename);
/// Release a structure returned by parse_rcbf, including the tables it points to
void free_rcbf(rcbf_t *rcbf);

/// Parse a file in the RDBF format (test case inputs); the result is heap-allocated
/// and must be released with free_rdbf
rdbf_t *parse_rdbf(const char *filename);
/// Release a structure returned by parse_rdbf, including the tables it points to
void free_rdbf(rdbf_t *rdbf);

#endif // PARSER_H


================================================
FILE: rvzr/model_dynamorio/adapter/rcbf.h
================================================
/// File: Representation of a RCBF binary
/// (see docs/devel/binary-formats.md for format description)
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#ifndef RCBF_H
#define RCBF_H

#include <stdbool.h>
#include <stddef.h>
#include <stdint.h>

// Execution mode of an actor
// NOTE(review): presumably the values stored in actor_metadata_t.mode - confirm
enum {
    MODE_HOST = 0,
    MODE_GUEST = 1,
};

// Privilege level of an actor
// NOTE(review): presumably the values stored in actor_metadata_t.pl - confirm
enum {
    PL_KERNEL = 0,
    PL_USER = 1,
};

// Capacity, in bytes, of the buffer that holds the code of one section
#define MAX_SECTION_SIZE 4096

// File header; it is the first record read from an RCBF file
typedef struct {
    uint64_t n_actors;  // number of entries in the actor table, section metadata, and sections
    uint64_t n_symbols; // number of entries in the symbol table
} rcbf_header_t;

// One entry of the actor table
typedef struct {
    uint64_t actor_id;
    uint64_t mode;
    uint64_t pl;
    uint64_t data_permissions;
    uint64_t data_ept_properties;
    uint64_t code_permissions;
} actor_metadata_t;

// One entry of the symbol table
typedef struct {
    uint64_t section_id;
    uint64_t offset;
    uint64_t symbol_id;
    uint64_t args;
} symbol_entry_t;

// Metadata of one code section
typedef struct {
    uint64_t section_id;
    uint64_t size; // number of code bytes stored in the file for this section
    uint64_t reserved;
} code_section_metadata_t;

// In-memory buffer for the code of one section; only the first `size` bytes
// (see code_section_metadata_t) are read from the file
typedef struct {
    char code[MAX_SECTION_SIZE];
} rcbf_code_section_t;

// Parsed representation of an RCBF file; the pointed-to tables are heap-allocated
// by parse_rcbf and released by free_rcbf
typedef struct {
    rcbf_header_t header;
    actor_metadata_t *actor_table;             // header.n_actors entries
    symbol_entry_t *symbol_table;              // header.n_symbols entries
    code_section_metadata_t *section_metadata; // header.n_actors entries
    rcbf_code_section_t *sections;             // header.n_actors entries
} rcbf_t;

extern rcbf_t *test_case_code;

#endif // RCBF_H


================================================
FILE: rvzr/model_dynamorio/adapter/rdbf.h
================================================
/// File: Representation of a RDBF binary
/// (see docs/devel/binary-formats.md for format description)
///
/// Copyright (C) Microsoft Corporation
/// SPDX-License-Identifier: MIT

#ifndef RDBF_H
#define RDBF_H

#include <stdint.h>

// Size, in bytes, of each area within a data section stored in an RDBF file
#define RDBF_AREA_SIZE 4096

// File header; it is the first record read from an RDBF file
typedef struct {
    uint64_t n_actors; // number of metadata entries; also the number of data sections per input
    uint64_t n_inputs; // number of inputs stored in the file
} rdbf_header_t;

// Metadata of one data section
typedef struct {
    uint64_t size;
    uint64_t reserved;
} data_section_metadata_t;

// Contents of one data section as stored in the file; each area is copied
// into the sandbox area of the corresponding name by load_data_in_sandbox
typedef struct {
    char main_area[RDBF_AREA_SIZE];
    char faulty_area[RDBF_AREA_SIZE];
    char reg_init_region[RDBF_AREA_SIZE];
} rdbf_data_section_t;

// Parsed representation of an RDBF file; the pointed-to tables are heap-allocated
// by parse_rdbf and released by free_rdbf
typedef struct {
    rdbf_header_t header;
    data_section_metadata_t *metadata; // header.n_actors entries
    rdbf_data_section_t *data;         // header.n_inputs * header.n_actors entries
} rdbf_t;

extern rdbf_t *input_sequence;

#endif // RDBF_H


================================================
FILE: rvzr/model_dynamorio/adapter/sandbox.c
================================================
/// File: Allocation and management of the sandbox memory for test cases
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#include <stdlib.h>
#include <string.h>
#include <sys/mman.h>

#include "rcbf.h"
#include "rdbf.h"
#include "sandbox.h"

// The single sandbox instance of the process; set by allocate_sandbox
static sandbox_t *sandbox;
// Byte used to fill the parts of the code sections not occupied by the test case
static const int nop_opcode = 0x90;
// Byte appended after the code of section 0 so that the test case returns to its caller
static const int ret_opcode = 0xc3;

// Masks applied to the initial EFLAGS value as (value & clear_mask) | set_mask.
// Despite its name, eflags_must_clear_mask (2263 == 0x8D7) selects the bits that are
// *kept*; every bit outside of the mask is cleared.
// NOTE(review): 0x8D7 looks like the x86 status flags CF|PF|AF|ZF|SF|OF plus bit 1, and
// eflags_must_set_mask like the always-one reserved bit 1 - confirm against the SDM
static const int eflags_must_clear_mask = 2263;
static const int eflags_must_set_mask = 2;

// Defined in test_case_entry.S
void test_case_entry(uint8_t *main_area_base);

/// @brief Load a test case code into the sandbox. The code of every section is copied
///        to the start of the corresponding sandbox code section, and the rest of
///        the section is filled with NOPs. The code of section 0 is additionally
///        terminated with a RET instruction, which serves as the test case exit point.
/// @param rcbf_data Parsed RCBF data
/// @return 0 on success; -1 if the sandbox is not allocated, rcbf_data is NULL, or
///         a section does not fit into the sandbox (sections preceding the offending
///         one are already loaded at that point)
int load_code_in_sandbox(rcbf_t *rcbf_data)
{
    if (sandbox == NULL || rcbf_data == NULL) {
        return -1;
    }

    for (uint64_t section_id = 0; section_id < rcbf_data->header.n_actors; section_id++) {
        code_section_t *code_section = &sandbox->code[section_id];

        // The size originates from the RCBF file; make sure that it exceeds neither
        // the source buffer nor the destination (incl. the RET appended to section 0)
        size_t code_size = (size_t)rcbf_data->section_metadata[section_id].size;
        size_t required_size = code_size + ((section_id == 0) ? 1 : 0);
        if (code_size > (size_t)MAX_SECTION_SIZE ||
            required_size > (size_t)MAX_EXPANDED_SECTION_SIZE) {
            return -1;
        }

        // Copy the code into the sandbox
        memcpy(code_section->code, rcbf_data->sections[section_id].code, code_size);

        // The end of the code section in the main area is the test case exit point;
        // We insert a RETQ instruction to return to the caller
        if (section_id == 0) {
            code_section->code[code_size] = (uint8_t)ret_opcode;
            code_size++;
        }

        // Initialize the remaining space with NOPs
        size_t uninitialized_size = (size_t)MAX_EXPANDED_SECTION_SIZE - code_size;
        memset(code_section->code + code_size, nop_opcode, uninitialized_size);
        memset(code_section->unused, nop_opcode, MACRO_AREA_SIZE);
    }

    return 0;
}

/// @brief Load a test case data into the sandbox. For every actor, the main, faulty,
///        and register initialization areas are copied from the selected input, and
///        the macro stack and the underflow/overflow pads are zeroed.
/// @param rdbf_data Parsed RDBF data
/// @param input_id Index of the input to load from the RDBF data
/// @return 0 on success; -1 if the sandbox is not allocated, rdbf_data is NULL, or
///         input_id is out of range
int load_data_in_sandbox(rdbf_t *rdbf_data, int input_id)
{
    if (sandbox == NULL || rdbf_data == NULL) {
        return -1;
    }
    if (input_id < 0 || (uint64_t)input_id >= rdbf_data->header.n_inputs) {
        return -1;
    }

    // rdbf_data->data is a flat array of n_inputs * n_actors sections.
    // NOTE(review): the sections are assumed to be stored input by input (all actors of
    // input 0, then all actors of input 1, ...) - confirm against the RDBF writer.
    // With a single actor this is the same element as data[input_id].
    const uint64_t n_actors = rdbf_data->header.n_actors;
    rdbf_data_section_t *data = &rdbf_data->data[(uint64_t)input_id * n_actors];

    for (uint64_t section_id = 0; section_id < n_actors; section_id++) {
        data_section_t *data_section = &sandbox->data[section_id];

        // Zero out the macro stack and the underflow and overflow pads
        memset(data_section->macro_stack, 0, MACRO_STACK_SIZE);
        memset(data_section->underflow_pad, 0, UNDERFLOW_PAD_SIZE);
        memset(data_section->overflow_pad, 0, OVERFLOW_PAD_SIZE);

        // Copy the data into the sandbox
        memcpy(data_section->main_area, data[section_id].main_area, MAIN_AREA_SIZE);
        memcpy(data_section->faulty_area, data[section_id].faulty_area, FAULTY_AREA_SIZE);
        memcpy(data_section->reg_init_area, data[section_id].reg_init_region, REG_INIT_AREA_SIZE);

        // Fixup the EFLAGS init value to ensure we don't set invalid flags:
        // only the bits selected by eflags_must_clear_mask are kept (despite the name,
        // the mask is AND-ed with the value), and the bits in eflags_must_set_mask are set
        uint64_t eflags_value = ((uint64_t *)data_section->reg_init_area)[EFLAGS_INIT_ID];
        eflags_value = (eflags_value & eflags_must_clear_mask) | eflags_must_set_mask;
        ((uint64_t *)data_section->reg_init_area)[EFLAGS_INIT_ID] = eflags_value;
    }

    return 0;
}

/// @brief Get the sandbox instance of this process
/// @return Pointer most recently stored by allocate_sandbox;
///         NULL if no sandbox has been allocated yet
sandbox_t *get_sandbox()
{
    return sandbox;
}

// =================================================================================================
// Constructor and destructor
// =================================================================================================
/// @brief Allocate memory for the sandbox
/// @param n_actors Number of actors in the test case
/// @return -1 on failure, 0 on success
int allocate_sandbox(uint64_t n_actors)
{
    sandbox = (sandbox_t *)malloc(sizeof(sandbox_t));
    if (sandbox == NULL) {
        return -1;
    }

    // Allocate memory for the data and code sections, with page alignment
    sandbox->data = (data_section_t *)aligned_alloc(PAGE_SIZE, n_actors * sizeof(data_section_t));
    if (sandbox->data == NULL) {
        free(sandbox);
        return -1;
    }

    sandbox->code = (code_section_t *) test_case_entry;
    mprotect(sandbox->code, n_actors * sizeof(code_section_t), PROT_READ | PROT_WRITE | PROT_EXEC);

    return 0;
}

/// @brief Free the memory allocated for the sandbox. Calling the function when no sandbox
///        is allocated (or calling it twice) is a no-op. The code sections are not freed,
///        as they are not heap-allocated (see allocate_sandbox).
void free_sandbox()
{
    if (sandbox == NULL) {
        return;
    }
    free(sandbox->data);
    free(sandbox);
    sandbox = NULL; // do not let get_sandbox() return a dangling pointer
}


================================================
FILE: rvzr/model_dynamorio/adapter/sandbox.h
================================================
/// File: Sandbox layout
/// (see docs/sandbox.md for layout description)
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#ifndef SANDBOX_H
#define SANDBOX_H

#include <stdint.h>

#include "rcbf.h"
#include "rdbf.h"
#include "sandbox_const.h"

// =================================================================================================
// Data sections
// =================================================================================================

// Per-actor data section of the sandbox.
// With the sizes from sandbox_const.h, macro_stack + underflow_pad occupy exactly one page,
// main_area and faulty_area one page each, and reg_init_area + overflow_pad one page,
// i.e., the structure spans four pages and main_area starts on a page boundary whenever
// the structure itself is page-aligned.
// The structure is packed so that no compiler padding can shift these offsets.
// IMPORTANT! This structure must match the layout in rvzr/executor_km/include/sandbox_manager.h
typedef struct {
    uint8_t macro_stack[MACRO_STACK_SIZE];     // stack for storing registers when calling macros
    uint8_t underflow_pad[UNDERFLOW_PAD_SIZE]; // zero-initialized region for accidental underflows
    uint8_t main_area[MAIN_AREA_SIZE];         // first input page; does not cause faults
    uint8_t faulty_area[FAULTY_AREA_SIZE];     // second input page; causes a (configurable) fault
    uint8_t reg_init_area[REG_INIT_AREA_SIZE]; // region for initializing registers
    uint8_t overflow_pad[OVERFLOW_PAD_SIZE];   // zero-initialized region for accidental overflows
} __attribute__((packed)) data_section_t;

// =================================================================================================
// Code sections
// =================================================================================================

// Per-actor code section of the sandbox: the test case code followed by an area that is
// unused by this adapter and exists only to keep the layout identical to the kernel module.
// IMPORTANT! This structure must match the layout in rvzr/executor_km/include/sandbox_manager.h
typedef struct {
    uint8_t code[MAX_EXPANDED_SECTION_SIZE];
    uint8_t unused[MACRO_AREA_SIZE]; // unused; mirrors the macro area in sandbox_manager.h
} __attribute__((packed)) code_section_t;

// TEST_CASE_MAX_SIZE is the amount of space reserved for the code sections
// (see test_case_entry.S); make sure it holds exactly MAX_ACTORS code sections.
_Static_assert(MAX_ACTORS * sizeof(code_section_t) == (unsigned long)TEST_CASE_MAX_SIZE,
               "Invalid value of TEST_CASE_MAX_SIZE");

// =================================================================================================
// sandbox_t
// =================================================================================================
// Descriptor of the sandbox: pointers to the arrays of per-actor data and code sections
typedef struct {
    data_section_t *data; // array of data sections (one entry per actor)
    code_section_t *code; // array of code sections (one entry per actor)
} sandbox_t;

// =================================================================================================
// Functions
// =================================================================================================
// Load test case code into the sandbox.
// NOTE(review): presumably copies the sections described by `rcbf_data` into the code
// sections; the implementation is in sandbox.c - confirm there.
int load_code_in_sandbox(rcbf_t *rcbf_data);
// Load the data of one input into the sandbox data sections.
// NOTE(review): `input_id` presumably selects the input within `rdbf_data` - confirm in sandbox.c.
int load_data_in_sandbox(rdbf_t *rdbf_data, int input_id);
// Return the pointer to the global sandbox descriptor.
sandbox_t *get_sandbox();
// Allocate the sandbox for `n_actors` actors; returns 0 on success, -1 on failure.
int allocate_sandbox(uint64_t n_actors);
// Release the memory allocated by allocate_sandbox().
void free_sandbox();

#endif // SANDBOX_H


================================================
FILE: rvzr/model_dynamorio/adapter/sandbox_const.h
================================================
/// File: Constants for the sandbox layout
/// (see docs/sandbox.md for layout description)
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#ifndef SANDBOX_CONST_H
#define SANDBOX_CONST_H

#define PAGE_SIZE 4096U

// layout of data_section_t
// (the two pads are sized so that macro stack + underflow pad, and register init area +
// overflow pad, each fill exactly one page)
#define MACRO_STACK_SIZE   64
#define UNDERFLOW_PAD_SIZE (PAGE_SIZE - MACRO_STACK_SIZE)
#define MAIN_AREA_SIZE     PAGE_SIZE
#define FAULTY_AREA_SIZE   PAGE_SIZE
#define REG_INIT_AREA_SIZE 320 // 8 64-bit GPRs + 8 256-bit YMMs
#define OVERFLOW_PAD_SIZE  (PAGE_SIZE - REG_INIT_AREA_SIZE)

// offsets within a data section, relative to the start of main_area
#define REG_INIT_AREA_SIZE_ALIGNED PAGE_SIZE
#define STACK_OFFSET               (MAIN_AREA_SIZE - 8)
#define REG_INIT_OFFSET            (MAIN_AREA_SIZE + FAULTY_AREA_SIZE)
#define SIMD_INIT_OFFSET           (REG_INIT_OFFSET + 64)

// layout of the register init area: 8-byte slots, indexed by the IDs below
#define GPR_SIZE       8
#define EFLAGS_INIT_ID 6
#define RSP_INIT_ID    7

// layout of code_section_t
#define MAX_ACTORS                16U
#define MAX_EXPANDED_SECTION_SIZE (PAGE_SIZE * 2)
#define MACRO_AREA_SIZE           (PAGE_SIZE)
#define TEST_CASE_MAX_SIZE        (MAX_ACTORS * (MAX_EXPANDED_SECTION_SIZE + MACRO_AREA_SIZE))

#endif // SANDBOX_CONST_H


================================================
FILE: rvzr/model_dynamorio/adapter/test_case_entry.S
================================================
.intel_syntax noprefix

#include "sandbox_const.h"
// Stringification helpers: xstr(X) expands the macro X first and then turns the result into
// a string literal. In this file they are referenced only by the commented-out stack
// pointer initialization in test_case_entry_outer.
#define xstr(s) _str(s)
#define _str(s) str(s)
#define str(s)  #s

// =================================================================================================
.text

/// @brief Placeholder for the test case code; This will be dynamically populated at runtime
///        by sandbox.c
///        At compile time, a zero-filled area of size TEST_CASE_MAX_SIZE is reserved here.
///        The area is page-aligned and located in .text; sandbox.c changes its protection
///        with mprotect so that the test case can be written into it.
/// r15: Address of test case code (test_case_entry_outer transfers control with `call r15`)
.global test_case_entry
.align PAGE_SIZE
test_case_entry:
    .rept TEST_CASE_MAX_SIZE
    .byte 0
    .endr


/// @brief Outer wrapper to set up registers and FLAGS
///        See docs/devel/registers.md for the explanation of the initialized registers
///
///        The wrapper saves FLAGS, rbx, rcx, rdx, r14, r15 and rsp on the stack, initializes
///        FLAGS, six GPRs, mm0-mm7 and ymm0-ymm7 from the register init area of the sandbox,
///        calls the test case, and restores the saved values in reverse order.
///        rax, rsi, rdi and the MMX/YMM registers are overwritten and NOT restored.
/// rdi: Base address of sandbox main_area
/// rsi: Base address of test case code
.global test_case_entry_outer
.align PAGE_SIZE
test_case_entry_outer:
    // Save the state that is restored after the test case returns
    pushfq
    push rbx
    push rcx
    push rdx
    push r14
    push r15
    push rsp

    // Save arguments
    // (rdi and rsi are about to be overwritten with test case inputs)
    mov r14, rdi
    mov r15, rsi

    // Initialize FLAGS
    // (done before the register initialization because it uses rax as a scratch register;
    //  none of the moves below modify FLAGS)
    mov rax, qword ptr [r14 + REG_INIT_OFFSET + EFLAGS_INIT_ID * GPR_SIZE]
    push rax
    popfq

    // Stack pointer
    // push rsp
    // mov rax, qword ptr [r14 + xstr(REG_INIT_OFFSET + RSP_INIT_ID * GPR_SIZE)]
    // mov rsp, rax

    // Initialize registers
    // (slots 0-5 of the register init area; slot 6 holds FLAGS, see above)
    mov rax, qword ptr [r14 + REG_INIT_OFFSET + 0x00]
    mov rbx, qword ptr [r14 + REG_INIT_OFFSET + 0x08]
    mov rcx, qword ptr [r14 + REG_INIT_OFFSET + 0x10]
    mov rdx, qword ptr [r14 + REG_INIT_OFFSET + 0x18]
    mov rsi, qword ptr [r14 + REG_INIT_OFFSET + 0x20]
    mov rdi, qword ptr [r14 + REG_INIT_OFFSET + 0x28]

    // Initialize MMX registers
    movq mm0, qword ptr [r14 + SIMD_INIT_OFFSET + 0x00]
    movq mm1, qword ptr [r14 + SIMD_INIT_OFFSET + 0x08]
    movq mm2, qword ptr [r14 + SIMD_INIT_OFFSET + 0x10]
    movq mm3, qword ptr [r14 + SIMD_INIT_OFFSET + 0x18]
    movq mm4, qword ptr [r14 + SIMD_INIT_OFFSET + 0x20]
    movq mm5, qword ptr [r14 + SIMD_INIT_OFFSET + 0x28]
    movq mm6, qword ptr [r14 + SIMD_INIT_OFFSET + 0x30]
    movq mm7, qword ptr [r14 + SIMD_INIT_OFFSET + 0x38]

    // Initialize YMM registers (overlap with MMX init values is intentional)
    // NOTE: vmovdqa is the aligned form, so r14 + SIMD_INIT_OFFSET must be 32-byte aligned
    vmovdqa ymm0, ymmword ptr [r14 + SIMD_INIT_OFFSET + 0x00]
    vmovdqa ymm1, ymmword ptr [r14 + SIMD_INIT_OFFSET + 0x20]
    vmovdqa ymm2, ymmword ptr [r14 + SIMD_INIT_OFFSET + 0x40]
    vmovdqa ymm3, ymmword ptr [r14 + SIMD_INIT_OFFSET + 0x60]
    vmovdqa ymm4, ymmword ptr [r14 + SIMD_INIT_OFFSET + 0x80]
    vmovdqa ymm5, ymmword ptr [r14 + SIMD_INIT_OFFSET + 0xa0]
    vmovdqa ymm6, ymmword ptr [r14 + SIMD_INIT_OFFSET + 0xc0]
    vmovdqa ymm7, ymmword ptr [r14 + SIMD_INIT_OFFSET + 0xe0]

    // Transfer control to the test case; r14 still holds the main_area base address
    call r15

    // Restore the saved state (reverse order of the pushes above)
    pop rsp
    pop r15
    pop r14
    pop rdx
    pop rcx
    pop rbx
    popfq

    ret


================================================
FILE: rvzr/model_dynamorio/backend/.clang-format
================================================
ColumnLimit: 100
IndentWidth: 4
BreakBeforeBraces: Linux
AllowShortIfStatementsOnASingleLine: false
AlignConsecutiveMacros:
  Enabled: true
  AcrossEmptyLines: false
  AcrossComments: false


================================================
FILE: rvzr/model_dynamorio/backend/.clang-tidy
================================================
# Reasoning behind excluding some checks:
# - `misc-include-cleaner`: This is incompatible with the DR headers, where dr_api.h is
#   expected to be included in all source files.
# - `modernize-use-trailing-return-type`: This style diverges from the rest of the code base
#   (e.g., the source of `executor_km`), so it is excluded for uniformity.
# - `readability-braces-around-statements`: This style diverges from the rest of the code base
#   (e.g., the source of `executor_km`), so it is excluded for uniformity.
# - `cppcoreguidelines-pro-type-vararg`: Incompatible with the DR API, such as dr_printf
# - `cppcoreguidelines-pro-type-union-access`: Incompatible with dr_mcontext_t
# - `cppcoreguidelines-pro-type-cstyle-cast`: C-style casts are necessary for DR API
# - `misc-non-private-member-variables-in-classes`: Accessors make code unreasonably verbose
# - `cppcoreguidelines-non-private-member-variables-in-classes`: Alias of the above
# - `llvm-header-guard`: Checks for "LLVM-style" include guards, we want to use #pragma once instead
# - `modernize-use-using`: This style diverges from the rest of the code base
# - `readability-convert-member-functions-to-static`: This makes code less uniform with the rest of the code base
# - `bugprone-easily-swappable-parameters`: DR has many C APIs, and this check causes many false positives
# - `performance-enum-size`: The enum size in the backend is often dictated by the serialization formats, and it causes false positives on this check
# - `cppcoreguidelines-avoid-magic-numbers`: Duplicate of readability-magic-numbers; excluded for consistency
Checks: >
    -*,
    bugprone-*,
    cppcoreguidelines-*,
    llvm-*,
    misc-*,
    modernize-*,
    performance-*,
    readability-*,
    -misc-include-cleaner,
    -misc-use-anonymous-namespace,
    -modernize-use-trailing-return-type,
    -readability-braces-around-statements,
    -cppcoreguidelines-pro-type-vararg,
    -cppcoreguidelines-pro-type-union-access,
    -cppcoreguidelines-pro-type-reinterpret-cast,
    -cppcoreguidelines-pro-type-cstyle-cast,
    -performance-no-int-to-ptr,
    -misc-non-private-member-variables-in-classes,
    -cppcoreguidelines-non-private-member-variables-in-classes,
    -llvm-header-guard,
    -modernize-use-using,
    -readability-convert-member-functions-to-static,
    -bugprone-easily-swappable-parameters,
    -performance-enum-size,
    -cppcoreguidelines-avoid-magic-numbers

# Turn all the warnings from the checks above into errors.
WarningsAsErrors: "*"

HeaderFilterRegex: "^backend/include/.*$"

CheckOptions:
    - key: readability-identifier-length.IgnoredVariableNames
      value: "pc|mc|bb|dc|it"
    - key: readability-identifier-length.IgnoredParameterNames
      value: "pc|mc|bb|dc|it"
    - key: bugprone-easily-swappable-parameters.IgnoredParameterNames
      value: '"";drcontext;wrapctx;;user_data;xflags;max_nesting_'
    - key: readability-magic-numbers.IgnoredIntegerValues
      value: '0;1;2;4;8;-1;-0x1ULL'


================================================
FILE: rvzr/model_dynamorio/backend/CMakeLists.txt
================================================
# Build script for the DynamoRIO client (shared library `dr_model`)
cmake_minimum_required(VERSION 3.13)

project(dr_model)

set(CMAKE_CXX_STANDARD 17)
set(CMAKE_CXX_STANDARD_REQUIRED TRUE)
# Emit compile_commands.json in the build directory
set(CMAKE_EXPORT_COMPILE_COMMANDS ON)

# add all C++ files in the current directory
# (as well as the tracer and speculator implementations in the subdirectories)
file(GLOB MAIN_SOURCES "*.cpp")
file(GLOB TRACERS "tracers/*.cpp")
file(GLOB SPECULATORS "speculators/*.cpp")
add_library(dr_model SHARED ${MAIN_SOURCES} ${TRACERS} ${SPECULATORS})

# add `include` directory to the include path
target_include_directories(dr_model PRIVATE ${CMAKE_CURRENT_SOURCE_DIR}/include)

# DynamoRIO provides the configure_DynamoRIO_client and use_DynamoRIO_extension
# commands used below, so the build cannot proceed without it
find_package(DynamoRIO)
if (NOT DynamoRIO_FOUND)
    message(FATAL_ERROR "DynamoRIO package required to build")
endif(NOT DynamoRIO_FOUND)

# Configure the library as a DynamoRIO client and link the DynamoRIO extensions it uses
configure_DynamoRIO_client(dr_model)
use_DynamoRIO_extension(dr_model drmgr)
use_DynamoRIO_extension(dr_model drreg)
use_DynamoRIO_extension(dr_model drutil)
use_DynamoRIO_extension(dr_model drx)
use_DynamoRIO_extension(dr_model drwrap)
use_DynamoRIO_extension(dr_model drsyms)

# Ensure C++17 standard is preserved after DynamoRIO configuration
# (must stay after configure_DynamoRIO_client)
set_target_properties(dr_model PROPERTIES
    CXX_STANDARD 17
    CXX_STANDARD_REQUIRED ON
)


================================================
FILE: rvzr/model_dynamorio/backend/cli.cpp
================================================
///
/// File: Dr. Model Command Line Interface
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#include <algorithm>
#include <cstdint>
#include <string>

#include <dr_api.h> // NOLINT
#include <dr_defines.h>
#include <dr_tools.h>
#include <droption.h>

#include "cli.hpp"
#include "factory.hpp"

using std::string;

using dynamorio::droption::DROPTION_SCOPE_CLIENT;
using dynamorio::droption::droption_t;

// Validators of the parsed arguments (defined at the end of this file);
// each returns false and prints a diagnostic if the arguments are invalid
static bool validate_tracer(cli_args_t *parsed_args);
static bool validate_speculator(cli_args_t *parsed_args);
static bool validate_taint_tracker(cli_args_t *parsed_args);

// Upper bounds accepted by validate_speculator for max-nesting and max-spec-window
static const int max_reasonable_nesting = 100;
static const int max_reasonable_spec_window = 1000;

// =================================================================================================
// List of options
// =================================================================================================
// Command-line options of the client, registered with DynamoRIO's droption parser.
// Constructor arguments of each option: scope, option name, default value,
// short description, long description.
// The values are read by parse_cli() after droption_parser_t::parse_argv() has run.
namespace
{
// clang-format off
// General Configuration

// Mode selector: standalone vs serving as a backend for rvzr
const droption_t<string> op_mode(DROPTION_SCOPE_CLIENT,
                        "mode", "standalone",
                        "Mode of operation: standalone or rvzr",
                        "Mode of operation: "
                        "standalone (default) or rvzr (used as a backend for rvzr)");

// Tracer Configuration
const droption_t<string> op_tracer_name(DROPTION_SCOPE_CLIENT,
                        "tracer", "ct",
                        "Type of the tracer; equivalent to the observation clause of a contract",
                        "Type of the tracer; equivalent to the observation clause of a contract");
const droption_t<string> op_instrumented_func(DROPTION_SCOPE_CLIENT,
                        "instrumented-func", "__libc_start_main",
                        "Name of the function to instrument.",
                        "Name of the function to instrument.");
const droption_t<string> op_trace_output(DROPTION_SCOPE_CLIENT,
                        "trace-output", "rvzr_trace.dat",
                        "Where to save the trace (in binary format).",
                        "Where to save the trace (in binary format).");
const droption_t<bool>  op_print_trace(DROPTION_SCOPE_CLIENT,
                        "print-trace", false,
                        "Dump trace entries to STDOUT while they are being produced.",
                        "Dump trace entries to STDOUT while they are being produced.");

// Debugging
const droption_t<int>    op_log_level(DROPTION_SCOPE_CLIENT,
                        "log-level", 0,
                        "Verbosity level of the debug logger (0 = disabled).",
                        "Verbosity level of the debug logger (0 = disabled).");
const droption_t<string> op_debug_output(DROPTION_SCOPE_CLIENT,
                        "debug-trace-output", "rvzr_dbg_trace.dat",
                        "Where to save the debug log (in binary format).",
                        "Where to save the debug log (in binary format).");
const droption_t<bool>   op_print_dbg_trace(DROPTION_SCOPE_CLIENT,
                        "print-debug-trace", false,
                        "Dump log entries to STDOUT while they are being produced.",
                        "Dump log entries to STDOUT while they are being produced.");

// Speculator Configuration
const droption_t<string> op_speculator_name(DROPTION_SCOPE_CLIENT,
                        "speculator", "seq",
                        "Type of the speculator; equivalent to the execution clause of a contract",
                        "Type of the speculator; equivalent to the execution clause of a contract");
const droption_t<int>    op_max_nesting(DROPTION_SCOPE_CLIENT,
                        "max-nesting", 1,
                        "Maximum number of nested speculations.",
                        "Maximum number of nested speculations.");
const droption_t<int>    op_max_spec_window(DROPTION_SCOPE_CLIENT,
                        "max-spec-window", 250,
                        "Maximum number of speculative instructions.",
                        "Maximum number of speculative instructions.");
// NOTE: 0 doubles as "no poison value"; parse_cli() maps it to an empty value
const droption_t<uint64_t> op_poison_value(DROPTION_SCOPE_CLIENT,
                        "poison-value", 0,
                        "Value to forward on speculative faulty loads. If 0, speculative loads cause a rollback.",
                        "Value to forward on speculative faulty loads. If 0, speculative loads cause a rollback.");

// Taint Tracker Configuration
const droption_t<bool>   op_enable_taint_tracker(DROPTION_SCOPE_CLIENT,
                        "enable-taint-tracker", false,
                        "Enable the taint tracker for contract-based input generation.",
                        "Enable the taint tracker for contract-based input generation.");
const droption_t<string> op_taint_output(DROPTION_SCOPE_CLIENT,
                        "taint-output", "",
                        "Where to save the taint information (in binary format).",
                        "Where to save the taint information (in binary format).");

// Listing Options
const droption_t<bool> op_list_tracers(DROPTION_SCOPE_CLIENT,
                        "list-tracers", false,
                        "List all available tracers (aka, observation clauses).",
                        "List all available tracers (aka, observation clauses).");
const droption_t<bool> op_list_speculators(DROPTION_SCOPE_CLIENT,
                        "list-speculators", false,
                        "List all available speculators (aka execution clauses).",
                        "List all available speculators (aka execution clauses).");
// clang-format on
} // namespace

// =================================================================================================
// CLI parser
// =================================================================================================
void parse_cli(int argc, const char **argv, DR_PARAM_OUT cli_args_t &parsed_args)
{
    // Parse the arguments using DynamoRIO's droption parser
    string err_msg;
    const bool parsed = dynamorio::droption::droption_parser_t::parse_argv(
        DROPTION_SCOPE_CLIENT, argc, argv, &err_msg, nullptr);

    // Print error message and abort if the arguments cannot be parsed
    if (not parsed) {
        dr_printf("Error parsing arguments: %s\n", err_msg.c_str());
        dr_printf(
            "Usage: %s\n",
            dynamorio::droption::droption_parser_t::usage_long(DROPTION_SCOPE_CLIENT).c_str());
        dr_abort();
    }

    // Select overall mode
    const std::string mode_str = op_mode.get_value();
    if (mode_str == "standalone") {
        parsed_args.mode = Mode::STANDALONE;
    } else if (mode_str == "rvzr") {
        parsed_args.mode = Mode::RVZR_BACKEND;
    } else {
        dr_printf("Invalid mode: %s\n", mode_str.c_str());
        dr_abort();
    }

    // Set the parsed arguments
    parsed_args.tracer_type = op_tracer_name.get_value();
    parsed_args.instrumented_func = op_instrumented_func.get_value();
    parsed_args.trace_output = op_trace_output.get_value();
    parsed_args.print_trace = op_print_trace.get_value();
    parsed_args.log_level = op_log_level.get_value();
    parsed_args.debug_output = op_debug_output.get_value();
    parsed_args.print_dbg_trace = op_print_dbg_trace.get_value();
    parsed_args.speculator_type = op_speculator_name.get_value();
    parsed_args.max_nesting = op_max_nesting.get_value();
    parsed_args.max_spec_window = op_max_spec_window.get_value();
    parsed_args.enable_taint_tracker = op_enable_taint_tracker.get_value();
    parsed_args.taint_output = op_taint_output.get_value();
    parsed_args.list_tracers = op_list_tracers.get_value();
    parsed_args.list_speculators = op_list_speculators.get_value();
    uint64_t poison_value = op_poison_value.get_value();
    if (poison_value == 0) {
        parsed_args.poison_value = {};
    } else {
        parsed_args.poison_value = poison_value;
    }

    // Check values
    if (not validate_tracer(&parsed_args)) {
        dr_abort();
    }
    if (not validate_speculator(&parsed_args)) {
        dr_abort();
    }
    if (not validate_taint_tracker(&parsed_args)) {
        dr_abort();
    }
}

// =================================================================================================
// Validators
// =================================================================================================
/// @brief Check that the requested tracer is one of the tracers known to the factory
/// @param parsed_args Parsed command-line arguments
/// @return true if the tracer type is supported; otherwise, false
///         (after printing the list of available tracers)
bool validate_tracer(cli_args_t *parsed_args)
{
    const auto known_tracers = get_tracer_list();
    const bool is_supported = std::find(known_tracers.begin(), known_tracers.end(),
                                        parsed_args->tracer_type) != known_tracers.end();
    if (is_supported) {
        return true;
    }

    // Unknown tracer: tell the user what was requested and what is available
    dr_printf("Invalid tracer type: %s\n", parsed_args->tracer_type.c_str());
    dr_printf("Available tracers: [ ");
    for (const auto &name : known_tracers) {
        dr_printf("%s, ", name.c_str());
    }
    dr_printf("]\n");
    return false;
}

/// @brief Check the speculator-related arguments
///        - the speculator type must be known to the factory;
///        - max_nesting must be within [1, max_reasonable_nesting];
///        - max_spec_window must be within [1, max_reasonable_spec_window].
/// @param parsed_args Parsed command-line arguments
/// @return true if all checks pass; otherwise, false (after printing a diagnostic)
bool validate_speculator(cli_args_t *parsed_args)
{
    // Check if the speculator type is supported
    auto speculator_names = get_speculator_list();
    auto match =
        std::find(speculator_names.begin(), speculator_names.end(), parsed_args->speculator_type);
    if (match == speculator_names.end()) {
        dr_printf("Invalid speculator type: %s\n", parsed_args->speculator_type.c_str());
        dr_printf("Available speculators: [ ");
        for (const auto &spec : speculator_names) {
            dr_printf("%s, ", spec.c_str());
        }
        dr_printf("]\n");
        return false;
    }

    // Check if the maximum nesting level is valid
    // - Negative or zero values have no meaning;
    // - Anything greater than max_reasonable_nesting is unrealistic on modern hardware
    if (parsed_args->max_nesting <= 0) {
        dr_printf("Invalid maximum nesting level: %d\n", parsed_args->max_nesting);
        dr_printf("Maximum nesting level must be greater than 0.\n");
        return false;
    }
    if (parsed_args->max_nesting > max_reasonable_nesting) {
        dr_printf("Invalid maximum nesting level: %d\n", parsed_args->max_nesting);
        // Print the limit from the constant so that the message cannot go out of sync with it
        dr_printf("Maximum nesting level must be less than or equal to %d.\n",
                  max_reasonable_nesting);
        return false;
    }

    // Check if the maximum speculation window is valid
    // - Negative or zero values have no meaning;
    // - Anything greater than max_reasonable_spec_window is unrealistic on modern hardware
    if (parsed_args->max_spec_window <= 0) {
        dr_printf("Invalid maximum speculation window: %d\n", parsed_args->max_spec_window);
        dr_printf("Maximum speculation window must be greater than 0.\n");
        return false;
    }
    if (parsed_args->max_spec_window > max_reasonable_spec_window) {
        dr_printf("Invalid maximum speculation window: %d\n", parsed_args->max_spec_window);
        // Print the limit from the constant so that the message cannot go out of sync with it
        dr_printf("Maximum speculation window must be less than or equal to %d.\n",
                  max_reasonable_spec_window);
        return false;
    }

    return true;
}

/// @brief Check the taint-tracker-related arguments
/// @param parsed_args Parsed command-line arguments
/// @return true if the taint tracker is disabled, or if it is enabled in backend mode
///         with a non-empty output path; otherwise, false (after printing a diagnostic)
static bool validate_taint_tracker(cli_args_t *parsed_args)
{
    // Nothing to validate when the taint tracker is not requested
    if (not parsed_args->enable_taint_tracker) {
        return true;
    }

    // The taint tracker is only available in backend mode
    if (parsed_args->mode != Mode::RVZR_BACKEND) {
        dr_printf(
            "Taint tracker can only be enabled when the model is used as a backend for rvzr.\n");
        return false;
    }

    // The collected taints need a destination
    if (parsed_args->taint_output.empty()) {
        dr_printf(
            "Taint tracker output path cannot be empty when the taint tracker is enabled.\n");
        return false;
    }

    return true;
}


================================================
FILE: rvzr/model_dynamorio/backend/dispatcher.cpp
================================================
///
/// File: Class responsible for instrumenting instructions
///       in the target application with a call to a dispatch function.
///       The function, in turn, calls service classes (e.g., Tracer, Speculator, etc)
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#include <cstdint>
#include <memory>
#include <string>

#include <dr_api.h> // NOLINT
#include <dr_defines.h>
#include <dr_tools.h>
#include <drmgr.h>
#include <drwrap.h>

#include "cli.hpp"
#include "dispatcher.hpp"
#include "factory.hpp"
#include "observables.hpp"
#include "util.hpp"

using std::string;

/// Defined by model.cpp
extern std::unique_ptr<Dispatcher> glob_dispatcher; // NOLINT

// =================================================================================================
// Runtime functions
// =================================================================================================

/// @brief Forward the current instruction to the service modules, in the order
///        logger -> taint tracker -> tracer -> speculator
/// @param mc Machine context of the current instruction
/// @param dc DynamoRIO context of the current thread
/// @param dispatcher The dispatcher that owns the service modules
/// @param instr Observables of the current instruction
/// @return The value returned by the speculator: the PC of the next instruction to be
///         executed (if redirection is necessary); otherwise, 0 (zero)
static pc_t instruction_dispatch(dr_mcontext_t *mc, void *dc, const Dispatcher *dispatcher,
                                 instr_obs_t instr)
{
    const auto nesting_level = dispatcher->speculator->get_nesting_level();
    dispatcher->logger->log_instruction(instr, mc, nesting_level);

    dispatcher->taint_tracker->track_instruction(instr, mc, dc);
    dispatcher->tracer->observe_instruction(instr, mc, dc);

    // The speculator goes last: it is the only module that may request a redirection
    return dispatcher->speculator->handle_instruction(instr, mc, dc);
}

/// @brief Forward every memory access of the current instruction to the service modules,
///        in the order logger -> taint tracker -> tracer -> speculator
/// @param dc DynamoRIO context of the current thread
/// @param mc Machine context of the current instruction (used to compute the addresses)
/// @param dispatcher The dispatcher that owns the service modules
/// @param pc Address of the current instruction
/// @return The PC returned by the speculator's rollback if the speculator rejects one of the
///         accesses; otherwise, 0 (zero)
static pc_t mem_access_dispatch(void *dc, dr_mcontext_t *mc, const Dispatcher *dispatcher, pc_t pc)
{
    // The memory operands are extracted from the decoded form of the instruction
    // (obtained from the decoder shared by the service modules)
    instr_t *decoded = dispatcher->decoder->get_decoded_instr(dc, (byte *)pc);

    // A single size is used for all operands
    // (assumed that all memory references for the instruction are of the same size)
    const uint64_t access_size = instr_memory_reference_size(decoded);

    // Walk over the memory operands until DR reports that there are no more of them
    app_pc target = nullptr;
    bool writes = false;
    for (uint operand = 0; instr_compute_address_ex(decoded, mc, operand, &target, &writes);
         operand++) {
        dispatcher->logger->log_mem_access(writes, target, access_size);
        dispatcher->taint_tracker->track_memory_access(writes, (void *)target, access_size);
        dispatcher->tracer->observe_mem_access(writes, target, access_size);

        const bool accepted =
            dispatcher->speculator->handle_mem_access(writes, (void *)target, access_size);
        if (not accepted) {
            return dispatcher->speculator->rollback(mc);
        }
    }

    return 0;
}

/// @brief Callback function called for every instruction in the instrumented function
/// @param bundle The bundle of service modules to be called
/// @param opcode The opcode of the instruction
/// @param pc The program counter (address) of the instruction
/// @param has_mem_ref Flag indicating whether the instruction has a memory reference
static void dispatch_callback(uint64_t opcode, uint64_t pc, uint64_t has_mem_ref)
{
    // Get the global dispatcher
    const Dispatcher *dispatcher = glob_dispatcher.get();
    DR_ASSERT_MSG(dispatcher != nullptr, "[ERROR] glob_dispatcher is null\n");

    // Nothing to do if we're outside of the instrumented function
    if (not dispatcher->is_instrumentation_on()) {
        return;
    }

    // get current context
    void *drcontext = dr_get_current_drcontext();
    dr_mcontext_t mc = {sizeof(mc), DR_MC_ALL};
    dr_get_mcontext(drcontext, &mc);

    // create an instruction instance for the current instruction
    const instr_obs_t instr = {
        .opcode = opcode,
        .pc = (pc_t)pc,
        .has_mem_access = (bool)has_mem_ref,
    };

    // pass down to instruction dispatch functions and redirect execution if needed
    pc_t next_pc = instruction_dispatch(&mc, drcontext, dispatcher, instr);
    if (next_pc != 0) {
        mc.pc = (byte *)next_pc;
        dr_redirect_execution(&mc);
        return; // unreachable
    }
    dr_set_mcontext(drcontext, &mc);
    if (has_mem_ref == 0) {
        return;
    }

    // pass down to memory access dispatch functions and redirect execution if needed
    next_pc = mem_access_dispatch(drcontext, &mc, dispatcher, instr.pc);
    if (next_pc != 0) {
        mc.pc = (byte *)next_pc;
        dr_redirect_execution(&mc);
        return; // unreachable
    }
    dr_set_mcontext(drcontext, &mc);
}

/// @brief Clean-call target executed upon return from the instrumented function.
///        A speculative exit triggers a rollback; an architectural exit stops the
///        instrumentation.
static void exit_callback()
{
    Dispatcher *dispatcher = glob_dispatcher.get();
    DR_ASSERT_MSG(dispatcher != nullptr, "[ERROR] glob_dispatcher is null\n");
    DR_ASSERT_MSG(dispatcher->is_instrumentation_on(),
                  "[ERROR] Instrumentation disabled when exiting instrumented function");

    // Snapshot the machine context of the application
    void *drcontext = dr_get_current_drcontext();
    dr_mcontext_t mc = {sizeof(mc), DR_MC_ALL};
    dr_get_mcontext(drcontext, &mc);

    if (not dispatcher->speculator->in_speculation) {
        // Architectural exit: stop the instrumentation
        flush_bb_cache();
        dispatcher->finalize();
        dr_set_mcontext(drcontext, &mc);
        return;
    }

    // The function is being exited speculatively: roll back and resume execution at
    // the PC provided by the speculator; the redirection is not expected to return
    const pc_t resume_pc = dispatcher->speculator->rollback(&mc);
    mc.pc = (byte *)resume_pc;
    dr_redirect_execution(&mc);
}

/// @brief Pass an exception to the service modules
/// @param drcontext DynamoRIO context of the current thread
/// @param siginfo Description of the exception
/// @return true if the speculator intercepted the exception;
///         false if the exception is to be forwarded to the program
bool Dispatcher::handle_exception(void *drcontext, dr_siginfo_t *siginfo) const
{
    logger->log_exception(siginfo);

    // The speculator gets the first chance: it takes care of exceptions on speculative paths
    if (speculator->handle_exception(drcontext, siginfo)) {
        return true; // intercepted
    }

    // Otherwise, the exception is architectural; record it and let the program handle it
    dr_printf("[XCPT] Dispatcher::handle_exception: exception on a non-speculative path\n");
    tracer->observe_exception(siginfo);
    return false; // not intercepted
}

// =================================================================================================
// Instrumentation-time Methods
// =================================================================================================
/// @brief Turn the instrumentation on for the first time.
///        Asserts that the dispatcher has not been started before, marks it as initialized,
///        and enables the taint tracker, the tracer and the speculator (in this order).
///        Use restart() to turn the instrumentation on again later.
void Dispatcher::start()
{
    DR_ASSERT_MSG(not is_initialized,
                  "[ERROR] Attempting to initialize Dispatcher multiple times.");

    instrumentation_on = true;
    is_initialized = true;

    // Turn service modules on
    taint_tracker->enable();
    tracer->enable();
    speculator->enable();
}

/// @brief Turn the instrumentation on again.
///        Asserts that start() has been called before, and re-enables the taint tracker,
///        the tracer and the speculator (in this order).
void Dispatcher::restart()
{
    DR_ASSERT_MSG(is_initialized,
                  "[ERROR] Attempting to restart Dispatcher without initialization.");

    instrumentation_on = true;

    // Turn service modules on
    taint_tracker->enable();
    tracer->enable();
    speculator->enable();
}

/// @brief Turn the instrumentation off.
///        Finalizes the taint tracker and the tracer, and disables the speculator.
///        Does nothing if the instrumentation is already off, so repeated calls are harmless.
void Dispatcher::finalize()
{
    if (not instrumentation_on)
        return;

    // Turn service modules off
    taint_tracker->finalize();
    tracer->finalize();
    speculator->disable();

    instrumentation_on = false;
}

/// @brief Insert a clean call to dispatch_callback before the given instruction
/// @param drcontext DynamoRIO context of the current thread
/// @param bb Instruction list (basic block) being instrumented
/// @param instr Instruction in `bb` before which the clean call is inserted
/// @return Always DR_EMIT_DEFAULT
dr_emit_flags_t Dispatcher::instrument_instruction(void *drcontext, instrlist_t *bb,
                                                   instr_t *instr) const
{
    // Code outside of the instrumented function is left untouched
    if (not instrumentation_on)
        return DR_EMIT_DEFAULT;

    // The callback arguments describe the instruction in its original form
    // (pre event_bb_app2app call); a null pointer means DR tells us to skip the instruction
    instr_t *app_instr = drmgr_orig_app_instr_for_fetch(drcontext);
    if (app_instr == nullptr)
        return DR_EMIT_DEFAULT;

    // Arguments of the callback: opcode, PC, and whether the instruction accesses memory
    const opnd_t arg_opcode = OPND_CREATE_INT64(instr_get_opcode(app_instr));
    const opnd_t arg_pc = OPND_CREATE_INTPTR(instr_get_app_pc(app_instr));
    const opnd_t arg_has_mem_ref =
        OPND_CREATE_INT64(instr_reads_memory(app_instr) or instr_writes_memory(app_instr));

    // The callback will forward the call to the service modules at runtime
    const int n_callback_args = 3;
    dr_insert_clean_call(drcontext, bb, instr, (void *)dispatch_callback, false, n_callback_args,
                         arg_opcode, arg_pc, arg_has_mem_ref);

    return DR_EMIT_DEFAULT;
}

void Dispatcher::instrument_exit(void *drcontext, instrlist_t *bb, instr_t *instr) const
{
    dr_insert_clean_call(drcontext, bb, instr, (void *)exit_callback, false, 0);
}

// =================================================================================================
// Constructors and Destructors
// =================================================================================================
Dispatcher::Dispatcher(cli_args_t *cli_args) : instrumentation_on(false)
{
    const cli_args_t &args = *cli_args;

    // The logger and the decoder come first: every other module receives a reference to them
    logger = create_logger(args.debug_output, args.log_level, args.print_dbg_trace);
    decoder = std::make_unique<Decoder>();

    // The taint tracker must exist before the tracer and the speculator, which both use it
    taint_tracker =
        create_taint_tracker(args.enable_taint_tracker, args.taint_output, *logger, *decoder);

    // Observation clause
    tracer = create_tracer(args.tracer_type, args.trace_output, *logger, *taint_tracker, *decoder,
                           args.print_trace);

    // Execution clause
    speculator = create_speculator(args.speculator_type, args.max_nesting, args.max_spec_window,
                                   *logger, *taint_tracker, *decoder, args.poison_value);
}

Dispatcher::~Dispatcher()
{
    // Destroy the modules in the reverse order of their construction.
    // The speculator and the tracer were created with references to the taint tracker, the
    // decoder and the logger, and the taint tracker with references to the decoder and the
    // logger. Releasing the dependents first guarantees that none of their destructors can
    // observe a dangling reference.
    speculator.reset();
    tracer.reset();
    taint_tracker.reset();
    decoder.reset();
    logger.reset();
}


================================================
FILE: rvzr/model_dynamorio/backend/factory.cpp
================================================
///
/// File: Implementation of the factory functions declared in factory.hpp
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#include <functional>
#include <memory>
#include <stdexcept>
#include <string>
#include <unordered_map>
#include <vector>

#include "factory.hpp"
#include "logger.hpp"
#include "speculator_abc.hpp"
#include "speculators/cond.hpp"
#include "speculators/seq.hpp"
#include "taint_tracker.hpp"
#include "tracer_abc.hpp"
#include "tracers/ct.hpp"
#include "tracers/ind.hpp"
#include "tracers/pc.hpp"
#include "types/decoder.hpp"

using std::function;
using std::string;
using std::unique_ptr;
using std::vector;

namespace
{

const std::unordered_map<string, function<unique_ptr<TracerABC>(const string &, Logger &,
                                                                TaintTracker &, Decoder &, bool)>>
    tracer_factories = {
        {
            "ct",
            [](const string &out_path, Logger &logger, TaintTracker &taint_tracker,
               Decoder &decoder, bool print) {
                return std::make_unique<TracerCT>(out_path, logger, taint_tracker, decoder, print);
            },
        },
        {
            "pc",
            [](const string &out_path, Logger &logger, TaintTracker &taint_tracker,
               Decoder &decoder, bool print) {
                return std::make_unique<TracerPC>(out_path, logger, taint_tracker, decoder, print);
            },
        },
        {
            "ind",
            [](const string &out_path, Logger &logger, TaintTracker &taint_tracker,
               Decoder &decoder, bool print) {
                return std::make_unique<TracerInd>(out_path, logger, taint_tracker, decoder, print);
            },
        }};

const std::unordered_map<string,
                         function<unique_ptr<SpeculatorABC>(int, int, Logger &, TaintTracker &,
                                                            Decoder &, std::optional<uint64_t>)>>
    speculator_factories = {
        {
            "seq",
            [](int max_nesting_, int max_spec_window_, Logger &logger, TaintTracker &taint_tracker,
               Decoder &decoder, std::optional<uint64_t> poison_value) {
                return std::make_unique<SpeculatorSeq>(max_nesting_, max_spec_window_, logger,
                                                       taint_tracker, decoder, poison_value);
            },
        },
        {
            "cond",
            [](int max_nesting_, int max_spec_window_, Logger &logger, TaintTracker &taint_tracker,
               Decoder &decoder, std::optional<uint64_t> poison_value) {
                return std::make_unique<SpeculatorCond>(max_nesting_, max_spec_window_, logger,
                                                        taint_tracker, decoder, poison_value);
            },
        }};

} // namespace

/// Build the tracer registered under `tracer_type`.
/// Throws std::invalid_argument when no tracer with that name is registered.
/// Exceptions raised by the tracer's own constructor are propagated unchanged.
unique_ptr<TracerABC> create_tracer(const string &tracer_type, const string &out_path,
                                    Logger &logger, TaintTracker &taint_tracker, Decoder &decoder,
                                    bool print)
{
    // Look the name up explicitly instead of catching std::out_of_range around the whole call:
    // that way an out_of_range thrown while constructing the tracer is not misreported
    // as an unknown tracer type
    const auto entry = tracer_factories.find(tracer_type);
    if (entry == tracer_factories.end()) {
        throw std::invalid_argument("Unexpected tracer type: " + tracer_type);
    }
    return entry->second(out_path, logger, taint_tracker, decoder, print);
}

vector<string> get_tracer_list()
{
    // Collect the keys of the factory table; the order follows the iteration order of the map
    vector<string> names;
    names.reserve(tracer_factories.size());
    for (auto it = tracer_factories.cbegin(); it != tracer_factories.cend(); ++it) {
        names.emplace_back(it->first);
    }
    return names;
}

/// Build the speculator registered under `speculator_type`.
/// Throws std::invalid_argument when no speculator with that name is registered.
/// Exceptions raised by the speculator's own constructor are propagated unchanged.
std::unique_ptr<SpeculatorABC> create_speculator(const string &speculator_type, int max_nesting_,
                                                 int max_spec_window_, Logger &logger,
                                                 TaintTracker &taint_tracker, Decoder &decoder,
                                                 std::optional<uint64_t> poison_value)
{
    // Look the name up explicitly instead of catching std::out_of_range around the whole call:
    // that way an out_of_range thrown while constructing the speculator is not misreported
    // as an unknown speculator type
    const auto entry = speculator_factories.find(speculator_type);
    if (entry == speculator_factories.end()) {
        throw std::invalid_argument("Unexpected speculator type: " + speculator_type);
    }
    return entry->second(max_nesting_, max_spec_window_, logger, taint_tracker, decoder,
                         poison_value);
}

vector<string> get_speculator_list()
{
    // Collect the keys of the factory table; the order follows the iteration order of the map
    vector<string> names;
    names.reserve(speculator_factories.size());
    for (auto it = speculator_factories.cbegin(); it != speculator_factories.cend(); ++it) {
        names.emplace_back(it->first);
    }
    return names;
}

unique_ptr<Logger> create_logger(const string &out_path, int level, bool print)
{
    // Clamp the requested verbosity into the valid range [0, LOG_MAX - 1]
    const int highest_level = static_cast<int>(Logger::LOG_MAX) - 1;
    const int sanitized_level = (level < 0) ? 0 : ((level > highest_level) ? highest_level : level);

    return std::make_unique<Logger>(out_path, static_cast<Logger::log_level_t>(sanitized_level),
                                    print);
}

std::unique_ptr<TaintTracker> create_taint_tracker(bool enable, const std::string &out_path,
                                                   Logger &logger, Decoder &decoder)
{
    // When taint tracking is switched off, hand out the NoneTaintTracker variant instead
    if (!enable) {
        return std::make_unique<NoneTaintTracker>(out_path, logger, decoder);
    }

    return std::make_unique<TaintTracker>(out_path, logger, decoder);
}


================================================
FILE: rvzr/model_dynamorio/backend/include/cli.hpp
================================================
///
/// File: Header for the Command Line Interface (cli.cpp)
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#pragma once

#include <cstdint>
#include <optional>
#include <string>

#include <dr_defines.h> // DR_PARAM_OUT

/// @brief Mode value carried in cli_args_t::mode.
///        NOTE(review): the behavior attached to each mode is implemented outside this header;
///        confirm against the code that consumes cli_args_t::mode.
enum class Mode : uint8_t {
    STANDALONE,
    RVZR_BACKEND,
};

/// @brief Parsed command line arguments; filled in by parse_cli().
///        Every scalar member carries a default initializer so that a default-constructed
///        object never exposes indeterminate values.
struct cli_args_t {
    /// Selected mode (presumably standalone tool vs. RVZR backend; confirm in cli.cpp)
    Mode mode = Mode::STANDALONE;
    /// Name of the tracer; forwarded to create_tracer()
    std::string tracer_type;
    /// Name of the instrumented function (presumably the function being wrapped; confirm)
    std::string instrumented_func;
    /// Output path of the trace; forwarded to create_tracer()
    std::string trace_output;
    /// Print flag forwarded to create_tracer()
    bool print_trace = false;
    /// Logger verbosity; sanitized by create_logger()
    int log_level = 0;
    /// Output path of the debug log; forwarded to create_logger()
    std::string debug_output;
    /// Print flag forwarded to create_logger()
    bool print_dbg_trace = false;
    /// Name of the speculator; forwarded to create_speculator()
    std::string speculator_type;
    /// Maximum nesting of speculation; forwarded to create_speculator()
    int max_nesting = 0;
    /// Maximum speculation window; forwarded to create_speculator()
    int max_spec_window = 0;
    /// Selects between the real and the "none" taint tracker in create_taint_tracker()
    bool enable_taint_tracker = false;
    /// Output path of the taint tracker; forwarded to create_taint_tracker()
    std::string taint_output;
    /// Presumably requests listing of the available tracers (confirm in cli.cpp)
    bool list_tracers = false;
    /// Presumably requests listing of the available speculators (confirm in cli.cpp)
    bool list_speculators = false;
    /// Optional poison value; forwarded to create_speculator()
    std::optional<uint64_t> poison_value;
};

/// @brief Parse the command line arguments
/// @param argc Standard argument count
/// @param argv Standard argument vector
/// @param parsed_args Output structure that receives the parsed arguments
/// @return void
/// @note Aborts via dr_abort() if the arguments cannot be parsed (no C++ exception is documented)
void parse_cli(int argc, const char **argv, DR_PARAM_OUT cli_args_t &parsed_args);


================================================
FILE: rvzr/model_dynamorio/backend/include/dispatcher.hpp
================================================
///
/// File: Header for the Dispatcher class,
///       responsible for instrumenting the target application with calls to service classes
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#pragma once

#include <memory>

#include <dr_api.h> // NOLINT

#include "cli.hpp"
#include "logger.hpp"
#include "speculator_abc.hpp"
#include "taint_tracker.hpp"
#include "tracer_abc.hpp"
#include "types/decoder.hpp"

/// @brief Dispatcher class responsible for adding instrumentation to instructions
///        in the target application and calling the appropriate
///        service classes (e.g., Tracer, Speculator, etc)
class Dispatcher
{
  public:
    /// @brief Creates all service modules from the parsed command line arguments
    /// @param cli_args Parsed command line arguments (must not be null)
    Dispatcher(cli_args_t *cli_args);
    virtual ~Dispatcher();
    // The dispatcher owns its service modules, so it is neither copyable nor movable
    Dispatcher(const Dispatcher &) = delete;
    Dispatcher &operator=(const Dispatcher &) = delete;
    Dispatcher(Dispatcher &&) = delete;
    Dispatcher &operator=(Dispatcher &&) = delete;

    // ---------------------------------------------------------------------------------------------
    // Public Attributes

    /// @param logger: shared logger for event tracing
    std::unique_ptr<Logger> logger = nullptr;
    /// @param decoder: shared instruction decode cache used by all modules
    std::unique_ptr<Decoder> decoder = nullptr;
    /// @param tracer: implements observation clause
    std::unique_ptr<TracerABC> tracer = nullptr;
    /// @param speculator: implements execution clause
    std::unique_ptr<SpeculatorABC> speculator = nullptr;
    /// @param taint_tracker: implements taint tracking for input boosting
    ///        (aka contract-based input generation)
    std::unique_ptr<TaintTracker> taint_tracker = nullptr;

    /// @param is_initialized: true if the dispatcher has been already initialized
    ///        (start was called)
    bool is_initialized = false;

    // ---------------------------------------------------------------------------------------------
    // Public Methods

    /// @brief Starts the instrumentation process for a wrapped function
    /// @return void
    void start();

    /// @brief Restarts the instrumentation process for a wrapped function;
    ///        requires that the dispatcher has been initialized before
    /// @return void
    void restart();

    /// @brief Finalizes the instrumentation process;
    ///        has no effect if the instrumentation is not currently on
    /// @return void
    void finalize();

    /// @brief Check if the instrumentation has started and is not finalized.
    /// @return true while the instrumentation is on
    [[nodiscard]] bool is_instrumentation_on() const { return instrumentation_on; };

    /// @brief Instruments the instruction \p instr with calls to callback functions of the
    /// corresponding type
    /// @param drcontext The drcontext of the current thread
    /// @param bb The basic block to be instrumented
    /// @param instr The instruction to instrument
    /// @return Flags to be consumed by DynamoRIO instrumentation callbacks
    dr_emit_flags_t instrument_instruction(void *drcontext, instrlist_t *bb, instr_t *instr) const;

    /// @brief Instruments the exit instruction with the finalization callback
    /// @param drcontext The drcontext of the current thread
    /// @param bb The basic block to be instrumented
    /// @param instr The instruction to instrument
    /// @return void
    void instrument_exit(void *drcontext, instrlist_t *bb, instr_t *instr) const;

    /// @brief Passes the exception down to service modules for handling
    /// @param drcontext The drcontext of the current thread
    /// @param siginfo Pointer to the exception data
    /// @return True if the exception has been handled (control-flow should be redirected)
    bool handle_exception(void *drcontext, dr_siginfo_t *siginfo) const;

    // ---------------------------------------------------------------------------------------------
    // Private Attributes
  private:
    /// @param instrumentation_on: true between start()/restart() and finalize();
    ///        set to false by the constructor
    bool instrumentation_on;
};


================================================
FILE: rvzr/model_dynamorio/backend/include/factory.hpp
================================================
///
/// File: Implementation of the Factory Function pattern to create instances
/// of core classes in the DR Model
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#pragma once

#include <memory>
#include <string>
#include <vector>

#include "speculator_abc.hpp"
#include "taint_tracker.hpp"
#include "tracer_abc.hpp"
#include "types/decoder.hpp"

/// @brief Create a tracer instance based on the tracer name
/// @param tracer_type The name of the tracer to create (one of get_tracer_list())
/// @param out_path The path of the trace output file
/// @param logger Where to log events for debugging
/// @param taint_tracker Taint tracker for input boosting
/// @param decoder Shared instruction decode cache
/// @param print Print every trace entry to STDOUT during tracing (slow)
/// @return A unique pointer to the created tracer instance
/// @throw std::invalid_argument if the tracer name is unknown
std::unique_ptr<TracerABC> create_tracer(const std::string &tracer_type,
                                         const std::string &out_path, Logger &logger,
                                         TaintTracker &taint_tracker, Decoder &decoder, bool print);

/// @brief Get a list of all available tracers
/// @return The names of all available tracers; the names are read from an unordered map,
///         so their order is unspecified
std::vector<std::string> get_tracer_list();

/// @brief Create a speculator instance based on the speculator name
/// @param speculator_type The name of the speculator to create (one of get_speculator_list())
/// @param max_nesting_ The maximum nesting level for the speculator
/// @param max_spec_window_ The maximum size of the speculation window
/// @param logger Where to log events for debugging
/// @param taint_tracker Taint tracker for input boosting
/// @param decoder Shared instruction decode cache
/// @param poison_value If not empty, this value will be forwarded on speculative faulty loads
/// @return A unique pointer to the created speculator instance
/// @throw std::invalid_argument if the speculator name is unknown
std::unique_ptr<SpeculatorABC> create_speculator(const std::string &speculator_type,
                                                 int max_nesting_, int max_spec_window_,
                                                 Logger &logger, TaintTracker &taint_tracker,
                                                 Decoder &decoder,
                                                 std::optional<uint64_t> poison_value);

/// @brief Get a list of all available speculators
/// @return The names of all available speculators; the names are read from an unordered map,
///         so their order is unspecified
std::vector<std::string> get_speculator_list();

/// @brief Create the shared logger to log debug events
/// @param out_path Where the logger should log
/// @param level Verbosity level of the logger; values outside of the valid range are clamped
///        to [0, Logger::LOG_MAX - 1]
/// @param print Forwarded to the Logger constructor: print every debug entry to STDOUT
/// @return A unique pointer to the created logger instance
std::unique_ptr<Logger> create_logger(const std::string &out_path, int level, bool print);

/// @brief Create the taint tracker instance
/// @param enable Whether to enable taint tracking; when false, a NoneTaintTracker is created
///        in place of a TaintTracker
/// @param out_path Where to write taint tracking output
/// @param logger Where to log events for debugging
/// @param decoder Shared instruction decode cache
/// @return A unique ptr to the created taint tracker instance
std::unique_ptr<TaintTracker> create_taint_tracker(bool enable, const std::string &out_path,
                                                   Logger &logger, Decoder &decoder);


================================================
FILE: rvzr/model_dynamorio/backend/include/logger.hpp
================================================
///
/// File: The Logger centralizes the collection of debug traces from different components
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#pragma once

#include <cstdint>

#include <dr_defines.h>
#include <dr_events.h>

#include "observables.hpp"
#include "types/debug_trace.hpp"
#include "types/file_buffer.hpp"

// =================================================================================================
// Class Definition
// =================================================================================================

/// @brief The Logger centralizes the collection of debug traces from different components
class Logger
{
  public:
    /// @brief Verbosity level of the logger; each level includes everything reported by the
    ///        levels below it
    enum log_level_t : uint8_t {
        LOG_NONE = 0,         // Disabled
        LOG_INSTRUCTIONS = 1, // Report PC, registers, memory operations and exceptions
        LOG_SPEC = 2,         // Also report rollbacks and checkpoints
        LOG_DISASM = 3,       // Also report module_name+offset of each instruction
        LOG_MAX = 4,          // Number of levels; not a valid level by itself
    };

    /// @brief Create a logger
    /// @param logs_path Path of the file where to dump the binary logs
    /// @param log_level Verbosity level of the logger
    /// @param print If true, every debug entry will be printed to STDOUT when inserted
    Logger(const std::string &logs_path, log_level_t log_level, bool print);
    ~Logger();
    // The logger is neither copyable nor movable
    Logger(const Logger &) = delete;
    Logger(Logger &&) = delete;
    Logger &operator=(const Logger &) = delete;
    Logger &operator=(Logger &&) = delete;

    /// @return true if logging is enabled (i.e., the level is above LOG_NONE)
    [[nodiscard]] bool is_enabled() const { return log_level > LOG_NONE; }
    /// @brief close the file that backs the logger
    void close();
    /// @return the path of the file where the logs are dumped to
    [[nodiscard]] const std::string &get_filename() const;

    /// @brief log the PC and registers of the current instruction, and whether it is speculative
    void log_instruction(instr_obs_t instr, dr_mcontext_t *mc, unsigned int nesting_level);
    /// @brief log a memory operation, including the value that is currently stored at the address
    void log_mem_access(bool is_write, void *address, uint64_t size);
    /// @brief log an exception
    void log_exception(dr_siginfo_t *siginfo);
    /// @brief log a checkpoint that marks a new speculative window
    void log_checkpoint(pc_t rollback_pc, uint64_t cur_window_size, size_t cur_store_log_size);
    /// @brief log a rollback that marks the end of the current speculative window
    void log_rollback(unsigned nesting, pc_t rollback_pc);
    /// @brief log a store that is executed to restore the memory state during a rollback
    void log_rollback_store(uint64_t addr, uint64_t val, size_t size, uint64_t nesting_level);
    /// @brief log end of trace
    void log_eot();

  private:
    /// @param capacity parameter of the file-backed buffer below
    static constexpr const unsigned buf_sz = 8 * 1024;
    /// @param the actual log, implemented as a file-backed buffer
    FileBackedBuf<debug_trace_entry_t, buf_sz> log;
    /// @param verbosity level of the logger
    const log_level_t log_level;
    /// @param current nesting level of speculation
    ///        (no in-class initializer; presumably set by the constructor -- TODO confirm)
    uint8_t cur_nesting_level;
};


================================================
FILE: rvzr/model_dynamorio/backend/include/observables.hpp
================================================
///
/// File: Collection of types describing an instruction
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#pragma once

#include <cstdint>

/// Numeric opcode of an instruction
using opcode_t = uint64_t;
/// Program counter (address) of an instruction
using pc_t = uint64_t;

/// @brief Observable information about a single instruction:
///        its opcode, its address, and whether it accesses memory
struct instr_obs_t {
    uint64_t opcode;
    uint64_t pc;
    bool has_mem_access;
};

/// @brief Observable information about a single memory access: its address and its size
struct mem_access_obs_t {
    uint64_t addr;
    uint64_t size;
};


================================================
FILE: rvzr/model_dynamorio/backend/include/speculator_abc.hpp
================================================
///
/// File: Header for speculator_abc.cpp
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#pragma once

#include <cstddef>
#include <cstdint>
#include <optional>
#include <vector>

#include <dr_api.h> // NOLINT

#include "logger.hpp"
#include "observables.hpp"
#include "taint_tracker.hpp"
#include "types/decoder.hpp"
#include "types/store_log.hpp"

using std::uint64_t;

// =================================================================================================
// Constants and Types
// =================================================================================================

/// @brief Checkpoint record kept by the speculator (one entry of the `checkpoints` stack)
struct checkpoint_t {
    /// PC associated with the rollback of this checkpoint
    pc_t rollback_pc;
    /// Speculation window value stored with the checkpoint
    uint64_t spec_window;
    /// Machine context stored with the checkpoint
    dr_mcontext_t mc;
};

// =================================================================================================
// Class Definition
// =================================================================================================

/// @brief Abstract base class for all speculators
class SpeculatorABC
{
  public:
    /// @brief Create a speculator
    /// @param max_nesting_ Maximum number of nested speculations
    ///        (stored as unsigned; a negative value wraps to a large unsigned value)
    /// @param max_spec_window_ Maximum speculation window size
    ///        (stored as unsigned; a negative value wraps to a large unsigned value)
    /// @param logger Used to log checkpoint and rollback events
    /// @param taint_tracker Used to taint-track dependencies
    /// @param decoder Shared cache for decoded instructions
    /// @param poison_value Optional poison value for faulty loads (see the member of the same
    ///        name)
    SpeculatorABC(int max_nesting_, int max_spec_window_, Logger &logger,
                  TaintTracker &taint_tracker, Decoder &decoder,
                  std::optional<uint64_t> poison_value)
        // NOTE: the initializers are listed in the declaration order of the members, which is
        // the order in which they are actually initialized
        : max_nesting(max_nesting_), max_spec_window(max_spec_window_), poison_value(poison_value),
          logger(logger), taint_tracker(taint_tracker), decoder(decoder)
    {
    }
    virtual ~SpeculatorABC() = default;
    SpeculatorABC(const SpeculatorABC &) = delete;
    SpeculatorABC &operator=(const SpeculatorABC &) = delete;
    SpeculatorABC(SpeculatorABC &&) = delete;
    SpeculatorABC &operator=(SpeculatorABC &&) = delete;

    // ---------------------------------------------------------------------------------------------
    // Public Attributes

    /// @param Boolean flag indicating whether the speculator is currently active
    bool in_speculation = false;

    // ---------------------------------------------------------------------------------------------
    // Public Methods

    /// @brief Enable the speculator
    void enable();
    /// @brief Disable the speculator
    void disable();
    /// @return The current speculation nesting level
    [[nodiscard]] unsigned int get_nesting_level() const { return nesting; }

    /// @brief Rollback to the last checkpoint, thus undoing all speculative changes to the process
    ///        state.
    ///
    ///        NOTE: The `rollback` method is public, because a rollback could be caused
    ///        by external events, such as exceptions. The `checkpoint` method, however, is
    ///        protected because it should never be called externally; instead,
    ///        the `handle_instruction` and `handle_mem_access` methods will call it internally
    ///        as a part of the speculation process.
    ///
    /// @param mc The machine context of the current instruction
    /// @return The PC of the next instruction to be executed
    virtual pc_t rollback(dr_mcontext_t *mc);

    /// @brief Check if the speculation should be skipped (e.g., due to exceeding the maximum
    ///        nesting, speculation window, or other conditions).
    /// @param void
    /// @return true if speculation should be skipped, false otherwise
    [[nodiscard]] bool skip_speculation() const;

    /// @brief Emulates speculation for the given instruction according to the target contract.
    ///        Each subclass implements a different contract, hence the implementation
    ///        of this method is different for each subclass.
    /// @param instr The observables of the instruction (opcode, PC, and memory access flag)
    /// @param mc The machine context of the instruction
    /// @param dc The current DR context
    /// @return 0 if no speculation was triggered or no redirection is needed;
    ///         otherwise, the PC of the instruction to which the execution should be redirected
    virtual pc_t handle_instruction(instr_obs_t instr, dr_mcontext_t *mc, void *dc);

    /// @brief Emulates speculation for the memory access according to the target contract.
    ///        Each subclass implements a different contract, hence the implementation
    ///        of this method is different for each subclass.
    /// @param is_write The type of the memory access (true for a write, false for a read)
    /// @param address The address of the memory access
    /// @param size The size of the memory access
    /// @return false if the memory access is invalid and is going to produce an exception
    virtual bool handle_mem_access(bool is_write, void *address, uint64_t size);

    /// @brief Notifies the speculator of an exception, needed to possibly reset internal state.
    /// @param drcontext The current DR context
    /// @param siginfo Pointer to the exception data
    /// @return Whether the speculator redirected execution or not.
    virtual bool handle_exception(void *drcontext, dr_siginfo_t *siginfo);

  protected:
    // ---------------------------------------------------------------------------------------------
    // Protected Attributes

    /// @brief Boolean flag indicating whether the speculation is enabled
    bool enabled = false;

    /// @param Stack of program state checkpoints (one checkpoint per nested speculation level)
    std::vector<checkpoint_t> checkpoints;

    /// @param Log of store operations performed during speculation; used to undo the operations
    ///        during rollback
    StoreLog store_log;

    /// @param Maximum number of nested speculations
    unsigned int max_nesting = 0;

    /// @param Current speculation nesting level
    unsigned int nesting = 0;

    /// @param Maximum speculation window size
    unsigned int max_spec_window = 0;

    /// @param Current speculation window
    unsigned int spec_window = 0;

    /// @param Should faulty loads cause a rollback or continue speculation with a poisoned value?
    const std::optional<uint64_t> poison_value;

    /// @param Used to log checkpoint and rollback events
    Logger &logger;

    /// @brief Used to taint-track dependencies between input values and contract trace
    TaintTracker &taint_tracker;

    /// @brief Shared cache for decoded instructions
    Decoder &decoder;

    // ---------------------------------------------------------------------------------------------
    // Protected Methods

    /// @brief Record a checkpoint of the current state and store it in the `checkpoints` stack
    /// @param mc The machine context of the current instruction
    /// @param pc The program counter (address) of the instruction
    /// @return void
    virtual void checkpoint(dr_mcontext_t *mc, pc_t pc);
};


================================================
FILE: rvzr/model_dynamorio/backend/include/speculators/cond.hpp
================================================
///
/// File: Header for the COND Speculator
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#pragma once

#include <dr_api.h> // NOLINT

#include "speculator_abc.hpp"

/// @brief Conditional Branch Misprediction (COND) Speculator;
///        This speculator implements a conditional branch misprediction
///        by flipping the conditions for all conditional branches.
class SpeculatorCond : public SpeculatorABC
{
  public:
    // Reuse the constructor of the base class as is
    using SpeculatorABC::SpeculatorABC;

    /// @brief If the current instruction is a branch, then the speculator will
    ///        checkpoint the process state and emulate a branch misprediction
    ///        by jumping to the opposite branch target (e.g., will take the branch if it
    ///        was supposed to fall through).
    ///
    /// @param instr The current instruction
    /// @param mc The machine context of the instruction
    /// @param dc The current DR context
    /// @return 0 if no speculation was triggered or no redirection is needed;
    ///         otherwise, the PC of the instruction to which the execution should be redirected
    pc_t handle_instruction(instr_obs_t instr, dr_mcontext_t *mc, void *dc) override;
};


================================================
FILE: rvzr/model_dynamorio/backend/include/speculators/seq.hpp
================================================
///
/// File: Header for the Seq (Sequential) Speculator
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#pragma once

#include "speculator_abc.hpp"

/// @brief Sequential (SEQ) Speculator;
///        This speculator implements a sequential execution model with no speculation.
///        It is the simplest form of a speculator and it is used to test the parts of
///        the instruction set where no speculation is expected.
class SpeculatorSeq : public SpeculatorABC
{
  public:
    // Reuse the constructor of the base class as is; no method of the base class is overridden
    using SpeculatorABC::SpeculatorABC;
};


================================================
FILE: rvzr/model_dynamorio/backend/include/taint_tracker.hpp
================================================
///
/// File: Header for Taint Tracker class,
///       which performs backward taint analysis to identify parts of the input that influence
///       contract traces.
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#pragma once

#include <cstdint>
#include <fstream>
#include <iostream>
#include <map>
#include <memory>
#include <set>
#include <sstream>
#include <string>
#include <vector>

#include <dr_api.h> // NOLINT
#include <dr_ir_opnd.h>

#include "logger.hpp"
#include "observables.hpp"
#include "types/decoder.hpp"
#include "types/input_taint.hpp"

// =================================================================================================
// Constants and Types
// =================================================================================================
/// Label of a tracked register
using tracker_reg_label_t = reg_id_t;
/// Label of a tracked memory location
using tracked_mem_label_t = uint64_t;
/// Generic label type used for the elements of dependency sets
using tracked_label_t = uint64_t;

// Extra register IDs for those registers that do not have a direct mapping in DynamoRIO.
// We use here the values that are guaranteed to be unused by other registers
// in our logic (this is defined in taint_tracer.cpp:normalize_reg) and thus are safe to re-use.
#define DR_REG_RIP DR_REG_NULL
#define DR_FLAG_CF DR_REG_AX // all GPRs are normalized to 64-bit, so AX and others are free
#define DR_FLAG_PF DR_REG_BX
#define DR_FLAG_AF DR_REG_CX
#define DR_FLAG_ZF DR_REG_DX
#define DR_FLAG_SF DR_REG_SI
#define DR_FLAG_OF DR_REG_DI
#define DR_FLAG_DF DR_REG_R8W

/// @brief Register IDs used by RVZR code
/// must match the register offsets defined in the rvzr/sandbox.py
/// Layout of the values below: the GPR and FLAGS entries are 8 apart (0x2000..0x2030),
/// the XMM entries are 0x20 apart (starting at 0x2040).
enum class RVZRRegId : uint64_t {
    RVZR_REG_RAX = 0x2000,
    RVZR_REG_RBX = 0x2008,
    RVZR_REG_RCX = 0x2010,
    RVZR_REG_RDX = 0x2018,
    RVZR_REG_RSI = 0x2020,
    RVZR_REG_RDI = 0x2028,
    RVZR_REG_FLAGS = 0x2030,
    RVZR_REG_XMM0 = 0x2040,
    RVZR_REG_XMM1 = 0x2060,
    RVZR_REG_XMM2 = 0x2080,
    RVZR_REG_XMM3 = 0x20A0,
    RVZR_REG_XMM4 = 0x20C0,
    RVZR_REG_XMM5 = 0x20E0,
    RVZR_REG_XMM6 = 0x2100,
    RVZR_REG_XMM7 = 0x2120,
    RVZR_REG_IGNORED = 0x2FFF, // presumably a placeholder for registers that are not tracked
};

/// @brief Structure holding source and destination operands of the tracked instruction.
///        The scalar members carry default initializers so that a default-constructed
///        object never exposes indeterminate values.
struct TrackedInstruction {
    /// Observables (opcode, PC, memory access flag) of the tracked instruction
    instr_obs_t instr_obs{};
    /// DR context associated with the tracked instruction
    void *dc = nullptr;

    /// Registers read by the instruction
    std::set<tracker_reg_label_t> src_regs;
    /// Registers written by the instruction
    std::set<tracker_reg_label_t> dest_regs;
    /// Memory labels read by the instruction
    std::set<tracked_mem_label_t> src_mems;
    /// Memory labels written by the instruction
    std::set<tracked_mem_label_t> dest_mems;
    /// Registers used to compute the addresses of the memory operands
    std::set<tracker_reg_label_t> mem_address_regs;
};

/// @brief Structure tracking all dependencies collected by TaintTracker
struct Dependencies {
    /// Maps a register label to the set of labels it depends on
    std::map<tracker_reg_label_t, std::set<tracked_label_t>> reg;
    /// Maps a memory label to the set of labels it depends on
    std::map<tracked_mem_label_t, std::set<tracked_label_t>> mem;
};

// =================================================================================================
// Class Definitions
// =================================================================================================

/// @brief Tracking of the input data that impacts contract traces.
///  The algorithm is as follows:
///  - track_instruction: get the static source and destination operands of the instruction
///  - track_memory_access: get dynamic source and destination memory addresses
///  - taint: collect the labels (register names or mem. addresses) that are
///    exposed by this instruction in the contract trace
///  - finalize_instruction:
///    1. propagate the dependencies of the source operands to the destination operands
///    2. update the list of tainted labels with the dependencies of the labels
///       collected by taint
///  - finalize: store the collected taints to the output file
class TaintTracker
{
  public:
    /// @brief Create a tracker and open its output file
    /// @param out_path_ Path of the file that receives the taints; it is opened for binary
    ///        output right away, in the constructor
    /// @param logger_ Logger kept by reference
    /// @param decode_cache_ Instruction decoder kept by reference
    TaintTracker(const std::string &out_path_, Logger &logger_, Decoder &decode_cache_)
        : logger(logger_), decoder(decode_cache_)
    {
        stream.open(out_path_, std::ios::binary | std::ios::out);
    }
    /// @brief Close the output stream if it is still open
    virtual ~TaintTracker()
    {
        if (stream.is_open())
            stream.close();
    }
    // The tracker owns an output stream and holds references: neither copyable nor movable
    TaintTracker(const TaintTracker &) = delete;
    TaintTracker &operator=(const TaintTracker &) = delete;
    TaintTracker(TaintTracker &&) = delete;
    TaintTracker &operator=(TaintTracker &&) = delete;

    // ---------------------------------------------------------------------------------------------
    // Public Attributes

    /// @brief Whether the tracker is enabled (initially false)
    bool enabled = false;
    /// @brief Whether an instruction is currently being tracked (initially false)
    bool tracking_in_progress = false;

    // ---------------------------------------------------------------------------------------------
    // Public Methods (state management)

    /// @brief Enable the taint tracker
    virtual void enable();

    /// @brief Disable the taint tracker and store the collected taints to out_path file
    virtual void finalize();

    /// @brief Save the current state of the taint tracker
    /// @param include_current_inst Whether to include the currently-tracked instruction in the
    ///        checkpoint. (This is currently unused; will be necessary in the future, when
    ///        implementing more complex contracts)
    /// @return void
    virtual void checkpoint(bool include_current_inst);

    /// @brief Restore the state of the taint tracker from the top-most checkpoint
    /// @return void
    virtual void rollback();

    // ---------------------------------------------------------------------------------------------
    // Public Methods (dependency propagation)

    /// @brief Parse instruction and record its static source and destination operands.
    ///        Static means the operands that we can identify without executing the instruction.
    ///        The remaining dynamic operands are collected by track_* methods.
    /// @param instr The instruction to track
    /// @param mc The machine context of the instruction
    /// @param dc The DR context of the instruction
    /// @return void
    virtual void track_instruction(instr_obs_t instr, dr_mcontext_t *mc, void *dc);

    /// @brief Add the address of the memory access to the list of current instruction dependencies
    /// @param is_write True for a write access, false for a read access
    /// @param address The address of the memory access
    /// @param size The size of the memory access
    virtual void track_memory_access(bool is_write, void *address, uint64_t size);

    // ---------------------------------------------------------------------------------------------
    // Public Methods (tainting)

    /// @brief Taint the operands of a given type for the tracked instruction
    ///        (tracked instruction is the last instruction on which track_instruction was called)
    /// @param value_type The type of the value to taint
    virtual void taint(taint_entry_type_t value_type);

  private:
    // ---------------------------------------------------------------------------------------------
    // Private Attributes

    /// @brief Output stream for taint entries
    std::ofstream stream;

    /// @brief Used to log checkpoint and rollback events
    Logger &logger;

    /// @brief Base address of the sandbox (stored in R14)
    uint64_t sandbox_base = 0;

    /// @brief Stack of dependency states for speculation support
    std::vector<Dependencies> checkpoints;

    /// @brief Set of labels (register IDs or memory addresses) that are tainted
    std::set<tracked_label_t> tainted_labels;

    /// @brief Set of labels to be tainted when `finalize` is called
    ///        NOTE(review): the class description suggests this happens in
    ///        finalize_instruction rather than finalize -- confirm against the implementation
    std::set<tracked_label_t> pending_taint;

    /// @brief The instruction currently being tracked
    std::unique_ptr<TrackedInstruction> current_instruction;

    /// @brief Current dependency state
    Dependencies dependencies;

    /// @brief Shared cache for decoded instructions (reference)
    Decoder &decoder;

    // ---------------------------------------------------------------------------------------------
    // Private Methods

    /// @brief Store all collected taints to the output file
    void store_taints();

    /// @brief Parse instruction operands and populate TrackedInstruction structure
    void parse_instruction_operands(TrackedInstruction *tracked_inst);

    /// @brief Add dependencies from tracked instruction to the global dependency state
    void add_dependencies(const TrackedInstruction *tracked_inst);

    /// @brief Remove overwritten dependencies (for MOV/LEA-like instructions)
    void remove_overwritten_dependencies(const TrackedInstruction *tracked_inst);

    /// @brief Collect all source dependencies from a tracked instruction
    /// @param tracked_inst The instruction to collect dependencies from
    /// @return Set of all labels that the instruction's sources depend on
    std::set<tracked_label_t> collect_source_dependencies(
        const TrackedInstruction *tracked_inst) const;

    /// @brief Propagate source dependencies to a destination in the dependency map
    /// @tparam LabelT The type of label (register or memory)
    /// @param dest_label The destination label to update
    /// @param src_dependencies The source dependencies to propagate
    /// @param dep_map The dependency map to update (either reg or mem)
    template <typename LabelT>
    void propagate_dependencies_to_dest(LabelT dest_label,
                                        const std::set<tracked_label_t> &src_dependencies,
                                        std::map<LabelT, std::set<tracked_label_t>> &dep_map);

    /// @brief Debug: Print the current tainted labels. Should be unused in release builds.
    void dbg_print_taints();

    /// @brief Debug: Print the current dependencies. Should be unused in release builds.
    void dbg_print_dependencies();

    // ---------------------------------------------------------------------------------------------
    // Protected Methods
    // NOTE(review): despite the heading, no `protected:` specifier precedes this section, so
    // finalize_instruction is private like the methods above.

    /// @brief Propagate dependencies and record the taints of the tracked instruction
    /// @throw dr_abort if called when tracking is not in progress
    void finalize_instruction();
};

/// @brief Null-object variant of TaintTracker, used when taint tracking is disabled.
///        Every virtual hook is overridden with an empty body, so no dependencies are
///        propagated and nothing is tainted. The constructor still forwards its arguments
///        to the TaintTracker constructor.
class NoneTaintTracker : public TaintTracker
{
  public:
    /// @brief Forward all arguments to the TaintTracker constructor
    NoneTaintTracker(const std::string &out_path_, Logger &logger_, Decoder &decode_cache_)
        : TaintTracker(out_path_, logger_, decode_cache_)
    {
    }
    ~NoneTaintTracker() override = default;

    // Neither copyable nor movable, like the base class
    NoneTaintTracker(const NoneTaintTracker &) = delete;
    NoneTaintTracker &operator=(const NoneTaintTracker &) = delete;
    NoneTaintTracker(NoneTaintTracker &&) = delete;
    NoneTaintTracker &operator=(NoneTaintTracker &&) = delete;

    // ---------------------------------------------------------------------------------------------
    // State management: intentionally empty

    void enable() override {}
    void finalize() override {}
    void checkpoint(bool /*include_current_inst*/) override {}
    void rollback() override {}

    // ---------------------------------------------------------------------------------------------
    // Dependency propagation and tainting: intentionally empty

    void track_instruction(instr_obs_t /*instr*/, dr_mcontext_t * /*mc*/, void * /*dc*/) override
    {
    }
    void track_memory_access(bool /*is_write*/, void * /*address*/, uint64_t /*size*/) override {}
    void taint(taint_entry_type_t /*value_type*/) override {}
};


================================================
FILE: rvzr/model_dynamorio/backend/include/tracer_abc.hpp
================================================
///
/// File: Header for the Tracer abstract base class
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#pragma once

#include <cstdint>
#include <string>

#include <dr_api.h> // NOLINT
#include <dr_defines.h>
#include <dr_events.h>
#include <drvector.h>

#include "logger.hpp"
#include "observables.hpp"
#include "taint_tracker.hpp"
#include "types/decoder.hpp"
#include "types/file_buffer.hpp"
#include "types/trace.hpp"

using std::uint64_t;

// =================================================================================================
// Class Definition
// =================================================================================================

/// @brief Abstract base class for all tracers
class TracerABC
{
  public:
    /// @brief Construct a tracer
    /// @param out_path Path of the output trace file
    /// @param logger Where to log events for debugging
    /// @param taint_tracker Tracker of dependencies between input values and contract trace
    /// @param decoder Shared cache for decoded instructions
    /// @param print Printing flag (presumably forwarded to the trace buffer -- TODO confirm)
    TracerABC(const std::string &out_path, Logger &logger, TaintTracker &taint_tracker,
              Decoder &decoder, bool print);
    virtual ~TracerABC();
    // Tracers hold references and a file-backed buffer: neither copyable nor movable
    TracerABC(const TracerABC &) = delete;
    TracerABC &operator=(const TracerABC &) = delete;
    TracerABC(TracerABC &&) = delete;
    TracerABC &operator=(TracerABC &&) = delete;

    /// @brief Size threshold (second template argument) of the trace buffer below
    static constexpr const unsigned buf_sz = 8 * 1024;
    /// @brief Buffer containing collected trace entries.
    ///        Declared mutable, presumably so that const methods such as observe_exception
    ///        can append to it -- TODO confirm against the implementation.
    mutable FileBackedBuf<trace_entry_t, buf_sz> trace;

    // ---------------------------------------------------------------------------------------------
    // Public Methods

    /// @brief Starts the tracing process for a wrapped function
    /// @return void
    virtual void enable();

    /// @brief Finalizes the tracing process for a wrapped function
    /// @return void
    virtual void finalize();

    /// @brief Record per-instruction information on the trace (e.g., its address) as defined
    ///        by the target contract.
    ///        Note: some subclasses may not record any information as the corresponding
    ///        contract may not require it. For such subclasses, this method should be a no-op.
    /// @param instr the observed instruction
    /// @param mc The machine context of the instruction
    /// @param dc The DR context of the instruction
    /// @return void
    virtual void observe_instruction(instr_obs_t instr, dr_mcontext_t *mc, void *dc);

    /// @brief Record per-memory access information on the trace (e.g., its address and value)
    ///        as defined by the target contract.
    ///        Note: some subclasses may not record any information as the corresponding
    ///        contract may not require it. For such subclasses, this method should be a no-op.
    /// @param is_write True for a write access, false for a read access
    /// @param address The address of the memory access
    /// @param size The size of the memory access
    /// @return void
    virtual void observe_mem_access(bool is_write, void *address, uint64_t size);

    /// @brief Record an architectural exception with a special marker in the trace.
    /// @param siginfo Information about the exception coming from DynamoRIO.
    void observe_exception(dr_siginfo_t *siginfo) const;

  protected:
    // ---------------------------------------------------------------------------------------------
    // Protected Fields

    /// @brief If true, the tracer will instrument the instructions in the traced function
    bool tracing_on = false;

    /// @brief If true, tracing has been finalized; no more tracing is allowed
    bool tracing_finalized = false;

    /// @brief Where to log events for debugging
    Logger &logger;

    /// @brief Used to taint-track dependencies between input values and contract trace
    TaintTracker &taint_tracker;

    /// @brief Shared cache for decoded instructions
    Decoder &decoder;

    // ---------------------------------------------------------------------------------------------
    // Protected Methods

    /// @brief Create a new PC entry and push it on the trace buffer
    ///        This method is meant to be used by observe_instruction if a given contract requires
    ///        recording PCs in the trace.
    /// @param instr The observed instruction
    void record_pc(instr_obs_t instr);

    /// @brief Create a new mem entry and push it on the trace buffer
    ///        This method is meant to be used by observe_mem_access if a given contract requires
    ///        recording memory accesses in the trace.
    /// @param is_write True for a write access, false for a read access
    /// @param address The address of the memory access
    /// @param size The size of the memory access
    void record_mem_access(bool is_write, void *address, uint64_t size);
};


================================================
FILE: rvzr/model_dynamorio/backend/include/tracers/ct.hpp
================================================
///
/// File: Header for the CT Tracer and its variants
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#pragma once

#include <dr_api.h> // NOLINT
#include <dr_defines.h>

#include "tracer_abc.hpp"

/// @brief "Constant-Time" (CT) Tracer;
/// This tracer collects addresses of memory accesses and PCs of the executed instructions
class TracerCT : public TracerABC
{
  public:
    // Reuse the TracerABC constructors unchanged
    using TracerABC::TracerABC;

    /// @brief Record the PC of the executed instruction on the contract trace
    /// @param instr the observed instruction
    /// @param mc unused
    /// @param dc unused
    /// @return void
    void observe_instruction(instr_obs_t instr, dr_mcontext_t *mc, void *dc) override;

    /// @brief Record the memory access
    /// @param is_write True for a write access, false for a read access
    /// @param address The address of the memory access
    /// @param size The size of the memory access
    /// @return void
    void observe_mem_access(bool is_write, void *address, uint64_t size) override;
};


================================================
FILE: rvzr/model_dynamorio/backend/include/tracers/ind.hpp
================================================
///
/// File: Header for the Indirect Call Tracer
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#pragma once

#include <dr_api.h> // NOLINT
#include <dr_defines.h>

#include "tracer_abc.hpp"

/// @brief Indirect Tracer;
/// This tracer collects target addresses of indirect calls, indirect branches and returns
class TracerInd : public TracerABC
{
  public:
    // Reuse the TracerABC constructors unchanged
    using TracerABC::TracerABC;

    /// @brief Record the target of the executed indirect call (or branch or ret) on the contract
    /// trace
    /// @param instr the instruction being observed
    /// @param mc the instruction's machine context
    /// @param dc the instruction's DR context
    /// @return void
    void observe_instruction(instr_obs_t instr, dr_mcontext_t *mc, void *dc) override;
};


================================================
FILE: rvzr/model_dynamorio/backend/include/tracers/pc.hpp
================================================
///
/// File: Header for the PC Tracer
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#pragma once

#include <dr_api.h> // NOLINT
#include <dr_defines.h>

#include "tracer_abc.hpp"

/// @brief Program-Counter (PC) Tracer;
/// This tracer collects PCs of the executed instructions.
/// Unlike TracerCT, it does not override observe_mem_access.
class TracerPC : public TracerABC
{
  public:
    // Reuse the TracerABC constructors unchanged
    using TracerABC::TracerABC;

    /// @brief Record the PC of the executed instruction on the contract trace
    /// @param instr the observed instruction
    /// @param mc unused
    /// @param dc unused
    /// @return void
    void observe_instruction(instr_obs_t instr, dr_mcontext_t *mc, void *dc) override;
};


================================================
FILE: rvzr/model_dynamorio/backend/include/types/debug_trace.hpp
================================================
///
/// File: Debug trace entries produced when debugging
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#pragma once

#include <array>
#include <cstdint>
#include <ostream>

/// @brief Type of entry (single element of a trace).
///        The type selects which member of the union in debug_trace_entry_t is meaningful.
enum class debug_trace_entry_type_t : uint8_t {
    ENTRY_EOT = 0, // end of trace
    ENTRY_REG_DUMP = 1, // register dump (rax, rbx, rcx, rdx, rsi, rdi, pc)
    ENTRY_READ = 2, // memory read (address, value, size)
    ENTRY_WRITE = 3, // memory write (address, value, size)
    ENTRY_LOC = 4, // code location (module name and offset)
    ENTRY_EXCEPTION = 5, // exception (signal and address)
    ENTRY_CHECKPOINT = 6, // checkpoint (rollback pc, window size, store log size)
    ENTRY_ROLLBACK = 7, // rollback (nesting and rollback pc)
    ENTRY_ROLLBACK_STORE = 8, // store entry of a rollback (addr, val, size, nesting level)
    ENTRY_REG_DUMP_EXTENDED = 9, // second register dump (rsp, rbp, flags, r8-r11)
};

/// @brief Pretty-printer for debug_trace_entry_type_t
/// @param type The entry type to convert
/// @return A string literal naming the type, or "UNKNOWN" when the value matches none of the
///         enumerators. Note that some labels ("REG_DUMP ", "READ ") end with a space, which
///         is part of the returned string.
static constexpr const char *to_string(const debug_trace_entry_type_t &type)
{
    switch (type) {
    case debug_trace_entry_type_t::ENTRY_EOT:
        return "EOT";
    case debug_trace_entry_type_t::ENTRY_REG_DUMP:
        return "REG_DUMP ";
    case debug_trace_entry_type_t::ENTRY_READ:
        return "READ ";
    case debug_trace_entry_type_t::ENTRY_WRITE:
        return "WRITE";
    case debug_trace_entry_type_t::ENTRY_LOC:
        return "LOC";
    case debug_trace_entry_type_t::ENTRY_EXCEPTION:
        return "XCPT";
    case debug_trace_entry_type_t::ENTRY_CHECKPOINT:
        return "CHECKPOINT";
    case debug_trace_entry_type_t::ENTRY_ROLLBACK_STORE:
        return "ROLLBACK_STR";
    case debug_trace_entry_type_t::ENTRY_ROLLBACK:
        return "ROLLBACK";
    case debug_trace_entry_type_t::ENTRY_REG_DUMP_EXTENDED:
        return "REG_DUMP2";
    }

    // Reached only for values outside the enumerators handled above
    return "UNKNOWN";
}

/// @brief A single entry of the debug trace: a small header (type and nesting level)
///        followed by a union whose active member is selected by `type`.
struct debug_trace_entry_t {
    // What does this entry contain
    debug_trace_entry_type_t type;
    // Nested speculation (0 is architectural)
    uint8_t nesting_level;
    // Unused for now
    uint8_t padding[6]; // NOLINT

    // Union of all possible entry types
    union {
        // ENTRY_REG_DUMP
        struct {
            uint64_t xax;
            uint64_t xbx;
            uint64_t xcx;
            uint64_t xdx;
            uint64_t xsi;
            uint64_t xdi;
            uint64_t pc;
        } regs;
        // ENTRY_REG_DUMP_EXTENDED
        struct {
            uint64_t rsp;
            uint64_t rbp;
            uint64_t flags;
            uint64_t r8;
            uint64_t r9;
            uint64_t r10;
            uint64_t r11;
        } regs_2;
        // ENTRY_READ and ENTRY_WRITE
        struct {
            uint64_t address;
            uint64_t value;
            uint64_t size;
        } mem;
        // ENTRY_LOC (module name and offset, for disassembly)
        struct {
            uint64_t offset;
            std::array<char, 48> module_name; // NOLINT
        } loc;
        // ENTRY_EXCEPTION
        struct {
            int signal;
            uint64_t address;
        } xcpt;
        // ENTRY_CHECKPOINT
        struct {
            uint64_t rollback_pc;
            uint64_t cur_window_size;
            size_t cur_store_log_size;
        } checkpoint;
        // ENTRY_ROLLBACK
        struct {
            unsigned nesting;
            uint64_t rollback_pc;
        } rollback;
        // ENTRY_ROLLBACK_STORE
        struct {
            uint64_t addr;
            uint64_t val;
            size_t size;
            uint64_t nesting_level;
        } rollback_store;
    };

    /// @brief Marker character identifying traces made of this entry type
    static constexpr char marker = 'D';

    /// @brief Pretty-printer for debug_trace_entry_t.
    ///        Writes one line: "[ARCH] " or "[SPEC_<n>] ", then "[<type>] ", then the fields
    ///        of the union member selected by `type`, then a newline.
    /// @param out Stream receiving the text. Its numeric base (std::hex / std::dec) is left
    ///        in whatever state the last printed field set.
    void dump(std::ostream &out) const
    {
        // Arch or spec
        if (nesting_level == 0)
            out << "[ARCH] ";
        else {
            // Widen to a standard integer type so the level is printed as a number rather
            // than as a character (uint8_t streams as a char).
            out << "[SPEC_" << std::dec << static_cast<unsigned>(nesting_level) << "] ";
        }
        // Print entry type
        out << "[" << to_string(type) << "] ";

        // Print content
        switch (type) {
        case debug_trace_entry_type_t::ENTRY_REG_DUMP:
            out << " pc: " << std::hex << regs.pc;
            out << "  (rax: 0x" << std::hex << regs.xax;
            out << " rbx: 0x" << std::hex << regs.xbx;
            out << " rcx: 0x" << std::hex << regs.xcx;
            out << " rdx: 0x" << std::hex << regs.xdx;
            out << " rsi: 0x" << std::hex << regs.xsi;
            out << " rdi: 0x" << std::hex << regs.xdi << ")";
            break;

        case debug_trace_entry_type_t::ENTRY_LOC:
            // module_name may fill the whole array, so stop at the first NUL, if any
            for (const char name_char : loc.module_name) {
                if (name_char == '\0')
                    break;
                out << name_char;
            }
            out << "+0x" << std::hex << loc.offset;
            break;

        case debug_trace_entry_type_t::ENTRY_READ:
        case debug_trace_entry_type_t::ENTRY_WRITE:
            out << " addr: " << std::hex << mem.address;
            out << "  val: " << std::hex << mem.value;
            out << "  (sz: " << std::dec << mem.size << ")";
            break;

        case debug_trace_entry_type_t::ENTRY_EXCEPTION:
            out << " sig: " << std::dec << xcpt.signal;
            out << "  addr: " << std::hex << xcpt.address;
            break;

        case debug_trace_entry_type_t::ENTRY_EOT:
            // This line carries its own newline, so an EOT entry is followed by a blank line
            out << "---- END OF TRACE ----\n";
            break;

        case debug_trace_entry_type_t::ENTRY_CHECKPOINT:
            out << " rollback_pc: " << std::hex << checkpoint.rollback_pc;
            out << " (storelog_sz: " << std::dec << checkpoint.cur_store_log_size;
            out << " window_sz: " << std::dec << checkpoint.cur_window_size << ")";
            break;

        case debug_trace_entry_type_t::ENTRY_ROLLBACK:
            out << " rollback_pc: " << std::hex << rollback.rollback_pc;
            out << " (nesting: " << std::dec << rollback.nesting << ")";
            break;

        case debug_trace_entry_type_t::ENTRY_ROLLBACK_STORE:
            out << " addr: 0x" << std::hex << rollback_store.addr;
            out << " val: 0x" << std::hex << rollback_store.val;
            out << " (sz: " << std::dec << rollback_store.size;
            out << " nesting: " << std::dec << rollback_store.nesting_level << ")";
            break;

        case debug_trace_entry_type_t::ENTRY_REG_DUMP_EXTENDED:
            out << " rsp: 0x" << std::hex << regs_2.rsp;
            out << " rbp: 0x" << std::hex << regs_2.rbp;
            out << " flags: 0x" << std::hex << regs_2.flags;
            out << " r8: 0x" << std::hex << regs_2.r8;
            out << " r9: 0x" << std::hex << regs_2.r9;
            out << " r10: 0x" << std::hex << regs_2.r10;
            out << " r11: 0x" << std::hex << regs_2.r11;
            break;
        }

        out << "\n";
    }
};


================================================
FILE: rvzr/model_dynamorio/backend/include/types/decoder.hpp
================================================
///
/// File: Instruction Decoder
///       Decodes and caches DynamoRIO instructions to avoid redundant decoding
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#pragma once

#include <unordered_map>

#include <dr_api.h>      // NOLINT
#include <dr_ir_instr.h> // NOLINT
#include <dr_ir_utils.h> // NOLINT

/// @brief Cached entry containing decoded instruction and next PC
struct CachedInstr {
    /// Storage of the decoded instruction; accessed as instr_t via instr_from_noalloc
    instr_noalloc_t instr;
    /// Value returned by decode() for this instruction: the address right after it
    byte *next_pc;
};

/// @brief Caching front-end for the DynamoRIO instruction decoder
///
/// Every instruction is decoded at most once; the result is kept in a map keyed by the
/// instruction's program counter (PC), together with the address that follows the
/// instruction. Decoded instructions live inside instr_noalloc_t objects stored directly in
/// the map, so the decoder performs no manual memory management for them.
///
/// Usage:
///   Decoder decoder;
///   instr_t *instr = decoder.get_decoded_instr(drcontext, pc);
///   byte *next_pc = decoder.get_next_pc(drcontext, pc);
///   decoder.clear(); // Clear when done
class Decoder
{
  public:
    Decoder() = default;
    ~Decoder() { clear(); }

    // Callers receive pointers into the cache: neither copyable nor movable
    Decoder(const Decoder &) = delete;
    Decoder &operator=(const Decoder &) = delete;
    Decoder(Decoder &&) = delete;
    Decoder &operator=(Decoder &&) = delete;

    /// @brief Return the decoded instruction located at a PC, decoding it on first use
    /// @param drcontext DynamoRIO context
    /// @param pc Program counter of the instruction
    /// @return Pointer to the decoded instruction (owned by the cache)
    /// @throw dr_abort if decoding fails
    instr_t *get_decoded_instr(void *drcontext, byte *pc)
    {
        return instr_from_noalloc(&cache_access(drcontext, pc).instr);
    }

    /// @brief Return the address that follows the instruction located at a PC,
    ///        decoding the instruction on first use
    /// @param drcontext DynamoRIO context
    /// @param pc Program counter of the instruction
    /// @return The next PC (address immediately following the instruction)
    /// @throw dr_abort if decoding fails
    byte *get_next_pc(void *drcontext, byte *pc) { return cache_access(drcontext, pc).next_pc; }

    /// @brief Drop all cached instructions
    void clear()
    {
        // Per the DynamoRIO API documentation, instr_noalloc_t does not use heap allocation,
        // so erasing the map entries is all the cleanup required.
        cache.clear();
    }

    /// @brief Get the number of cached instructions
    /// @return Number of cached instructions
    [[nodiscard]] size_t size() const { return cache.size(); }

    /// @brief Check if the cache is empty
    /// @return True if cache is empty
    [[nodiscard]] bool empty() const { return cache.empty(); }

  private:
    /// @brief Decoded instructions and their next PCs, keyed by PC
    std::unordered_map<byte *, CachedInstr> cache;

    /// @brief Look up the entry of a PC, decoding and inserting it when it is missing
    /// @param drcontext DynamoRIO context
    /// @param pc Program counter of the instruction
    /// @return Reference to the cached instruction entry
    CachedInstr &cache_access(void *drcontext, byte *pc)
    {
        // One lookup covers both cases: an existing entry is returned untouched, a missing
        // one is value-initialized in place.
        const auto [slot, is_new] = cache.try_emplace(pc);
        CachedInstr &entry = slot->second;
        if (!is_new)
            return entry;

        // Fresh entry: decode straight into the storage owned by the map
        instr_noalloc_init(drcontext, &entry.instr);
        byte *const following_pc = decode(drcontext, pc, instr_from_noalloc(&entry.instr));
        if (following_pc == nullptr) {
            // Decode failed - remove from cache and abort
            cache.erase(pc);
            dr_printf("[ERROR] Decoder: Failed to decode instruction at PC %p\n", (void *)pc);
            dr_abort();
        }

        entry.next_pc = following_pc;
        return entry;
    }
};


================================================
FILE: rvzr/model_dynamorio/backend/include/types/file_buffer.hpp
================================================
///
/// File: A buffer that gets automatically spilled to a file when it becomes too big
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#pragma once

#include "dr_api.h"
#include "dr_tools.h"

#include <array>
#include <cstdint>
#include <fstream>
#include <iostream>
#include <sstream>

/// @brief A buffer backed by a file: once the buffer reaches a given threshold, it gets
/// automatically spilled into the backing file. Entries can only be appended to the buffer.
/// Entries still buffered when the object is destroyed are written out before the file is
/// closed.
/// @tparam T All entries pushed to the buffer have this type. It must provide a static
///         `marker` character (written in the file header) and a `dump(std::ostream &)`
///         method (used when printing is enabled).
/// @tparam BufSize Threshold for the buffer, in bytes.
template <typename T, unsigned BufSize> class FileBackedBuf
{
    // An exact number of entries of type T should fit in the buffer
    static_assert(BufSize % sizeof(T) == 0,
                  "[ASSERT] FileBackedBuf size must fit an exact number of elements");
    // A zero-capacity buffer would overflow on the very first push_back
    static_assert(BufSize >= sizeof(T),
                  "[ASSERT] FileBackedBuf size must fit at least one element");

  private:
    /// Capacity of the in-memory buffer, in entries
    static constexpr const unsigned max_elems = BufSize / sizeof(T);
    /// Number of entries currently held in `buf`
    unsigned n_elems = 0;
    std::array<T, max_elems> buf;
    /// Backing file; closed until open() is called
    std::ofstream stream;
    std::string filename;

    /// If true, every pushed entry is also printed through dr_printf
    const bool print;

  public:
    /// @param print Whether to print every entry (via its dump method) when it is pushed
    FileBackedBuf(bool print) : print(print) {}

    /// @brief Write out the entries that are still buffered, then close the backing file
    ~FileBackedBuf() { clear(); }

    FileBackedBuf(const FileBackedBuf &) = delete;
    FileBackedBuf(FileBackedBuf &&) = delete;
    FileBackedBuf &operator=(const FileBackedBuf &other) = delete;
    FileBackedBuf &operator=(FileBackedBuf &&other) = delete;

    /// @brief Open the backing ostream and print the header.
    ///        Does nothing if the stream is already open. The result of opening the file is
    ///        not checked here.
    /// @param filename_ Path of backing file
    void open(const std::string &filename_)
    {
        if (stream.is_open())
            return;

        // Open the backing stream
        filename = filename_;
        stream.open(filename_, std::ios::binary | std::ios::out);

        // Write header so that the parser knows which type of trace we are generating
        const char marker = T::marker;
        stream.write(&marker, 1);

        // pad the header to 8 bytes for readability
        const char padding[7] = {0, 0, 0, 0, 0, 0, 0}; // NOLINT
        stream.write(padding, 7);                      // NOLINT
    }

    /// @brief Write the current buffer contents into the backing file and empty the buffer.
    ///        If the backing file is not open, the buffered entries are discarded: the
    ///        buffer must be emptied in any case so that push_back never overflows it.
    /// TODO: this could be made asynchronous
    void flush()
    {
        if (n_elems > 0 && stream.is_open()) {
            const auto n_bytes = static_cast<std::streamsize>(n_elems * sizeof(T));
            stream.write(reinterpret_cast<const char *>(buf.data()), n_bytes);
        }
        n_elems = 0;
    }

    /// @brief Append an element to the buffer; spills the buffer to the file when it is full
    /// @param elem The element to add
    void push_back(const T &elem)
    {
        buf[n_elems] = elem;
        n_elems++;

        if (print) {
            // Render the entry into a string first: dr_printf takes a C format string
            std::ostringstream rendered;
            elem.dump(rendered);
            dr_printf("%s", rendered.str().c_str());
        }

        if (n_elems == max_elems)
            flush();
    }

    /// @brief Write out the buffered entries and close the backing ostream.
    ///        Does nothing if the stream is not open.
    void clear()
    {
        if (not stream.is_open())
            return;

        flush();
        stream.close();
    }

    /// @brief Get the name of the backing file
    /// @return The path given to the last effective open() call (empty if never opened)
    const std::string &get_filename() const { return filename; }
};


================================================
FILE: rvzr/model_dynamorio/backend/include/types/input_taint.hpp
================================================
///
/// File: Class representing the taints collected by TaintTracker class
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#pragma once

#include <cstdint>
#include <cstdio>
#include <fstream>
#include <iostream>
#include <vector>

/// @brief Type of the entries of a taint trace
enum class taint_entry_type_t : uint8_t {
    TAINT_ENTRY_EOT = 0, // end of trace
    TAINT_ENTRY_PC = 1, // PC entry
    TAINT_ENTRY_MEM = 2, // memory entry
};

/// @brief One record of a taint trace: a type tag plus a 64-bit payload
struct taint_entry_t {
    /// Kind of the record
    taint_entry_type_t type;
    /// Payload of the record
    uint64_t value;
};

/// @brief Class that acts as a container for taint info collected by TaintTracker class.
///        Partially implements std::vector interface
class InputTaint
{
  public:
    InputTaint() = default;
    ~InputTaint() = default;
    InputTaint(const InputTaint &) = delete;
    InputTaint &operator=(const InputTaint &) = delete;
    InputTaint(InputTaint &&) = delete;
    InputTaint &operator=(InputTaint &&) = delete;

    // ---------------------------------------------------------------------------------------------
    // Public Methods

    /// @brief Implement std::vector::push_back
    void push_back(const taint_entry_t &entry) { entries.push_back(entry); }
    /// @brief Implement std::vector::size
    [[nodiscard]] size_t size() const { return entries.size(); }
    /// @brief Implement std::vector::empty
    [[nodiscard]] bool empty() const { return entries.empty(); }

    /// @brief Iterator access operator
    taint_entry_t operator[](size_t index) const { return entries[index]; }

    /// @brief [Non-vector method] Store input taints into a file
    /// @param file_path Path to the output file
    void store_to_file(const char *file_path)
    {
        std::ofstream stream;
        stream.open(file_path, std::ios::binary | std::ios::out);

        // Write all collected entries
        for (const auto &entry : entries) {
            stream.write(reinterpret_cast<const char *>(&entry.type), sizeof(uint8_t));
            stream.write(reinterpret_cast<const char *>(&entry.value), sizeof(uint64_t));
        }

        // Write end-of-trace marker
        auto eot = static_cast<uint8_t>(taint_entry_type_t::TAINT_ENTRY_EOT);
        auto eot_value = 0ULL;
        stream.write(reinterpret_cast<const char *>(&eot), sizeof(uint8_t));
        stream.write(reinterpret_cast<const char *>(&eot_value), sizeof(uint64_t));

        stream.close();
    };

  private:
    // ---------------------------------------------------------------------------------------------
    // Private Attributes
    std::vector<taint_entry_t> entries;
};


================================================
FILE: rvzr/model_dynamorio/backend/include/types/store_log.hpp
================================================

///
/// File: Class representing a log of store operations performed during speculation.
///       Used to be able to undo memory writes upon rollback.
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#pragma once

#include <cstddef>
#include <cstdint>
#include <vector>

/// @brief One store recorded in the StoreLog.
typedef struct {
    // address targeted by the store
    uint64_t addr;
    // value associated with the store -- presumably the data needed to undo it; TODO confirm
    uint64_t val;
    // size of the store -- presumably in bytes; TODO confirm
    size_t size;
    // presumably the speculation nesting level at which the store happened; TODO confirm
    unsigned int nesting_level;
} store_log_entry_t;

/// @brief Thin wrapper around an std::vector of store_log_entry_t that additionally remembers how
/// many of the entries (counted from the front) belong to committed instructions. Entries past
/// that point are in-flight: the store_log is populated before the instruction is actually
/// executed, and the execution might fail.
class StoreLog
{
  public:
    StoreLog() = default;
    ~StoreLog() = default;

    // The log is neither copyable nor movable
    StoreLog(const StoreLog &) = delete;
    StoreLog(StoreLog &&) = delete;
    StoreLog &operator=(const StoreLog &) = delete;
    StoreLog &operator=(StoreLog &&) = delete;

    /// @brief Access the most recent entry (mirrors std::vector::back)
    [[nodiscard]] const store_log_entry_t &back() const
    {
        return entries.back();
    }

    /// @brief Drop the most recent entry (mirrors std::vector::pop_back). If the dropped entry
    /// was a committed one, the committed count shrinks accordingly.
    void pop_back()
    {
        // When the committed count equals the size, the entry being removed is committed
        const size_t size_before = entries.size();
        entries.pop_back();

        if (size_before == last_committed) {
            --last_committed;
        }
    }

    /// @brief Append a new (in-flight) entry (mirrors std::vector::push_back)
    void push_back(const store_log_entry_t &entry)
    {
        entries.push_back(entry);
    }

    /// @brief Total number of entries, committed and in-flight (mirrors std::vector::size)
    [[nodiscard]] size_t size() const
    {
        return entries.size();
    }

    /// @brief Check whether the log holds no entries at all (mirrors std::vector::empty)
    [[nodiscard]] bool empty() const
    {
        return entries.empty();
    }

    /// @brief The last instruction actually committed: every entry now counts as committed.
    void update_committed()
    {
        last_committed = entries.size();
    }

    /// @brief Check whether there are entries past the committed prefix (i.e., in-flight ones).
    [[nodiscard]] bool has_uncommitted() const
    {
        return last_committed < entries.size();
    }

    /// @brief Discard every in-flight entry, keeping only the committed prefix.
    void flush_uncommitted()
    {
        // Removing in-flight entries never touches the committed count
        while (entries.size() > last_committed) {
            entries.pop_back();
        }
    }

  private:
    /// Recorded stores: committed entries first, in-flight entries at the end
    std::vector<store_log_entry_t> entries;
    /// Number of leading entries that are committed
    size_t last_committed = 0;
};


================================================
FILE: rvzr/model_dynamorio/backend/include/types/trace.hpp
================================================
///
/// File: Trace entries generated by the tracer
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#pragma once

#include <cstdint>
#include <ostream>

/// @brief Type of trace entries that can be observed
enum class trace_entry_type_t : uint8_t {
    ENTRY_EOT = 0,       // end of trace
    ENTRY_PC = 1,        // executed instruction (addr: pc, size: instruction size)
    ENTRY_READ = 2,      // memory read (addr: accessed address, size: access size)
    ENTRY_WRITE = 3,     // memory write (addr: accessed address, size: access size)
    ENTRY_EXCEPTION = 4, // exception (dumped as faulting address + signal)
    ENTRY_IND = 5,       // indirect control-flow transfer (addr: target)
};

/// @brief Pretty-printer for trace_entry_type_t
/// @param type The entry type to convert
/// @return A short, statically allocated label for the type; "UNKNOWN" if the value does not
///         match any enumerator
static constexpr const char *to_string(const trace_entry_type_t &type)
{
    switch (type) {
    case trace_entry_type_t::ENTRY_EOT:
        return "EOT";
    case trace_entry_type_t::ENTRY_PC:
        return "PC";
    case trace_entry_type_t::ENTRY_READ:
        return "READ";
    case trace_entry_type_t::ENTRY_WRITE:
        return "WRITE";
    case trace_entry_type_t::ENTRY_EXCEPTION:
        return "XCPT";
    case trace_entry_type_t::ENTRY_IND:
        return "IND";
    }

    return "UNKNOWN";
}

/// @brief An entry of an observed trace
struct trace_entry_t {
    // pc for instructions; address for memory accesses; target for indirect calls
    uint64_t addr;
    // instruction size for instructions; memory access size for memory accesses
    uint32_t size;
    // see trace_entry_type_t
    trace_entry_type_t type;
    // unused for now
    uint8_t padding[3]; // NOLINT

    /// @brief Declare a marker to identify traces of this type
    static constexpr char marker = 'T';

    /// @brief Pretty-printing for tracer output
    /// @details Writes one line of the form "[<TYPE>] <details>\n". The formatting flags of the
    ///          stream (e.g., the numeric base) are restored before returning, so that the
    ///          std::hex/std::dec manipulators used here do not leak into the caller's output.
    /// @param out Stream to print to
    void dump(std::ostream &out) const
    {
        // std::hex and std::dec are sticky: remember the caller's flags to restore them later
        const std::ios_base::fmtflags saved_flags = out.flags();

        out << "[" << to_string(type) << "]";

        switch (type) {
        case trace_entry_type_t::ENTRY_EOT:
            // NOTE: the banner carries its own newline, hence an EOT entry is followed by an
            // empty line
            out << "---- END OF TRACE ----\n";
            break;
        case trace_entry_type_t::ENTRY_PC:
            out << " pc: " << std::hex << addr;
            out << "  (instr sz: " << std::dec << size << ")";
            break;
        case trace_entry_type_t::ENTRY_READ:
        case trace_entry_type_t::ENTRY_WRITE:
            out << " addr: " << std::hex << addr;
            out << "  (sz: " << std::dec << size << ")";
            break;
        case trace_entry_type_t::ENTRY_EXCEPTION:
            out << " faulty_addr: " << std::hex << addr;
            out << "  (sig: " << std::dec << size << ")";
            break;
        case trace_entry_type_t::ENTRY_IND:
            out << "  --> target: " << std::hex << addr;
            break;
        }

        out << "\n";

        out.flags(saved_flags);
    }
};


================================================
FILE: rvzr/model_dynamorio/backend/include/util.hpp
================================================
///
/// File: Helper functions for DR model
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#pragma once

#include <cstddef>

#include <dr_api.h> // NOLINT
#include <dr_defines.h>
#include <dr_ir_opnd.h>
#include <dr_ir_utils.h> // NOLINT
#include <drvector.h>

#include "observables.hpp"
#include "types/decoder.hpp"

/// @brief Shorthand for DynamoRIO's instrlist_meta_preinsert
#define INSERT_BEFORE instrlist_meta_preinsert

/// @brief A wrapper around drreg_reserve_register that aborts on failure
/// @param drcontext The drcontext of the current thread
/// @param ilist Current instruction list
/// @param where Current instruction
/// @param permitted The set of registers that can be reserved
/// @param [out] reg Receives the reserved register
/// @return void
void reserve_register_checked(void *drcontext, instrlist_t *ilist, instr_t *where,
                              drvector_t *permitted, DR_PARAM_OUT reg_id_t *reg);

/// @brief A wrapper around drreg_unreserve_register that aborts on failure
/// @param drcontext The drcontext of the current thread
/// @param ilist Current instruction list
/// @param where Current instruction
/// @param reg The register to unreserve
/// @return void
void unreserve_register_checked(void *drcontext, instrlist_t *ilist, instr_t *where, reg_id_t reg);

/// @brief Write to the given address, ignoring any permission check.
/// NOTE: Writing to executable memory might clash with DynamoRIO's code cache, use with caution.
/// @param addr address to write to
/// @param size size of the write
/// @param val pointer to the value to write
/// @param w_size the number of bytes written is stored here (see dr_safe_write)
/// @return true if the write was successful
bool force_write(byte *addr, size_t size, const uint64_t *val, size_t *w_size);

/// @brief Check if an instruction is an indirect call or return to an illegal instruction.
///        This has to be called from _within_ the dispatcher's clean_call to make sure that the
///        runtime value of the target is known.
/// NOTE: On illegal jumps to non-executable memory, DynamoRIO will still fetch the corresponding
///       basic block and mark it as DR_MEMPROT_PRETEND_WRITE, which forbids writing to it from a
///       clean call. This is problematic for rollbacks, as speculative code might be jumping to
///       non-executable pages that we need to rollback after the speculation ends.
/// NOTE: This operation is not cheap, use with caution.
/// @param instr The instruction to check
/// @param mc Machine context -- presumably the application state at the time of the clean call
///           (TODO confirm against the implementation)
/// @param dc Presumably the DynamoRIO drcontext of the current thread (TODO confirm)
/// @param decoder Decoder instance -- presumably used to decode the code at the jump target
///                (TODO confirm)
/// @return true if the instruction is such an illegal jump
bool is_illegal_jump(instr_obs_t instr, dr_mcontext_t *mc, void *dc, Decoder &decoder);

/// @brief Flush DynamoRIO's basic-block cache. This is needed when transitioning from
/// non-instrumented code to instrumented code, as any shared code (e.g., libc) might be cached
/// and therefore inaccessible for instrumentation.
void flush_bb_cache();


================================================
FILE: rvzr/model_dynamorio/backend/logger.cpp
================================================
///
/// File: Implementation for logger
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#include <cassert>
#include <cstdint>
#include <cstring>
#include <string>

#include <dr_api.h> // NOLINT
#include <dr_defines.h>
#include <dr_events.h>
#include <dr_ir_instr.h>
#include <dr_ir_opnd.h>
#include <dr_ir_utils.h>
#include <dr_tools.h>

#include "logger.hpp"

// =================================================================================================
// Local helper functions
// =================================================================================================

/// @brief Find the module that contains the given pc, and the offset of the pc within it.
/// @param pc Address to look up
/// @return A pair {module path, offset of pc from the module start}. If the path does not fit
///         into debug_trace_entry_t::loc.module_name (leaving room for one terminating '\0'),
///         only its trailing part is returned. If DynamoRIO does not know any module containing
///         the pc, the pair is {"Unknown Module", 0}.
static std::pair<std::string, size_t> get_module(uint64_t pc)
{
    module_data_t *mod = dr_lookup_module((byte *)pc);
    if (mod == nullptr)
        return {"Unknown Module", 0};

    // Calculate the offset from the beginning of the module.
    auto offset = (size_t)(pc - (pc_t)mod->start);

    // Get the name of the current module.
    // Defensive: constructing an std::string from a null pointer is undefined behavior.
    std::string module_name(mod->full_path != nullptr ? mod->full_path : "");

    // If the name is too long, keep only its last max_path_size characters: the tail of a path
    // (the file name) is its most informative part.
    const size_t max_path_size = sizeof(debug_trace_entry_t::loc.module_name) - 1;
    if (module_name.size() > max_path_size)
        module_name = module_name.substr(module_name.size() - max_path_size);

    // The data returned by dr_lookup_module has to be released by the caller
    dr_free_module_data(mod);
    return {module_name, offset};
}

/// @brief Convert an integer of src_type into a (typically smaller) dst_type, saturating the value
///        at the bounds of dst_type instead of letting it wrap around.
/// @tparam dst_type Destination integer type
/// @tparam src_type Source integer type
/// @param val The value to convert
/// @return val if it is representable in dst_type; the maximum of dst_type if val is too large;
///         the minimum of dst_type if val is too small (e.g., 0 for negative values converted
///         into an unsigned type)
template <typename dst_type, typename src_type>
static constexpr dst_type saturate_cast(const src_type &val)
{
    using dst_limits = std::numeric_limits<dst_type>;

    // Negative values are handled separately: comparing them against an unsigned bound would
    // silently convert them into huge positive numbers.
    if constexpr (std::numeric_limits<src_type>::is_signed) {
        if (val < 0) {
            if constexpr (dst_limits::is_signed) {
                // Both operands are signed here, so the comparison is value-preserving
                return (val < dst_limits::lowest()) ? dst_limits::lowest() : (dst_type)val;
            } else {
                return dst_limits::lowest();
            }
        }
    }

    // From here on val is non-negative
    if (val > dst_limits::max())
        return dst_limits::max();

    return (dst_type)val;
}

// =================================================================================================
// Constructors and Destructors
// =================================================================================================

/// @brief Create a logger and, if logging is enabled, open its output.
/// @param logs_path Location passed to the underlying log when it is opened
/// @param log_level Verbosity of the logger
/// @param print Flag forwarded to the constructor of the underlying log
Logger::Logger(const std::string &logs_path, log_level_t log_level, bool print)
    : log_level(log_level), log(print), cur_nesting_level(0)
{
    // Nothing to open unless is_enabled() reports that logging is active
    if (not is_enabled())
        return;

    log.open(logs_path);
}

/// @brief Clear the underlying log upon destruction.
Logger::~Logger()
{
    log.clear();
}

// =================================================================================================
// Public methods
// =================================================================================================

/// @brief Get the file name reported by the underlying log.
/// @return Reference to the file name held by the underlying log
const std::string &Logger::get_filename() const
{
    return log.get_filename();
}

/// @brief Close the logger by clearing the underlying log (same action as the destructor).
void Logger::close()
{
    log.clear();
}

// =================================================================================================
// Logging methods
// =================================================================================================

/// @brief Log the execution of an instruction: two register-dump entries and, at LOG_DISASM
///        verbosity or higher, a location entry (module name + offset) to aid disassembly.
/// @param instr The instruction being executed (only its pc is used)
/// @param mc Machine context from which the register values are read
/// @param nesting_level Current nesting level; it is saturated to 8 bits and attached to all the
///        entries logged until the next call of this method
void Logger::log_instruction(instr_obs_t instr, dr_mcontext_t *mc, unsigned int nesting_level)
{
    if (not is_enabled())
        return;

    // Remember the nesting level: the other log_* methods attach it to their entries
    cur_nesting_level = saturate_cast<uint8_t>(nesting_level);

    // First part of the register dump; it also carries the pc
    debug_trace_entry_t reg_dump = {.type = debug_trace_entry_type_t::ENTRY_REG_DUMP,
                                    .nesting_level = cur_nesting_level,
                                    .regs{
                                        .xax = mc->xax,
                                        .xbx = mc->xbx,
                                        .xcx = mc->xcx,
                                        .xdx = mc->xdx,
                                        .xsi = mc->xsi,
                                        .xdi = mc->xdi,
                                        .pc = instr.pc,
                                    }};
    log.push_back(reg_dump);

    // Second part of the register dump
    debug_trace_entry_t reg_dump_ext = {.type = debug_trace_entry_type_t::ENTRY_REG_DUMP_EXTENDED,
                                        .nesting_level = cur_nesting_level,
                                        .regs_2{
                                            .rsp = mc->rsp,
                                            .rbp = mc->rbp,
                                            .flags = mc->xflags,
                                            .r8 = mc->r8,
                                            .r9 = mc->r9,
                                            .r10 = mc->r10,
                                            .r11 = mc->r11,
                                        }};
    log.push_back(reg_dump_ext);

    // The location of the instruction is emitted only when disassembly support is requested
    if (log_level < LOG_DISASM)
        return;

    // Ask DynamoRIO which module contains the pc
    const auto &[mod_name, mod_offset] = get_module(instr.pc);
    assert(mod_name.size() <= sizeof(debug_trace_entry_t::loc.module_name));

    debug_trace_entry_t loc_entry = {.type = debug_trace_entry_type_t::ENTRY_LOC,
                                     .nesting_level = cur_nesting_level,
                                     .loc{
                                         .offset = mod_offset,
                                         .module_name = {'\0'},
                                     }};
    // Fill the (zero-initialized) name buffer of the entry with the recovered module name
    std::copy(mod_name.begin(), mod_name.end(), loc_entry.loc.module_name.begin());
    log.push_back(loc_entry);
}

/// @brief Log a memory access together with the current content of the accessed memory.
/// @details Accesses larger than 64 bits (e.g., from vector instructions) are split into several
///          entries, each covering at most 8 bytes. The logged value is zero-extended when fewer
///          than 8 bytes are read; if the memory cannot be read, the value is set to the magic
///          marker 0xDEADBEEFDEADBEEF.
/// @param is_write true for writes, false for reads
/// @param address Start address of the access
/// @param size Total size of the access in bytes
void Logger::log_mem_access(bool is_write, void *address, uint64_t size)
{
    if (not is_enabled())
        return;

    // Magic value that marks failed reads in the log.
    constexpr uint64_t failed_read_marker = 0xDEADBEEFDEADBEEF;

    auto cur_address = (uint64_t)address;
    uint64_t remaining_size = size;

    // Vector instructions can read/write more than 64 bits: translate these cases into multiple
    // 64-bit entries.
    while (remaining_size > 0) {
        const uint64_t cur_size = std::min(remaining_size, sizeof(uint64_t));

        // Read the current memory value. The destination starts zeroed so that the bytes beyond
        // cur_size are well-defined for short reads (instead of carrying pieces of the marker).
        uint64_t val = 0;
        size_t r_size = 0;
        if (!dr_safe_read((byte *)cur_address, cur_size, &val, &r_size))
            val = failed_read_marker;

        // NOTE(review): every chunk reports the size of the whole access rather than the size of
        // the chunk; this is preserved as-is -- confirm it matches what the log consumer expects.
        log.push_back({.type = is_write ? debug_trace_entry_type_t::ENTRY_WRITE
                                        : debug_trace_entry_type_t::ENTRY_READ,
                       .nesting_level = cur_nesting_level,
                       .mem{
                           .address = cur_address,
                           .value = val,
                           .size = size,
                       }});

        cur_address += cur_size;
        remaining_size -= cur_size;
    }
}

/// @brief Log an exception (signal number and accessed address).
/// @param siginfo Signal information provided by DynamoRIO
void Logger::log_exception(dr_siginfo_t *siginfo)
{
    if (not is_enabled())
        return;

    // Build the entry first, then hand it over to the log
    debug_trace_entry_t xcpt_entry = {.type = debug_trace_entry_type_t::ENTRY_EXCEPTION,
                                      .nesting_level = cur_nesting_level,
                                      .xcpt{
                                          .signal = siginfo->sig,
                                          .address = (uint64_t)siginfo->access_address,
                                      }};
    log.push_back(xcpt_entry);
}

/// @brief Log the creation of a checkpoint. Emitted only at LOG_SPEC verbosity or higher.
/// @param rollback_pc Value stored in the rollback_pc field of the entry
/// @param cur_window_size Value stored in the cur_window_size field of the entry
/// @param cur_store_log_size Value stored in the cur_store_log_size field of the entry
void Logger::log_checkpoint(pc_t rollback_pc, uint64_t cur_window_size, size_t cur_store_log_size)
{
    if (log_level < LOG_SPEC)
        return;

    debug_trace_entry_t checkpoint_entry = {.type = debug_trace_entry_type_t::ENTRY_CHECKPOINT,
                                            .nesting_level = cur_nesting_level,
                                            .checkpoint{
                                                .rollback_pc = rollback_pc,
                                                .cur_window_size = cur_window_size,
                                                .cur_store_log_size = cur_store_log_size,
                                            }};
    log.push_back(checkpoint_entry);
}

void Logger::log_rollback(unsigned nesting, pc_t rollback_pc)
{
    if (log_level < LOG_SPEC)
        return;

    log.push_back({.type = debug_trace_entry_type_t::ENTRY_ROLLBACK,
                   .nesting_level = cur_nesting_level,
                   .rollback{
                       .nesting = nesting,
                       .rollback_pc = rollback_pc,
                   }});
}

void Logger::log_rollback_store(uint64_t addr, uint64_t val, size_t size, uint64_t nesting_level)
{
    if (log_level < LOG_SPEC)
        return;

    log.push_back({.type = debug_trace_entry_type_t::ENTRY_ROLLBACK_STORE,
                   .nesting_level = cur_nesting_level,
                   .rollback_store{
                       .addr = addr,
                       .val = val,
                       .size = size,
                       .nesting_level = nesting_level,
                   }});
}

void Logger::log_eot()
{
    if (not is_enabled())
        return;

    log.push_back({.type = debug_trace_entry_type_t::ENTRY_EOT});
}


================================================
FILE: rvzr/model_dynamorio/backend/model.cpp
================================================
///
/// File: DynamoRIO client entry point and instrumentation orchestrator
///
/// This file implements the main DynamoRIO client (dr_client_main) and coordinates
/// the instrumentation lifecycle. The file is responsible for detecting when to start/stop
/// instrumentation of the target function based on its name. It also registers event callbacks
/// for module loading, basic block transformation, and instruction-level instrumentation.
/// The callbacks transfer control to the Dispatcher class, which manages the rest of
/// the model's logic.
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#include <cstddef>
#include <cstdio>
#include <cstdlib>
#include <stdexcept>
#include <string>

#include <dr_api.h> // NOLINT
#include <dr_defines.h>
#include <dr_events.h>
#include <dr_tools.h>
#include <drmgr.h>
#include <drsyms.h>
#include <drutil.h>
#include <drwrap.h>
#include <drx.h>

#include "cli.hpp"
#include "dispatcher.hpp"
#include "factory.hpp"
#include "util.hpp"

using std::size_t;
using std::string;

/// @brief Pointer to the dispatcher instance. It is created in dr_client_main and released in
///        the exit callback (event_exit).
/// @note We have to use a global pointer to share state (tracer, speculator, state of the
///       instrumentation) with the callbacks. This is the reason for NOLINT as well.
std::unique_ptr<Dispatcher> glob_dispatcher = nullptr; // NOLINT

namespace dr_model
{

static void dr_model_del() noexcept;

// =================================================================================================
// State machine of instrumentation
// =================================================================================================

/// @brief Class holding information about the function to instrument and managing the state of the
/// instrumentation process.
class InstrumentationStateMachine
{
  public:
    /// @brief Create the state machine for a given target function.
    /// @param name_ Name of the function to instrument
    /// @note The constructor is explicit so that a string is never implicitly converted into a
    ///       state machine.
    explicit InstrumentationStateMachine(std::string name_) : name(std::move(name_)) {}
    ~InstrumentationStateMachine() = default;
    InstrumentationStateMachine(const InstrumentationStateMachine &) = delete;
    InstrumentationStateMachine &operator=(const InstrumentationStateMachine &) = delete;
    InstrumentationStateMachine(InstrumentationStateMachine &&) = delete;
    InstrumentationStateMachine &operator=(InstrumentationStateMachine &&) = delete;

    /// @brief Name of the function to instrument
    std::string name;

    /// @brief Whether DynamoRIO is currently executing inside the instrumented function.
    bool in_function = false;

    /// @brief Record the entry point of the instrumented function.
    ///        Asserts that no entry point has been registered before.
    /// @param pc First pc of the instrumented function
    void register_entry_pc(app_pc pc)
    {
        DR_ASSERT_MSG(not entry_found, "Function entry pc already registered");
        entry_pc = pc;
        entry_found = true;
    }

    /// @brief Check whether the given pc is the registered entry point.
    /// @return false if no entry point has been registered yet
    bool is_entry_pc(byte const *pc) const { return entry_found and pc == entry_pc; }

    /// @brief Record the exit point of the instrumented function.
    ///        Asserts that no exit point has been registered before.
    /// @param pc First pc executed after the instrumented function returns
    void register_exit_pc(app_pc pc)
    {
        DR_ASSERT_MSG(not exit_found, "Function exit pc already registered");
        exit_pc = pc;
        exit_found = true;
    }

    /// @brief Check whether the given pc is the registered exit point.
    /// @return false if no exit point has been registered yet
    bool is_exit_pc(byte const *pc) const { return exit_found and pc == exit_pc; }

    /// @brief Handle reaching the entry point of the instrumented function.
    /// @param drcontext The drcontext of the current thread
    /// @return true on first call (to trigger code cache flush, which will cause re-execution),
    ///         false afterwards
    bool start_instrumentation(void *drcontext)
    {
        DR_ASSERT_MSG(in_function == false,
                      "[ERROR] Recursive calls to the instrumented function are not supported.");
        in_function = true;

        // Flush all code cache: we might want to instrument basic blocks that have already
        // been translated (e.g. libc)
        if (not entry_flush_done) {
            flush_bb_cache();
            entry_flush_done = true;
            in_function = false;

            // quick return: the flush will cause a re-instrumentation, so this function will be
            // called again immediately after this return
            return true;
        }

        // The dispatcher is started the first time we instrument the function,
        // and restarted on every later entry.
        if (not glob_dispatcher->is_initialized) {
            glob_dispatcher->start();
        } else {
            glob_dispatcher->restart();
        }

        // Also, if this is the first time we instrument the function, we have to
        // identify the exit pc by inspecting the return address on the stack
        // (we assume that the function is always called from the same location, hence
        // this is done only once)
        if (not exit_found) {
            dr_mcontext_t mc = {sizeof(mc), DR_MC_ALL};
            dr_get_mcontext(drcontext, &mc);
            // At function entry, the stack pointer points to the return address
            register_exit_pc(*((app_pc *)mc.xsp));
        }
        return false;
    }

    /// @brief Handle reaching the exit point of the instrumented function: leave the
    ///        "in function" state and let the dispatcher instrument the exit.
    /// @param drcontext The drcontext of the current thread
    /// @param bb Basic block that contains the exit instruction
    /// @param instr The exit instruction (the first one after the function returns)
    void end_instrumentation(void *drcontext, instrlist_t *bb, instr_t *instr)
    {
        DR_ASSERT_MSG(in_function == true,
                      "[ERROR] Found function exit pc while not in the function.");
        in_function = false;
        glob_dispatcher->instrument_exit(drcontext, bb, instr);
    }

  private:
    /// @brief First pc executed when entering the instrumented function. This is populated
    /// dynamically by `event_module_load` based on symbol resolution.
    app_pc entry_pc = nullptr;
    /// @brief Whether the function entry point has been found.
    bool entry_found = false;
    /// @brief The first time the entry point is executed, we flush the code cache, but only once.
    /// This flag tracks whether we already did it.
    bool entry_flush_done = false;
    /// @brief First pc executed after the instrumented function. This is populated dynamically once
    /// we reach a call to the instrumented function by inspecting the return address on the stack.
    app_pc exit_pc = nullptr;
    /// @brief Whether the function exit point has been found at least once.
    /// @note Currently we assume that the exit point is always the same, that is the function
    ///       is always called by the same instruction.
    bool exit_found = false;
};

/// @brief State machine instance. It is created in dr_client_main and released in dr_model_del.
/// @note We have to use a global pointer since it is the only way to make it accessible from
///       DynamoRIO callbacks. This is the reason for NOLINT as well.
/// NOLINTNEXTLINE(cppcoreguidelines-avoid-non-const-global-variables)
static std::unique_ptr<InstrumentationStateMachine> instrumentation_state_machine = nullptr;

// =================================================================================================
// Event callbacks
// =================================================================================================

/// @brief Callback executed before loading a module.
///        This callback is responsible for detecting the presence of the function to instrument.
///        It checks if the module being loaded contains the function to instrument, and if so,
///        communicates its address to Dispatcher, so that is knows when
///        to start the instrumentation (see `event_instrumentation_start`).
/// @param unused
/// @param module_ Pointer to the module data
/// @param unused
/// @return void
static void event_module_load(void * /*drcontext*/, const module_data_t *module_, bool /*loaded*/)
{
    size_t offset = 0;
    const char *symbol = instrumentation_state_machine->name.c_str();
    const drsym_error_t sym_res =
        drsym_lookup_symbol(module_->full_path, symbol, &offset, DRSYM_DEMANGLE);
    if (sym_res == DRSYM_SUCCESS) {
        instrumentation_state_machine->register_entry_pc(module_->start + offset);
    }
}

/// @brief Callback executed at the first instrumentation stage:
///        application-to-application transformation.
///        The implementation expands string ops and scatter/gather
///        into a sequence of normal memory references, and aborts if either expansion fails.
/// @param drcontext The drcontext of the current thread
/// @param unused (tag)
/// @param bb The basic block to be transformed
/// @param unused (for_trace)
/// @param unused (translating)
/// @return BB emitted state (dr_emit_flags_t)
static dr_emit_flags_t event_bb_app2app(void *drcontext, void * /*tag*/, instrlist_t *bb,
                                        bool /*for_trace*/, bool /*translating*/)
{
    // Both expansions are always attempted, even if the first one fails
    const bool rep_string_ok = drutil_expand_rep_string(drcontext, bb);
    const bool scatter_gather_ok = drx_expand_scatter_gather(drcontext, bb, nullptr);

    if (!(rep_string_ok && scatter_gather_ok)) {
        dr_printf("ERROR: failed to expand string ops or scatter/gather\n");
        dr_abort();
    }
    return DR_EMIT_DEFAULT;
}

/// @brief Callback executed at the third instrumentation stage: instrumentation insertion.
///        It is invoked for every (post-expanded) instruction in the basic block. The entry and
///        exit pcs of the target function drive the instrumentation state machine; every other
///        instruction is forwarded to Dispatcher::instrument_instruction.
/// @param drcontext The drcontext of the current thread
/// @param unused (tag)
/// @param bb Parent basic block
/// @param instr The instruction to instrument
/// @param unused (for_trace)
/// @param unused (translating)
/// @param unused (user_data)
/// @return BB emitted state (dr_emit_flags_t)
static dr_emit_flags_t event_bb_instrumentation(void *drcontext, void * /*tag*/, instrlist_t *bb,
                                                instr_t *instr, bool /*for_trace*/,
                                                bool /*translating*/, void * /*user_data*/)
{
    auto &state_machine = *instrumentation_state_machine;
    const app_pc cur_pc = instr_get_app_pc(instr);

    // Function entry: start_instrumentation returns true when it flushed the code cache, in
    // which case we return early and wait for the re-execution. Otherwise we fall through: the
    // first instruction of the target function is instrumented like all the others.
    if (state_machine.is_entry_pc(cur_pc) && state_machine.start_instrumentation(drcontext)) {
        return DR_EMIT_DEFAULT;
    }

    // Function exit: add the corresponding callback and stop here. This instruction is the
    // first one after the return, i.e., it is already outside of the instrumented function.
    if (state_machine.is_exit_pc(cur_pc)) {
        state_machine.end_instrumentation(drcontext, bb, instr);
        return DR_EMIT_DEFAULT;
    }

    // Regular instruction: let the dispatcher add a clean call to its dispatch callback, which
    // will forward the call to the service modules
    return glob_dispatcher->instrument_instruction(drcontext, bb, instr);
}

/// @brief Callback executed upon exceptions (signals)
/// @param drcontext The drcontext of the current thread
/// @param siginfo Pointer to the signal data
/// @return DR_SIGNAL_REDIRECT if the dispatcher handled the exception; otherwise
///         DR_SIGNAL_DELIVER, i.e., the default handling (delivery to the application)
static dr_signal_action_t event_signal(void *drcontext, dr_siginfo_t *siginfo)
{
    return glob_dispatcher->handle_exception(drcontext, siginfo) ? DR_SIGNAL_REDIRECT
                                                                 : DR_SIGNAL_DELIVER;
}

/// @brief Callback executed before exiting the application.
///        It finalizes the dispatcher, flushes stdout, destroys the dispatcher, and finally
///        tears down the DR extensions. The order of these steps matters: the dispatcher is
///        finalized and destroyed before the extensions are closed.
/// @return void
static void event_exit()
{
    // There is a possibility that the tracing process has not been finalized
    // because the traced function has not been called
    glob_dispatcher->finalize();

    // Make sure we've sent all the collected data
    fflush(stdout);

    // Delete the dispatcher
    glob_dispatcher.reset();

    // Unregister the callbacks and close the DR extensions
    dr_model_del();
}

// =================================================================================================
// Model constructor and destructor
// =================================================================================================

/// @brief Constructor of the DR model.
///        The function initializes the DR extensions and registers callbacks.
/// @return void
/// @throw std::runtime_error if any of the DR extensions fails to start, or if a callback
///        cannot be registered
static void dr_model_init()
{
    // Start DR extensions
    if (!drmgr_init())
        throw std::runtime_error("ERROR: failed to start drmgr\n");
    if (!drutil_init())
        throw std::runtime_error("ERROR: failed to start drutil\n");
    if (!drx_init())
        throw std::runtime_error("ERROR: failed to start drx\n");
    if (!drwrap_init())
        throw std::runtime_error("ERROR: failed to start drwrap\n");
    if (drsym_init(0) != DRSYM_SUCCESS)
        throw std::runtime_error("ERROR: failed to start drsym\n");

    // Register callbacks
    if (!drmgr_register_module_load_event(event_module_load))
        throw std::runtime_error("ERROR: failed to register a callback\n");
    if (!drmgr_register_bb_app2app_event(event_bb_app2app, nullptr))
        throw std::runtime_error("ERROR: failed to register a callback\n");
    if (!drmgr_register_bb_instrumentation_event(nullptr, event_bb_instrumentation, nullptr))
        throw std::runtime_error("ERROR: failed to register a callback\n");
    // The signal callback is checked like the others: without it, exceptions would never reach
    // the dispatcher and the failure would go unnoticed
    if (!drmgr_register_signal_event(event_signal))
        throw std::runtime_error("ERROR: failed to register a callback\n");

    // NOTE: dr_register_exit_event does not report failures
    dr_register_exit_event(event_exit);
}

/// @brief Destructor of the DR model.
///        The function unregisters callbacks and closes the DR extensions.
/// @return void
void dr_model_del() noexcept
{
    drmgr_unregister_module_load_event(event_module_load);
    drmgr_unregister_bb_app2app_event(event_bb_app2app);
    drmgr_unregister_bb_insertion_event(event_bb_instrumentation);

    drsym_exit();
    drwrap_exit();
    drx_exit();
    drutil_exit();
    drmgr_exit();

    instrumentation_state_machine.reset();
}

} // namespace dr_model

// =================================================================================================
// Model entry point
// =================================================================================================

/// @brief Entry point of the DR model.
///        The function parses the CLI arguments, creates the dispatcher and the instrumentation
///        state machine, and then starts the DR extensions and registers the callbacks.
///        If one of the listing options is set, it only prints the requested list and returns.
/// @param _ Unused
/// @param argc Number of CLI arguments
/// @param argv CLI arguments
/// @return void
DR_EXPORT void dr_client_main(client_id_t /* client_id */, int argc, const char **argv)
{
    cli_args_t parsed_args = {};
    parse_cli(argc, argv, parsed_args);

    // Helper for the listing modes: print one name per line
    const auto print_names = [](const auto &names) {
        for (const auto &entry_name : names) {
            dr_printf("%s\n", entry_name.c_str());
        }
    };

    // Listing modes: print the available tracers/speculators and skip the model setup entirely
    if (parsed_args.list_tracers) {
        print_names(get_tracer_list());
        return;
    }
    if (parsed_args.list_speculators) {
        print_names(get_speculator_list());
        return;
    }

    // The dispatcher has to exist before the callbacks are registered, as they access it.
    // NOTE(review): the dispatcher receives a pointer to a local variable of this function;
    // presumably it copies what it needs in its constructor -- confirm that it does not keep
    // the pointer around.
    glob_dispatcher = std::make_unique<Dispatcher>(&parsed_args);

    // Same for the state machine that tracks the target function
    dr_model::instrumentation_state_machine =
        std::make_unique<dr_model::InstrumentationStateMachine>(parsed_args.instrumented_func);

    // Start the DR extensions and register the callbacks
    dr_model::dr_model_init();
}


================================================
FILE: rvzr/model_dynamorio/backend/speculator_abc.cpp
================================================
///
/// File: Abstract interface to be implemented by all speculators.
///       For implementations of concrete speculators, see speculators/*.cpp files.
///
///      A speculator is a component that modifies the execution process of a test case when it
///      runs on the contract model (e.g., it can emulate misprediction of branches).
///      As such, speculators implement execution clauses of different contracts.
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#include <algorithm>
#include <array>
#include <cstdint>

#include <dr_api.h>
#include <dr_ir_opcodes_x86.h>
#include <dr_ir_opnd.h>
#include <dr_os_utils.h>
#include <memory>

#include "dr_events.h"
#include "dr_ir_instr.h"
#include "dr_tools.h"
#include "observables.hpp"
#include "speculator_abc.hpp"
#include "util.hpp"

// =================================================================================================
// Local helper functions
// =================================================================================================

// Opcodes that are treated as speculation barriers by is_speculation_barrier().
// NOTE: the array size in the type must be kept in sync with the number of listed opcodes.
//
// See Intel Manual https://cdrdv2.intel.com/v1/dl/getContent/671200
// chapter 10.3 - Serializing Instructions.
static constexpr const std::array<uint64_t, 35> serializing_opcodes = {
    // Non-privileged memory-ordering instructions
    OP_lfence, OP_mfence, OP_sfence,
    // Privileged serializing instructions
    // TODO: add MOV CR (except CR8)
    OP_invd, OP_invept, OP_invlpg, OP_invvpid, OP_lgdt, OP_lidt, OP_lldt, OP_ltr, OP_wbinvd,
    OP_wrmsr,
    // Non-privileged serializing instructions
    OP_cpuid, OP_iret, OP_rsm, OP_serialize,
    // TSX/RTM instructions (not tracked by DynamoRIO).
    OP_xbegin, OP_xabort, OP_xend, OP_xtest,
    // XSAVE/XRESTORE instructions (not tracked by DynamoRIO).
    OP_xsave32, OP_xsave64, OP_xsavec32, OP_xsavec64, OP_xsaves32, OP_xsaves64, OP_xsaveopt32,
    OP_xsaveopt64, OP_xrstor32, OP_xrstor64, OP_xrstors32, OP_xrstors64,
    // Other special instructions
    OP_hlt,
    // NOTE: syscalls are not instrumented by Dynamorio, this makes sure that speculation is aborted
    // on speculative syscall instructions.
    OP_syscall};

/// @brief Tell whether an opcode belongs to the list of speculation barriers
/// @param opcode Opcode of the instruction being executed
/// @return true if the opcode is listed in serializing_opcodes
static bool is_speculation_barrier(const uint64_t opcode)
{
    const auto last = serializing_opcodes.end();
    return std::find(serializing_opcodes.begin(), last, opcode) != last;
}

// =================================================================================================
// Public Methods
// =================================================================================================
/// @brief Allow the speculator to start new speculative paths (see skip_speculation)
void SpeculatorABC::enable()
{
    enabled = true;
}

/// @brief Prevent the speculator from starting new speculative paths (see skip_speculation)
void SpeculatorABC::disable()
{
    enabled = false;
}

/// @brief Decide whether a new speculative path must NOT be started
/// @return true if the speculator is disabled, or if the nesting limit or the speculation
///         window limit has already been reached
bool SpeculatorABC::skip_speculation() const
{
    const bool nesting_exhausted = nesting >= max_nesting;
    const bool window_exhausted = spec_window >= max_spec_window;
    return not enabled or nesting_exhausted or window_exhausted;
}

/// @brief Save the current machine state so that a speculative path can later be undone
/// @param mc Machine context to snapshot
/// @param pc Address at which execution resumes after the rollback
void SpeculatorABC::checkpoint(dr_mcontext_t *mc, pc_t pc)
{
    // snapshot the registers together with the rollback address and the current window size
    const checkpoint_t snapshot = {.rollback_pc = pc, .spec_window = spec_window, .mc = *mc};
    checkpoints.push_back(snapshot);
    logger.log_checkpoint(pc, spec_window, store_log.size());

    // the taint tracker keeps its own checkpoint stack (current instruction not included)
    taint_tracker.checkpoint(false);

    // update the state machine that tracks the speculation process
    nesting += 1;
    in_speculation = true;
}

/// @brief Undo the innermost speculative path: restore the registers saved by the last
///        checkpoint and revert every store logged at the current nesting level.
/// @param mc Machine context that receives the checkpointed register state
/// @return Address at which execution must resume (the checkpoint's rollback PC)
/// @note Aborts the process (dr_abort) if there is no checkpoint, if a store cannot be
///       reverted, or if the bookkeeping is inconsistent once speculation has fully ended.
pc_t SpeculatorABC::rollback(dr_mcontext_t *mc)
{
    // restore the last checkpoint
    if (checkpoints.empty()) {
        dr_printf("[ERROR] SpeculatorABC::rollback: no checkpoints to rollback\n");
        dr_abort();
    }
    const checkpoint_t checkpoint = checkpoints.back();
    checkpoints.pop_back();
    *mc = checkpoint.mc;
    spec_window = checkpoint.spec_window;

    // undo all store operations performed during speculation (newest first)
    while (not store_log.empty()) {
        const auto store = store_log.back();

        // Rollback only entries of the last (nested) speculative window
        if (store.nesting_level < nesting)
            break;

        // Try restoring the previous value in memory.
        size_t w_size = 0;
        const bool success = dr_safe_write((byte *)store.addr, store.size, &store.val, &w_size);
        logger.log_rollback_store(store.addr, store.val, w_size, store.nesting_level);

        // The rollback should always be successful.
        // NOTE: The following cases are already handled elsewhere:
        //       1. Rollback of an invalid store.
        //            - stores to non-valid memory are handled by handle_mem_access()
        //            - stores to non-writable memory cause an exception, and their
        //            corresponding entries are flushed by handle_exception()
        //       2. Rollback after faulty indirect call/ret.
        //            - should never be executed, handled by handle_instruction()
        if (not success) {
            // If ignoring permissions does not work, we cannot recover.
            // NOTE: every argument is cast to the exact type named by its format specifier;
            //       passing a 64-bit value for "%d" is a varargs type mismatch.
            dr_printf("[ERROR] Failed to rollback store -- addr: %lx  val: %lx  sx: %lu\n",
                      static_cast<unsigned long>(store.addr),
                      static_cast<unsigned long>(store.val),
                      static_cast<unsigned long>(store.size));
            // Read page protections
            uint prot = -1;
            dr_query_memory((byte *)store.addr, nullptr, nullptr, &prot);
            dr_printf("[ERROR] Page prot 0x%x\n", prot);
            dr_abort();
            return 0; // unreachable
        }
        store_log.pop_back();
    }

    // update the state machine that tracks the speculation process
    nesting -= 1;
    if (nesting <= 0) {
        nesting = 0;
        in_speculation = false;
        // Once the outermost path is undone, nothing may be left to consume
        if (not checkpoints.empty() or not store_log.empty()) {
            dr_printf("[ERROR] Speculation ended but there are still %lu checkpoints and %lu "
                      "store logs to consume\n",
                      static_cast<unsigned long>(checkpoints.size()),
                      static_cast<unsigned long>(store_log.size()));
            dr_abort();
        }
    }

    taint_tracker.rollback();
    logger.log_rollback(nesting, checkpoint.rollback_pc);
    return checkpoint.rollback_pc;
}

/// @brief Per-instruction hook: decides whether the current speculative path has to end
/// @param instr Observation of the instruction about to execute
/// @param mc Machine context (restored in place when a rollback happens)
/// @param dc DynamoRIO context, used for decoding
/// @return Rollback address if speculation was terminated, 0 otherwise
pc_t SpeculatorABC::handle_instruction(instr_obs_t instr, dr_mcontext_t *mc, void *dc)
{
    // the last instruction committed: all entries in the store_log are valid
    store_log.update_committed();

    // nothing to terminate outside of speculation
    if (not in_speculation)
        return 0;

    // a speculation barrier ends the path before the window counter is touched
    const bool hit_barrier = is_speculation_barrier(instr.opcode);
    if (hit_barrier)
        return rollback(mc);

    // account for this instruction; the path also ends when the window is exhausted or
    // when the instruction is about to jump/ret to an illegal address
    spec_window += 1;
    if (spec_window >= max_spec_window or is_illegal_jump(instr, mc, dc, decoder))
        return rollback(mc);

    return 0;
}

/// @brief Per-access hook: records the old contents of memory overwritten by speculative
///        stores so that rollback() can restore them
/// @param is_write Whether the access is a store
/// @param address Start address of the access
/// @param size Size of the access in bytes
/// @return false if the old contents could not be read, true otherwise
bool SpeculatorABC::handle_mem_access(bool is_write, void *address, uint64_t size)
{
    // Only speculative stores have to be logged; everything else passes through
    if (not in_speculation or not is_write)
        return true;

    const auto base_address = (uint64_t)address;
    const size_t total_size = size;

    // The store might be bigger than 64 bits (e.g. vector ops): log it in 64-bit chunks
    for (size_t offset = 0; offset < total_size;) {
        const uint64_t chunk_address = base_address + offset;
        const uint64_t chunk_size = std::min(total_size - offset, sizeof(uint64_t));

        // NOTE: on speculative paths, safe reads are the only way to load from memory, since
        // pointers might be invalid.
        uint64_t old_value = 0;
        size_t bytes_read = 0;
        const bool readable =
            dr_safe_read((byte *)chunk_address, chunk_size, (byte *)&old_value, &bytes_read);

        // If the memory access is illegal, the store is bound to fail: rollback.
        if (not readable)
            return false;

        // Remember the previous memory value; it is written back after speculation
        store_log.push_back({
            .addr = chunk_address,
            .val = old_value,
            .size = chunk_size,
            .nesting_level = nesting,
        });

        offset += chunk_size;
    }

    return true;
}

/// @brief Check whether a register is a GPR or lies in the XMM/YMM/ZMM ranges
/// @param reg DynamoRIO register ID
/// @return true for general-purpose and XMM/YMM/ZMM registers
static bool is_supported_reg(const reg_id_t reg)
{
    // Some registers cannot be modified from the API, see DynamoRIO NYI i#3504
    if (reg_is_gpr(reg))
        return true;

    const auto within = [value = static_cast<int>(reg)](const int first, const int last) {
        return value >= first and value <= last;
    };
    return within(DR_REG_START_XMM, DR_REG_STOP_XMM) or
           within(DR_REG_START_YMM, DR_REG_STOP_YMM) or
           within(DR_REG_START_ZMM, DR_REG_STOP_ZMM);
}

static std::pair<instr_t *, byte *> get_load_inst(void *dc, byte *pc, Decoder &decoder)
{
    // Decode the instruction and get its next PC
    instr_t *cur_instr = decoder.get_decoded_instr(dc, pc);
    byte *next_pc = decoder.get_next_pc(dc, pc);

    // Return a nullptr if it's not a load.
    if (not instr_reads_memory(cur_instr))
        return {nullptr, nullptr};

    return {cur_instr, next_pc};
}

/// @brief Exception hook: handles a fault raised while executing a speculative path.
///        If a poison value is configured and the faulting instruction reads memory and
///        writes a supported register, the register is filled with the poison value and the
///        instruction is skipped. In every other case the speculative path is rolled back.
/// @param drcontext DynamoRIO context, used for decoding the faulting instruction
/// @param siginfo Signal information; its mcontext is modified in place
/// @return false if not in speculation (nothing was done), true if execution was redirected
bool SpeculatorABC::handle_exception(void *drcontext, dr_siginfo_t *siginfo)
{
    if (not in_speculation)
        return false; // nothing to do

    // Get faulty instruction's context
    dr_mcontext_t *mc = siginfo->mcontext;

    // Check if we need to poison the destination register. If not, just rollback.
    if (poison_value.has_value()) {
        // Decode the instruction
        // (cur_instr is nullptr when the instruction does not read memory)
        const auto [cur_instr, next_pc] = get_load_inst(drcontext, mc->pc, decoder);

        // Forward poison value
        if (cur_instr != nullptr and instr_num_dsts(cur_instr) > 0) {
            // Get the first destination register
            // TODO: what if the instruction has more than one destination register?
            const opnd_t dst = instr_get_dst(cur_instr, 0);
            // TODO: what if the destination is memory?
            if (opnd_is_reg(dst)) {
                reg_id_t reg = opnd_get_reg(dst);
                // NOTE(review): the widening is applied before the GPR/SIMD check below;
                // confirm that reg_to_pointer_sized() leaves SIMD register IDs untouched.
                reg = reg_to_pointer_sized(reg);
                // Not all registers can be written from the API
                if (is_supported_reg(reg)) {
                    // Create a buffer with the repeated poison value
                    // (64 bytes, i.e. eight 64-bit copies of the poison value)
                    constexpr int max_reg_size = 64;
                    constexpr int n_elems = max_reg_size / sizeof(uint64_t);
                    std::array<uint64_t, n_elems> poison_buf = {};
                    std::fill(poison_buf.begin(), poison_buf.end(), poison_value.value());

                    // Set the destination register to the poison value
                    reg_set_value_ex(reg, mc, (uint8_t *)(poison_buf.data()));
                    // Skip to the next instruction
                    // TODO: what if the instruction is supposed to have other side effects?
                    mc->pc = next_pc;
                    return true; // execution was redirected
                }
            }
        }
    }

    // Reached when no poison value is set, or when the poison could not be forwarded.
    // Flush stores that are in-flight (i.e. were performed by the failing instruction)
    store_log.flush_uncommitted();
    // Perform rollback
    const pc_t newpc = rollback(mc);
    mc->pc = (byte *)newpc;

    return true; // execution was redirected
}


================================================
FILE: rvzr/model_dynamorio/backend/speculators/cond.cpp
================================================
///
/// File: Implementation of the Conditional Branch (COND) Speculator
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#include <optional>

#include <dr_api.h> // NOLINT
#include <dr_defines.h>
#include <dr_ir_decode.h>
#include <dr_ir_instr.h>
#include <dr_ir_opcodes_x86.h>

#include "observables.hpp"
#include "speculator_abc.hpp"
#include "speculators/cond.hpp"
#include "types/decoder.hpp"

// =================================================================================================
// Local helper functions
// =================================================================================================

/// @brief Everything the COND speculator needs to know about a conditional branch
struct BranchInfo {
    /// Address the branch jumps to
    pc_t target;
    /// Address of the instruction that follows the branch
    pc_t fallthrough;
    /// Branch is flagged as a LOOP-type instruction (the speculator decrements RCX for it)
    bool is_loop;
    /// Whether the branch is evaluated as taken in the current machine context
    bool will_jump;
};

/// @brief If the instruction is a conditional branch return its relevant information, otherwise
/// return an empty option.
static std::optional<BranchInfo> get_branch_info(instr_obs_t instr, dr_mcontext_t *mc, void *dc,
                                                 Decoder &decoder)
{
    // Decode the instruction using the shared cache
    instr_t *cur_instr = decoder.get_decoded_instr(dc, (byte *)instr.pc);

    // Not a branch, return empty option
    if (not instr_is_cbr(cur_instr))
        return {};

    // Get the next PC (fallthrough address) from the cache
    byte *next_pc = decoder.get_next_pc(dc, (byte *)instr.pc);

    // Parse branch information
    return BranchInfo{
        .target = (pc_t)instr_get_branch_target_pc(cur_instr),
        .fallthrough = (pc_t)next_pc,
        .is_loop = instr_is_cti_loop(cur_instr),
        .will_jump = instr_jcc_taken(cur_instr, mc->xflags),
    };
}

// =================================================================================================
// Class implementation
// =================================================================================================

/// @brief Per-instruction hook of the COND speculator: on every conditional branch, start a
///        speculative path that follows the direction opposite to the evaluated one
/// @param instr Observation of the instruction about to execute
/// @param mc Machine context
/// @param dc DynamoRIO context
/// @return Address to redirect execution to, or 0 if execution should continue normally
pc_t SpeculatorCond::handle_instruction(instr_obs_t instr, dr_mcontext_t *mc, void *dc)
{
    // The base class goes first: if it terminated speculation, follow its redirection
    const pc_t base_redirect = SpeculatorABC::handle_instruction(instr, mc, dc);
    if (base_redirect != 0)
        return base_redirect;

    // No new speculative path may be started
    if (skip_speculation())
        return 0;

    // Only conditional branches are of interest
    const auto info = get_branch_info(instr, mc, dc, decoder);
    if (not info.has_value())
        return 0;

    // LOOP instructions must also decrement RCX
    if (info->is_loop)
        mc->rcx -= 1;

    // Simulate misprediction: the evaluated direction becomes the rollback address,
    // while execution continues in the opposite direction
    const pc_t correct_pc = info->will_jump ? info->target : info->fallthrough;
    const pc_t mispredicted_pc = info->will_jump ? info->fallthrough : info->target;
    checkpoint(mc, correct_pc);

    // Redirect execution to the next speculative instruction
    return mispredicted_pc;
}


================================================
FILE: rvzr/model_dynamorio/backend/speculators/seq.cpp
================================================
///
/// File: Sequential Speculator; this speculator implements the contract model
///       for the sequential execution of instructions.
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#include "speculator_abc.hpp"
#include "speculators/seq.hpp"

// Nothing here so far; the class identically mirrors the base class

================================================
FILE: rvzr/model_dynamorio/backend/taint_tracker.cpp
================================================
///
/// File: Taint Tracker class
///
/// Performs backward taint analysis during DynamoRIO instrumentation to identify which parts
/// of the test input (registers and memory) influence contract trace observations. Tracks data
/// dependencies through instruction execution, supporting speculative execution via checkpoint/
/// rollback. Used to implement `trace_test_case_with_taints` interface in the DR Model backend,
/// and is therefore tightly coupled with rvzr's InputTaint class.
///
/// The module should only be used when the model is running in `rvzr` mode.
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#include "taint_tracker.hpp"

#include <cstdint>
#include <iomanip>
#include <sstream>
#include <string>
#include <unordered_set>

#include <dr_api.h>        // NOLINT
#include <dr_ir_instr.h>   // NOLINT
#include <dr_ir_opcodes.h> // NOLINT
#include <dr_ir_opnd.h>    // NOLINT
#include <dr_ir_utils.h>   // NOLINT

// End-of-taint marker written to taint output file
// (all 64 bits set, i.e. 0xFFFFFFFFFFFFFFFF)
const uint64_t EOT_MARKER = -1ULL;

// Maximum register ID used by DynamoRIO (register IDs are < 256)
// Used to distinguish register labels from memory address labels
// (any label <= MAX_REG_ID is treated as a register, see label_is_reg)
const unsigned MAX_REG_ID = 255;

// Memory tracking granularity and alignment
// NOTE: QWORD_ALIGN_MASK must stay consistent with MEM_TRACKING_GRANULARITY
const uint64_t MEM_TRACKING_GRANULARITY = 8; // Track memory at 8-byte granularity
const uint64_t QWORD_ALIGN_MASK = ~0x7ULL;   // Mask for 8-byte alignment (0xFFFFFFFFFFFFFFF8)

/// @brief Mapping between DynamoRIO EFLAGS bits and our register IDs
struct FlagMapping {
    // EFLAGS usage bit that is set when an instruction reads the flag
    uint read_flag;
    // EFLAGS usage bit that is set when an instruction writes the flag
    uint write_flag;
    // Register ID under which the flag is tracked (as a source or destination register)
    reg_id_t reg_id;
};

/// @brief Table of all tracked flags
/// Each entry is {read bit, write bit, tracked register ID}; the table is iterated by
/// track_flags() for every tracked instruction.
/// NOLINTNEXTLINE(cppcoreguidelines-avoid-c-arrays, modernize-avoid-c-arrays)
static const FlagMapping FLAG_MAPPINGS[] = {
    {EFLAGS_READ_CF, EFLAGS_WRITE_CF, DR_FLAG_CF}, {EFLAGS_READ_PF, EFLAGS_WRITE_PF, DR_FLAG_PF},
    {EFLAGS_READ_AF, EFLAGS_WRITE_AF, DR_FLAG_AF}, {EFLAGS_READ_ZF, EFLAGS_WRITE_ZF, DR_FLAG_ZF},
    {EFLAGS_READ_SF, EFLAGS_WRITE_SF, DR_FLAG_SF}, {EFLAGS_READ_OF, EFLAGS_WRITE_OF, DR_FLAG_OF},
    {EFLAGS_READ_DF, EFLAGS_WRITE_DF, DR_FLAG_DF},
};

/// @brief Set of opcodes that override dependencies (MOV and LEA variants)
/// Membership is only the first condition checked by is_override_instruction(); the
/// instruction must additionally have exactly one destination register of sufficient width.
static const std::unordered_set<int> OVERRIDE_OPCODES = {
    OP_mov_ld, OP_mov_st, OP_mov_imm, OP_mov_priv, OP_movd,  OP_movq,
    OP_movs,   OP_movsx,  OP_movzx,   OP_movsxd,   OP_movbe, OP_lea,
};

// =================================================================================================
// Helper Functions
// =================================================================================================

/// @brief Map a register to the ID under which it is tracked
/// @param reg The register ID
/// @return The 8-byte variant for general-purpose registers; any other register unchanged
static inline reg_id_t normalize_reg(reg_id_t reg)
{
    // Sub-registers of a GPR are all tracked under the full 64-bit register
    return reg_is_gpr(reg) ? reg_resize_to_opsz(reg, OPSZ_8) : reg;
}

/// @brief Record the registers referenced by a single operand of a tracked instruction
/// @param is_src true if the operand is a source operand, false if it is a destination
/// @param opnd The operand to inspect
/// @param tracked_inst Instruction record that receives the registers
/// @note Register operands go to src_regs/dest_regs. For base+disp memory operands, the
///       base and index registers go to mem_address_regs. All other operand kinds
///       (immediates, PC targets, absolute/PC-relative addresses) reference no register
///       and are ignored.
static inline void track_operand(const bool is_src, const opnd_t opnd,
                                 struct TrackedInstruction *tracked_inst)
{
    // Process register operands
    if (opnd_is_reg(opnd)) {
        const reg_id_t reg = normalize_reg(opnd_get_reg(opnd));
        if (reg == DR_REG_NULL) {
            return;
        }
        if (is_src) {
            tracked_inst->src_regs.insert(reg);
        } else {
            tracked_inst->dest_regs.insert(reg);
        }
        return;
    }

    // Only base+disp memory references carry address registers.
    // NOTE: opnd_get_base()/opnd_get_index() are only defined for base+disp operands;
    //       calling them on absolute or PC-relative address operands would read unrelated
    //       bits of the operand and could record a bogus register.
    if (not opnd_is_base_disp(opnd)) {
        return;
    }

    const reg_id_t base = opnd_get_base(opnd);
    if (base != DR_REG_NULL) {
        tracked_inst->mem_address_regs.insert(normalize_reg(base));
    }

    const reg_id_t index = opnd_get_index(opnd);
    if (index != DR_REG_NULL) {
        tracked_inst->mem_address_regs.insert(normalize_reg(index));
    }
}

/// @brief Record the flags read and written by an instruction as source/destination registers
/// @param eflags EFLAGS usage mask of the instruction
/// @param tracked_inst Instruction record that receives the flag register IDs
static inline void track_flags(const uint eflags, struct TrackedInstruction *tracked_inst)
{
    for (const auto &[read_mask, write_mask, flag_reg] : FLAG_MAPPINGS) {
        const bool is_read = (eflags & read_mask) != 0;
        const bool is_written = (eflags & write_mask) != 0;

        // A flag may be both read and written by the same instruction
        if (is_read) {
            tracked_inst->src_regs.insert(flag_reg);
        }
        if (is_written) {
            tracked_inst->dest_regs.insert(flag_reg);
        }
    }
}

/// @brief Convert DynamoRIO register ID to the encoding expected by rvzr (hardcoded mapping)
/// @param reg DynamoRIO register ID (or one of the DR_FLAG_* IDs used for tracked flags)
/// @return rvzr register ID; RVZR_REG_IGNORED for every register without a mapping
/// @note Only RAX, RBX, RCX, RDX, RSI, RDI, XMM0-7/YMM0-7 and the tracked flags are mapped.
///       XMMn and YMMn share one rvzr ID, and all flags share RVZR_REG_FLAGS.
static RVZRRegId dr_reg_id_to_rvzr_reg_id(reg_id_t reg)
{
    // These IDs must match the offsets in the sandbox, as defined in docs/devel/
    switch (reg) {
    // General-purpose registers
    case DR_REG_RAX:
        return RVZRRegId::RVZR_REG_RAX;
    case DR_REG_RBX:
        return RVZRRegId::RVZR_REG_RBX;
    case DR_REG_RCX:
        return RVZRRegId::RVZR_REG_RCX;
    case DR_REG_RDX:
        return RVZRRegId::RVZR_REG_RDX;
    case DR_REG_RSI:
        return RVZRRegId::RVZR_REG_RSI;
    case DR_REG_RDI:
        return RVZRRegId::RVZR_REG_RDI;
    // Vector registers: the XMM and YMM views of a register map to the same ID
    case DR_REG_XMM0:
    case DR_REG_YMM0:
        return RVZRRegId::RVZR_REG_XMM0;
    case DR_REG_XMM1:
    case DR_REG_YMM1:
        return RVZRRegId::RVZR_REG_XMM1;
    case DR_REG_XMM2:
    case DR_REG_YMM2:
        return RVZRRegId::RVZR_REG_XMM2;
    case DR_REG_XMM3:
    case DR_REG_YMM3:
        return RVZRRegId::RVZR_REG_XMM3;
    case DR_REG_XMM4:
    case DR_REG_YMM4:
        return RVZRRegId::RVZR_REG_XMM4;
    case DR_REG_XMM5:
    case DR_REG_YMM5:
        return RVZRRegId::RVZR_REG_XMM5;
    case DR_REG_XMM6:
    case DR_REG_YMM6:
        return RVZRRegId::RVZR_REG_XMM6;
    case DR_REG_XMM7:
    case DR_REG_YMM7:
        return RVZRRegId::RVZR_REG_XMM7;
    // Flags
    case DR_FLAG_AF:
    case DR_FLAG_CF:
    case DR_FLAG_DF:
    case DR_FLAG_OF:
    case DR_FLAG_PF:
    case DR_FLAG_SF:
    case DR_FLAG_ZF:
        // All tainted flags map to a single taint ID
        return RVZRRegId::RVZR_REG_FLAGS;
    default:
        // The rest of the registers are not used by rvzr; if they get tainted, this is
        // an artifact of the adaptor, and they should be ignored.
        return RVZRRegId::RVZR_REG_IGNORED;
    }
}

/// @brief Check if an instruction is a 64+ bit MOV-like instruction that overrides dependencies
/// @param tracked_inst The tracked instruction to check
/// @param decoder Decoder for instruction analysis
/// @return true if the instruction overrides dependencies
static bool is_override_instruction(const TrackedInstruction *tracked_inst, Decoder *decoder)
{
    // Only MOV and LEA opcodes override dependencies
    auto opcode = static_cast<int>(tracked_inst->instr_obs.opcode);
    if (OVERRIDE_OPCODES.find(opcode) == OVERRIDE_OPCODES.end()) {
        return false;
    }

    // Skip instructions with more than one destination operand
    if (tracked_inst->dest_regs.size() != 1) {
        return false;
    }

    // Check that the destination register is 64-bit or more
    const reg_id_t dest_reg = *tracked_inst->dest_regs.begin();
    if (reg_is_xmm(dest_reg) || reg_is_ymm(dest_reg)) {
        return true;
    }
    if (reg_is_gpr(dest_reg)) {
        instr_t *instr =
            decoder->get_decoded_instr(tracked_inst->dc, (byte *)tracked_inst->instr_obs.pc);
        const int size = opnd_get_size(instr_get_dst(instr, 0));
        return size == OPSZ_8;
    }
    return false;
}

/// @brief Heuristic that classifies a label as a register or as a memory address
/// @param label The label to check
/// @return true if the label does not exceed MAX_REG_ID (treated as a register),
///         false otherwise (treated as a memory address)
/// @note Memory addresses that are not larger than MAX_REG_ID (e.g., in the NULL page)
///       are classified as registers.
static bool label_is_reg(tracked_label_t label)
{
    const bool exceeds_reg_range = label > MAX_REG_ID;
    return not exceeds_reg_range;
}

// =================================================================================================
// Public Methods
// =================================================================================================
/// @brief Start a new tracking session; must not be called while one is in progress
void TaintTracker::enable()
{
    DR_ASSERT(not tracking_in_progress);

    // The sandbox base is unknown at this point; it is captured on the first instruction
    sandbox_base = 0;

    tracking_in_progress = true;
    enabled = true;
}

/// @brief End the tracking session: process the pending instruction (if any), write the
///        collected taints out and disable the tracker
void TaintTracker::finalize()
{
    // The last tracked instruction has not been processed yet
    if (current_instruction) {
        finalize_instruction();
    }

    store_taints();

    tracking_in_progress = false;
    enabled = false;
}

/// @brief Save a copy of the current dependency state on the checkpoint stack
/// @param include_current_inst If true, the pending instruction is finalized first so that
///        its dependencies become part of the saved state
void TaintTracker::checkpoint(bool include_current_inst)
{
    if (not enabled)
        return;

    const bool has_pending_instruction = current_instruction != nullptr;
    if (include_current_inst and has_pending_instruction) {
        finalize_instruction();
    }

    // push_back copies the whole dependency state
    checkpoints.push_back(dependencies);
}

/// @brief Restore the dependency state saved by the most recent checkpoint
/// @note The pending instruction (if any) is finalized before the state is replaced.
void TaintTracker::rollback()
{
    if (not enabled)
        return;
    DR_ASSERT_MSG(not checkpoints.empty(), "TaintTracker::rollback: no checkpoints to rollback");

    // Process the instruction that is still pending
    if (current_instruction) {
        finalize_instruction();
    }

    // Pop the most recent checkpoint and make it the current dependency state
    dependencies = checkpoints.back();
    checkpoints.pop_back();
}

/// @brief Begin tracking a new instruction; the previously tracked one is finalized first
/// @param instr Observation of the instruction
/// @param mc Machine context (may be null); R14 is read from it to capture the sandbox base
/// @param dc DynamoRIO context, stored for later decoding
void TaintTracker::track_instruction(instr_obs_t instr, dr_mcontext_t *mc, void *dc)
{
    if (not enabled)
        return;

    // The sandbox base is taken from R14 while it is still unset (zero)
    const bool base_unknown = sandbox_base == 0;
    if (base_unknown && mc != nullptr) {
        sandbox_base = mc->r14;
    }

    // Close the record of the previous instruction before opening a new one
    if (current_instruction) {
        finalize_instruction();
    }

    // Open a fresh record and fill in its operands
    current_instruction = std::make_unique<TrackedInstruction>();
    current_instruction->instr_obs = instr;
    current_instruction->dc = dc;
    parse_instruction_operands(current_instruction.get());

    // Taint requests belong to a single instruction; start from an empty set
    pending_taint.clear();
}

void TaintTracker::track_memory_access(bool is_write, void *address, uint64_t size)
{
    if (not enabled)
        return;
    DR_ASSERT_MSG(current_instruction != nullptr,
                  "TaintTracker::track_memory_access called before track_instruction");

    // The following logic records the memory address into the list of
    // source/destination memory operands
    // The challenge here is that we track memory at 8-byte granularity, and a memory access
    // may span multiple 8-byte blocks (e.g., a YMM store of 32 bytes).

    // 1. Identify the range of 8-byte blocks accessed
    auto addr = (uint64_t)address;
    const uint64_t end_addr = addr + (size - 1);
    const uint64_t range_start = addr & QWORD_ALIGN_MASK;
    const uint64_t range_end = end_addr & QWORD_ALIGN_MASK;

    // 2. Identify whether it's a read or write, and add to the appropriate set
    std::set<tracked_mem_label_t> *updated_set =
        is_write ? &current_instruction->dest_mems : &current_instruction->src_mems;

    // 3. Add all addresses to tracking
    for (uint64_t i = range_start; i <= range_end; i += MEM_TRACKING_GRANULARITY) {
        updated_set->insert(i);
    }
}

/// @brief Request tainting of the labels exposed by an observation of the current instruction
/// @param value_type Kind of the observed value (PC, memory address, or end of trace)
/// @note The labels are only queued in pending_taint here; they are resolved when the
///       instruction is finalized.
void TaintTracker::taint(taint_entry_type_t value_type)
{
    if (not enabled or current_instruction == nullptr)
        return;

    if (value_type == taint_entry_type_t::TAINT_ENTRY_PC) {
        // For PC: RIP is tainted only by conditional/unconditional branches
        instr_t *decoded = decoder.get_decoded_instr(current_instruction->dc,
                                                     (byte *)current_instruction->instr_obs.pc);
        const bool is_branch = instr_is_cbr(decoded) || instr_is_ubr(decoded);
        if (is_branch) {
            pending_taint.insert(static_cast<tracked_label_t>(DR_REG_RIP));
        }
    } else if (value_type == taint_entry_type_t::TAINT_ENTRY_MEM) {
        // For MEM: every register used to form a memory address is tainted
        for (const auto &address_reg : current_instruction->mem_address_regs) {
            pending_taint.insert(static_cast<tracked_label_t>(address_reg));
        }
    }
    // TAINT_ENTRY_EOT (end of trace) requires no action
}

void TaintTracker::finalize_instruction()
{
    DR_ASSERT_MSG(current_instruction != nullptr,
                  "TaintTracker::finalize_instruction called before track_instruction");

    // Extract dependencies of the tracked instruction
    add_dependencies(current_instruction.get());

    // Update taints - propagate dependencies to tainted labels
    for (const auto &label : pending_taint) {
        std::set<tracked_label_t> tainted_values;

        // Check if label is a memory address (high bit set or > max register ID)
        // Register IDs are typically small (< 256), memory addresses are large
        if (label_is_reg(label)) {
            auto it = dependencies.reg.find(static_cast<tracker_reg_label_t>(label));
            if (it != dependencies.reg.end()) {
                tainted_values = it->second;
            } else {
                tainted_values.insert(label);
            }
        } else {
            auto it = dependencies.mem.find(label);
            if (it != dependencies.mem.end()) {
                tainted_values = it->second;
            } else {
                tainted_values.insert(label);
            }
        }

        tainted_labels.insert(tainted_values.begin(), tainted_values.end());
    }
    dbg_print_taints();

    // Clear dependencies of overwritten registers
    // NOTE: this must be done *after* the taint update, or the taints will be lost
    // dbg_print_dependencies();
    remove_overwritten_dependencies(current_instruction.get());
    dbg_print_dependencies();

    // Reset the instruction
    current_instruction.reset();
}

// =================================================================================================
// Private Methods
// =================================================================================================

/// @brief Fill the register sets of a tracked instruction from its decoded operands
/// @param tracked_inst Instruction record; its PC and DR context select the instruction
void TaintTracker::parse_instruction_operands(TrackedInstruction *tracked_inst)
{
    // The decoded form comes from the shared decoder cache
    instr_t *decoded =
        decoder.get_decoded_instr(tracked_inst->dc, (byte *)tracked_inst->instr_obs.pc);

    // Explicit operands: destinations first, then sources
    for (int idx = 0, count = instr_num_dsts(decoded); idx < count; ++idx) {
        track_operand(false, instr_get_dst(decoded, idx), tracked_inst);
    }
    for (int idx = 0, count = instr_num_srcs(decoded); idx < count; ++idx) {
        track_operand(true, instr_get_src(decoded, idx), tracked_inst);
    }

    // Implicit EFLAGS operands (DynamoRIO doesn't include them in explicit operands)
    track_flags(instr_get_eflags(decoded, DR_QUERY_DEFAULT), tracked_inst);

    // Implicit RIP destination of conditional and unconditional branches
    const bool is_branch = instr_is_cbr(decoded) || instr_is_ubr(decoded);
    if (is_branch) {
        tracked_inst->dest_regs.insert(DR_REG_RIP);
    }
}

std::set<tracked_label_t>
TaintTracker::collect_source_dependencies(const TrackedInstruction *tracked_inst) const
{
    std::set<tracked_label_t> src_dependencies;

    // Collect dependencies from source registers
    for (const auto &reg : tracked_inst->src_regs) {
        auto it = dependencies.reg.find(reg);
        if (it != dependencies.reg.end()) {
            src_dependencies.insert(it->second.begin(), it->second.end());
        } else {
            src_dependencies.insert(static_cast<tracked_label_t>(reg));
        }
    }

    // Collect dependencies from source memory locations
    for (const auto &addr : tracked_inst->src_mems) {
        auto it = dependencies.mem.find(addr);
        if (it != dependencies.mem.end()) {
            src_dependencies.insert(it->second.begin(), it->second.end());
        } else {
            src_dependencies.insert(addr);
        }
    }

    // Collect dependencies from memory address registers
    for (const auto &reg : tracked_inst->mem_address_regs) {
        auto it = dependencies.reg.find(reg);
        if (it != dependencies.reg.end()) {
            src_dependencies.insert(it->second.begin(), it->second.end());
        } else {
            src_dependencies.insert(static_cast<tracked_label_t>(reg));
        }
    }

    return src_dependencies;
}

template <typename LabelT>
void TaintTracker::propagate_dependencies_to_dest(
    LabelT dest_label, const std::set<tracked_label_t> &src_dependencies,
    std::map<LabelT, std::set<tracked_label_t>> &dep_map)
{
    // If destination already has dependencies, merge with source dependencies
    if (dep_map.find(dest_label) != dep_map.end()) {
        dep_map[dest_label].insert(src_dependencies.begin(), src_dependencies.end());
    } else {
        // Create new dependency entry with source dependencies
        dep_map[dest_label] = src_dependencies;
        // Add the destination itself to its own dependencies
        dep_map[dest_label].insert(static_cast<tracked_label_t>(dest_label));
    }
}

// Explicit template instantiations
template void TaintTracker::propagate_dependencies_to_dest(
    tracker_reg_label_t, const std::set<tracked_label_t> &,
    std::map<tracker_reg_label_t, std::set<tracked_label_t>> &);
template void TaintTracker::propagate_dependencies_to_dest(
    tracked_mem_label_t, const std::set<tracked_label_t> &,
    std::map<tracked_mem_label_t, std::set<tracked_label_t>> &);

void TaintTracker::add_dependencies(const TrackedInstruction *tracked_inst)
{
    // Get dependencies of the source operands
    const std::set<tracked_label_t> src_dependencies = collect_source_dependencies(tracked_inst);

    // Propagate source dependencies to destination registers
    for (const auto &reg : tracked_inst->dest_regs) {
        propagate_dependencies_to_dest(reg, src_dependencies, dependencies.reg);
    }

    // Propagate source dependencies to destination memory locations
    for (const auto &mem : tracked_inst->dest_mems) {
        propagate_dependencies_to_dest(mem, src_dependencies, dependencies.mem);
    }
}

void TaintTracker::remove_overwritten_dependencies(const TrackedInstruction *tracked_inst)
{
    // Check if this is a MOV or LEA instruction that overrides previous dependencies
    if (not is_override_instruction(tracked_inst, &decoder)) {
        return;
    }

    // Get source dependencies (reuse helper to avoid duplication)
    // Note: We only need src_regs and src_mems here, not mem_address_regs,
    // but including them doesn't affect correctness and keeps code simple
    std::set<tracked_label_t> src_dependencies = collect_source_dependencies(tracked_inst);

    // Remove dependencies that are not in source dependencies
    const tracker_reg_label_t dest_reg = *tracked_inst->dest_regs.begin();
    auto it = dependencies.reg.find(dest_reg);
    if (it != dependencies.reg.end()) {
        auto &deps = it->second;
        for (auto dep_it = deps.begin(); dep_it != deps.end();) {
            if (src_dependencies.find(*dep_it) == src_dependencies.end()) {
                dep_it = deps.erase(dep_it);
            } else {
                ++dep_it;
            }
        }
    }
}

void TaintTracker::store_taints()
{
    DR_ASSERT_MSG(stream.is_open(), "TaintTracker::store_taints: output stream is not open");

    // Write all collected labels to the output file
    for (const auto &label : tainted_labels) {
        uint64_t value = 0;
        if (label_is_reg(label)) {
            auto dr_reg_id = static_cast<reg_id_t>(label);
            const RVZRRegId reg_id = dr_reg_id_to_rvzr_reg_id(dr_reg_id);
            if (reg_id == RVZRRegId::RVZR_REG_IGNORED) {
                continue; // Do not store taints of ignored registers
            }
            value = static_cast<uint64_t>(reg_id);
        } else {
            // Memory address: convert from absolute to sandbox-relative
            DR_ASSERT_MSG(sandbox_base != 0,
                          "TaintTracker::store_taints: sandbox_base not initialized");
            value = label - sandbox_base;
        }

        stream.write(reinterpret_cast<const char *>(&value), sizeof(uint64_t));
    }

    // Write end-of-taint marker
    auto eot = EOT_MARKER;
    stream.write(reinterpret_cast<const char *>(&eot), sizeof(uint64_t));

    // NOTE: the file is not closed here as more taints may be added later if we
    // are tracing multiple inputs; the stream is closed in the destructor
}

/// @brief Debug helper: print every currently tainted label
void TaintTracker::dbg_print_taints()
{
    dr_printf("[TAINT] Tainted labels after instruction:\n");
    for (auto label_it = tainted_labels.begin(); label_it != tainted_labels.end(); ++label_it) {
        dr_printf("  Tainted label: %lx\n", *label_it);
    }
}

/// @brief Debug helper: print the dependency sets of all tracked registers and memory labels
void TaintTracker::dbg_print_dependencies()
{
    dr_printf("[TAINT] Dependencies after instruction:\n");

    // Register dependencies first
    for (const auto &reg_entry : dependencies.reg) {
        dr_printf("  Reg 0x%2lx depends on: ", reg_entry.first);
        for (const auto &source_label : reg_entry.second) {
            dr_printf("0x%lx ", source_label);
        }
        dr_printf("\n");
    }

    // Then memory dependencies
    for (const auto &mem_entry : dependencies.mem) {
        dr_printf("  Mem 0x%lx depends on: ", mem_entry.first);
        for (const auto &source_label : mem_entry.second) {
            dr_printf("0x%lx ", source_label);
        }
        dr_printf("\n");
    }

    dr_printf("------------------------------------------------\n");
}


================================================
FILE: rvzr/model_dynamorio/backend/tracer_abc.cpp
================================================
///
/// File: Abstract Model TracerABC
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#include <cstdint>
#include <cstdio>
#include <cstdlib>
#include <string>

#include <dr_api.h> // NOLINT
#include <dr_defines.h>
#include <dr_events.h>
#include <dr_ir_instr.h>
#include <dr_ir_opnd.h>
#include <dr_ir_utils.h>
#include <dr_tools.h>

#include <drmgr.h>
#include <drreg.h>
#include <drvector.h>

#include "observables.hpp"
#include "tracer_abc.hpp"
#include "types/input_taint.hpp"
#include "types/trace.hpp"

using std::string;

// =================================================================================================
// Constructors and Destructors
// =================================================================================================
/// @brief Construct the tracer and open the trace output
/// @param out_path Path handed to the trace's open()
/// @param logger Logger shared with the tracer (stored by reference)
/// @param taint_tracker Taint tracker notified when observations are recorded (stored by reference)
/// @param decoder Instruction decoder shared with the tracer (stored by reference)
/// @param print Forwarded to the trace constructor
TracerABC::TracerABC(const std::string &out_path, Logger &logger, TaintTracker &taint_tracker,
                     Decoder &decoder, bool print)
    : logger(logger), taint_tracker(taint_tracker), decoder(decoder), trace(print)
{
    // Open the trace output at the requested path
    trace.open(out_path);
}

/// @brief Finalize a still-open trace, clear the trace, and close the logger if it is enabled
TracerABC::~TracerABC()
{
    // Make sure the end-of-trace marker is emitted even if finalize() was never called
    if (not tracing_finalized) {
        finalize();
    }
    trace.clear();
    if (logger.is_enabled()) {
        logger.close();
    }
}

// =================================================================================================
// Public Methods
// =================================================================================================
/// @brief Turn tracing on and mark the trace as not yet finalized
void TracerABC::enable()
{
    tracing_on = true;
    // Allow finalize() to run (again) for the trace that starts now
    tracing_finalized = false;
}

void TracerABC::finalize()
{
    if (tracing_finalized) {
        return;
    }

    // Push the end-of-trace marker and flush the remaining entries.
    trace.push_back({.type = trace_entry_type_t::ENTRY_EOT});
    trace.flush();

    // Print the trace buffers
    if (logger.is_enabled()) {
        logger.log_eot();
    }

    // Reset tracing flags
    tracing_on = false;
    tracing_finalized = true;
}

/// @brief Base-class hook invoked for an observed instruction; intentionally does nothing
void TracerABC::observe_instruction(instr_obs_t /*instr*/, dr_mcontext_t * /*mc*/, void * /*dc*/)
{
    // The rest of the functionality - if any - is implemented by subclasses
}

/// @brief Base-class hook invoked for an observed memory access; intentionally does nothing
void TracerABC::observe_mem_access(bool /*is_write*/, void * /*address*/, uint64_t /*size*/)
{
    // The rest of the functionality - if any - is implemented by subclasses
}

/// @brief Record an exception entry in the trace while tracing is on
/// @param siginfo Signal information; its access address and signal number are recorded
void TracerABC::observe_exception(dr_siginfo_t *siginfo) const
{
    if (tracing_on) {
        // The accessed address goes into `addr`; the signal number is carried in `size`
        trace.push_back({.addr = (pc_t)siginfo->access_address,
                         .size = static_cast<uint32_t>(siginfo->sig),
                         .type = trace_entry_type_t::ENTRY_EXCEPTION});
    }
}

/// @brief Notify the taint tracker of a PC observation and append a PC entry to the trace
/// @param instr Observed instruction whose program counter is recorded
void TracerABC::record_pc(instr_obs_t instr)
{
    taint_tracker.taint(taint_entry_type_t::TAINT_ENTRY_PC);

    // PC entries carry no size
    trace.push_back({
        .addr = instr.pc,
        .size = 0,
        .type = trace_entry_type_t::ENTRY_PC,
    });
}

void TracerABC::record_mem_access(bool is_write, void *address, uint64_t size)
{
    taint_tracker.taint(taint_entry_type_t::TAINT_ENTRY_MEM);

    const trace_entry_t entry = {
        .addr = reinterpret_cast<uint64_t>(address),
        .size = (uint32_t)size,
        .type = (is_write) ? trace_entry_type_t::ENTRY_WRITE : trace_entry_type_t::ENTRY_READ,
    };
    trace.push_back(entry);
}


================================================
FILE: rvzr/model_dynamorio/backend/tracers/ct.cpp
================================================
///
/// File: Constant-time (CT) Tracer implementation and its variants
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#include <cstddef>

#include <dr_api.h> // NOLINT
#include <dr_defines.h>
#include <dr_ir_macros.h>
#include <dr_ir_macros_x86.h>
#include <dr_ir_opnd.h>
#include <dr_ir_utils.h>
#include <drutil.h>

#include "tracers/ct.hpp"
#include "util.hpp"

/// @brief Record the program counter of every instruction observed while tracing is on
void TracerCT::observe_instruction(instr_obs_t instr, dr_mcontext_t *mc, void *dc)
{
    TracerABC::observe_instruction(instr, mc, dc);

    // Observations are recorded only while tracing is on
    if (tracing_on) {
        record_pc(instr);
    }
}

/// @brief Record every memory access observed while tracing is on
void TracerCT::observe_mem_access(bool is_write, void *address, uint64_t size)
{
    TracerABC::observe_mem_access(is_write, address, size);

    // Observations are recorded only while tracing is on
    if (tracing_on) {
        record_mem_access(is_write, address, size);
    }
}


================================================
FILE: rvzr/model_dynamorio/backend/tracers/ind.cpp
================================================
///
/// File: Indirect Call Tracer implementation
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#include <optional>

#include <dr_api.h> // NOLINT
#include <dr_defines.h>
#include <dr_ir_macros.h>
#include <dr_ir_macros_x86.h>
#include <dr_ir_opnd.h>
#include <dr_ir_utils.h>
#include <drutil.h>

#include "dr_tools.h"
#include "tracers/ind.hpp"
#include "types/decoder.hpp"

// =================================================================================================
// Local helper functions
// =================================================================================================

/// @brief Summary of the relevant information for indirect branches
struct mbr_info_t {
    pc_t src;    ///< address of the branch instruction
    pc_t target; ///< resolved address the branch transfers control to
};

/// @brief Resolve the source and target of a multi-way branch (indirect jump/call or return).
/// @param instr Observed instruction
/// @param mc Machine context used to read registers and compute operand addresses
/// @param dc DynamoRIO context passed to the decoder
/// @param decoder Decoder providing the (cached) decoded instruction
/// @return The branch source and target, or an empty optional if the instruction is not a
///         multi-way branch. Aborts if the target cannot be determined.
static std::optional<mbr_info_t> get_mbr_info(instr_obs_t instr, dr_mcontext_t *mc, void *dc,
                                              Decoder &decoder)
{
    // Fetch the decoded instruction from the shared cache
    instr_t *decoded = decoder.get_decoded_instr(dc, (byte *)instr.pc);

    // Only indirect jumps and returns (multi-way branches) are of interest
    if (not instr_is_mbr(decoded)) {
        return std::nullopt;
    }

    const opnd_t target_opnd = instr_get_target(decoded);
    app_pc resolved = nullptr;
    bool must_load = false; // true when `resolved` points at the memory holding the target

    if (instr_is_return(decoded)) {
        // Return: the target is stored at the top of the stack
        resolved = (app_pc)mc->xsp;
        must_load = true;
    } else if (opnd_is_reg(target_opnd)) {
        // Register operand: the register value is the target itself
        resolved = (app_pc)reg_get_value(opnd_get_reg(target_opnd), mc);
    } else if (opnd_is_memory_reference(target_opnd)) {
        // Memory operand: the target is stored at the computed address
        resolved = opnd_compute_address(target_opnd, mc);
        must_load = true;
    } else {
        dr_printf("[ERROR] ind_tracer: Unknown target operand type\n");
        dr_abort();
        return std::nullopt; // unreachable
    }

    // Dereference the location when the target lives in memory
    if (must_load) {
        uint64_t loaded = 0;
        if (not dr_safe_read(resolved, sizeof(uint64_t), &loaded, nullptr)) {
            dr_printf("[ERROR] ind_tracer: Failed to read the target from memory\n");
            dr_abort();
            return std::nullopt; // unreachable
        }
        resolved = (app_pc)loaded;
    }

    return mbr_info_t{.src = instr.pc, .target = (uint64_t)resolved};
}

// =================================================================================================
// Class implementation
// =================================================================================================

/// @brief For every multi-way branch observed while tracing is on, record its source PC
///        followed by its resolved target
void TracerInd::observe_instruction(instr_obs_t instr, dr_mcontext_t *mc, void *dc)
{
    TracerABC::observe_instruction(instr, mc, dc);

    // Nothing is recorded while tracing is off
    if (not tracing_on) {
        return;
    }

    // Resolve the branch (decoding goes through the shared cache)
    const std::optional<mbr_info_t> branch = get_mbr_info(instr, mc, dc, decoder);

    // Instructions that are not multi-way branches are ignored
    if (not branch.has_value()) {
        return;
    }

    // FIXME: refactor to use similar pattern as in record_pc and record_mem_access
    // Source of the branch
    trace.push_back({
        .addr = branch->src,
        .size = 0,
        .type = trace_entry_type_t::ENTRY_PC,
    });
    // Destination of the branch
    trace.push_back({
        .addr = branch->target,
        .size = 0,
        .type = trace_entry_type_t::ENTRY_IND,
    });
}


================================================
FILE: rvzr/model_dynamorio/backend/tracers/pc.cpp
================================================
///
/// File: Program Counter (PC) Tracer implementation
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#include <cstddef>

#include <dr_api.h> // NOLINT
#include <dr_defines.h>
#include <dr_ir_macros.h>
#include <dr_ir_macros_x86.h>
#include <dr_ir_opnd.h>
#include <dr_ir_utils.h>
#include <drutil.h>

#include "tracers/pc.hpp"
#include "util.hpp"

/// @brief Record the program counter of every instruction observed while tracing is on
void TracerPC::observe_instruction(instr_obs_t instr, dr_mcontext_t *mc, void *dc)
{
    TracerABC::observe_instruction(instr, mc, dc);

    // Observations are recorded only while tracing is on
    if (tracing_on) {
        record_pc(instr);
    }
}


================================================
FILE: rvzr/model_dynamorio/backend/util.cpp
================================================
///
/// File: Helper functions for DR model
///
// Copyright (C) Microsoft Corporation
// SPDX-License-Identifier: MIT

#include <cstddef>

#include <cstdint>
#include <dr_api.h> // NOLINT
#include <dr_defines.h>
#include <dr_ir_opnd.h>
#include <dr_tools.h>

#include <drreg.h>
#include <drvector.h>

#include "observables.hpp"
#include "types/decoder.hpp"
#include "util.hpp"

void reserve_register_checked(void *drcontext, instrlist_t *ilist, instr_t *where,
                              drvector_t *permitted, DR_PARAM_OUT reg_id_t *reg)
{
    if (drreg_reserve_register(drcontext, ilist, where, permitted, reg) != DRREG_SUCCESS) {
        dr_printf("ERROR: failed to reserve a register\n");
        dr_abort();
    }
}

void unreserve_register_checked(void *drcontext, instrlist_t *ilist, instr_t *where, reg_id_t reg)
{
    if (drreg_unreserve_register(drcontext, ilist, where, reg) != DRREG_SUCCESS) {
        dr_printf("ERROR: failed to unreserve a register\n");
        dr_abort();
    }
}

/// @brief Write to memory regardless of its current protection, restoring the protection after
/// @param addr Destination address
/// @param size Number of bytes to write
/// @param val Source buffer
/// @param w_size If not null, receives the number of bytes written (0 if the write was not
///        attempted)
/// @return true if the write succeeded, false otherwise
bool force_write(byte *addr, size_t size, const uint64_t *val, size_t *w_size)
{
    // Read the current protections; without them there is nothing valid to restore afterwards,
    // so give up instead of later "restoring" an arbitrary protection mask
    uint prot = 0;
    if (not dr_query_memory(addr, nullptr, nullptr, &prot)) {
        if (w_size != nullptr) {
            *w_size = 0;
        }
        return false;
    }

    // Temporarily make the target writable
    const bool protection_changed =
        dr_memory_protect(addr, size, DR_MEMPROT_READ | DR_MEMPROT_WRITE | DR_MEMPROT_EXEC);

    // The write itself is fault-safe, so it is attempted even if the protection change failed
    const bool success = dr_safe_write(addr, size, val, w_size);

    // Restore the previous protections, but only if they were actually modified
    if (protection_changed) {
        dr_memory_protect(addr, size, prot);
    }

    return success;
}

/// @brief Check whether a multi-way branch (indirect jump/call or return) targets an address
///        that cannot be executed
/// @param instr Observed instruction
/// @param mc Machine context used to read registers and compute operand addresses
/// @param dc DynamoRIO context passed to the decoder
/// @param decoder Decoder providing the decoded instruction
/// @return true if the branch target cannot be read or is not an existing executable address;
///         false for valid targets, for instructions that are not multi-way branches, and for
///         unsupported target operand types
bool is_illegal_jump(instr_obs_t instr, dr_mcontext_t *mc, void *dc, Decoder &decoder)
{
    instr_t *decoded = decoder.get_decoded_instr(dc, (byte *)instr.pc);

    // Only indirect jumps and returns (multi-way branches) are checked
    if (not instr_is_mbr(decoded)) {
        return false;
    }

    const opnd_t target_opnd = instr_get_target(decoded);
    app_pc dest = nullptr;
    bool must_load = false; // true when `dest` points at the memory holding the target

    if (instr_is_return(decoded)) {
        // Return: the target is stored at the top of the stack
        dest = (app_pc)mc->xsp;
        must_load = true;
    } else if (opnd_is_reg(target_opnd)) {
        // Register operand: the register value is the target itself
        dest = (app_pc)reg_get_value(opnd_get_reg(target_opnd), mc);
    } else if (opnd_is_memory_reference(target_opnd)) {
        // Memory operand: the target is stored at the computed address
        dest = opnd_compute_address(target_opnd, mc);
        must_load = true;
    } else {
        return false; // unsupported operand type: ignore
    }

    // Dereference the location when the target lives in memory
    if (must_load) {
        uint64_t loaded = 0;
        if (not dr_safe_read(dest, sizeof(uint64_t), &loaded, nullptr)) {
            return true; // the target cannot even be read
        }
        dest = (app_pc)loaded;
    }

    // The jump is legal only if the target exists and is executable
    uint prot = 0;
    if (not dr_query_memory(dest, nullptr, nullptr, &prot)) {
        return true;
    }
    return (prot & DR_MEMPROT_EXEC) == 0;
}

void flush_bb_cache()
{
    const uint64_t flush_begin = 0;
    const size_t flush_size = -1;

    // NOTE: This is very conservative, but avoids any potentially expensive analysis of
    // the target function
    dr_delay_flush_region((byte *)flush_begin, flush_size, /*flush_id*/ 0, /*callback*/ nullptr);
}


================================================
FILE: rvzr/model_dynamorio/model.py
================================================
"""
File: DynamoRIO-based backend to the contract model.

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from __future__ import annotations

import os
import tempfile
from subprocess import check_output, CalledProcessError, STDOUT
from typing import List, Tuple, Optional, TYPE_CHECKING, Final, Any
from typing_extensions import TypeAlias

import numpy as np
from numpy.typing import NDArray

from .trace_decoder import TraceDecoder, TraceEntryType, DebugTraceEntryType

from ..model import Model
from ..sandbox import BaseAddrTuple, SandboxLayout, DataArea
from ..traces import CTrace, CTraceEntry
from ..tc_components.test_case_data import save_input_sequence_as_rdbf, InputTaint
from ..config import CONF

if TYPE_CHECKING:
    from ..tc_components.test_case_code import TestCaseProgram
    from ..tc_components.test_case_data import InputData

# Flags passed to the DR client on every tracing run (see _construct_drrun_cmd)
_DRRUN_TRACING_FLAGS: Final[str] = " --mode rvzr --instrumented-func test_case_entry "
# Binary executed under drrun when tracing; it receives the RCBF, RDBF and layout file paths
_ADAPTER_PATH: Final[str] = "~/.local/dynamorio/adapter"
# Command template; the paths start with `~`, so the command is run through a shell
_DRRUN_CMD: Final[str] = "~/.local/dynamorio/drrun -c ~/.local/dynamorio/libdr_model.so " \
    " {flags} -- {binary} {args}"

# Constants for trace processing
_N_REGISTERS_IN_DUMP: Final[int] = 6  # rax, rbx, rcx, rdx, rsi, rdi
_BYTES_PER_TAINT_ENTRY: Final[int] = 8  # each taint entry corresponds to 8 bytes
_EOT_MARKER: Final[int] = np.iinfo(np.uint64).max  # end-of-transmission marker for taint files

# Type aliases for raw trace entries (CFFI objects from TraceDecoder)
# Note: These are dynamically typed CFFI objects, so we use Any with documentation
_RawTraceEntry: TypeAlias = Any  # CFFI struct: trace_entry_t with addr, size, type fields
_RawDebugTraceEntry: TypeAlias = Any  # CFFI struct: debug_trace_entry_t with type, regs union
_RawTrace: TypeAlias = List[_RawTraceEntry]  # List of trace entries from one test execution
_RawDebugTrace: TypeAlias = List[_RawDebugTraceEntry]  # List of debug trace entries


class DynamoRIOModel(Model):
    """
    Adapter class that connects the DynamoRIO backend to the rest of Revizor.

    The backend is executed as an external `drrun` process. Test cases, input sequences, traces,
    taints and the sandbox layout are exchanged with it through the temporary files owned
    by `_DRFileManager`.
    """
    _obs_clause_name: Optional[str] = None
    _exec_clause_name: Optional[str] = None

    _installation_checked: bool = False  # flag to avoid checking DR installation multiple times

    _test_case: Optional[TestCaseProgram] = None  # the current test case
    _files: _DRFileManager

    poison_value: int = 0  # If this value is != 0, it will be returned on speculative faulty loads

    # ----------------------------------------------------------------------------------------------
    # Constructor/Destructor
    def __init__(self,
                 bases: BaseAddrTuple,
                 *args: Any,
                 enable_mismatch_check_mode: bool = False) -> None:
        """
        :param bases: unused (see the note below)
        :param args: unused; accepted for signature compatibility
        :param enable_mismatch_check_mode: if True, tracing returns the register values dumped
               at the end of the test case instead of the contract traces
        """
        # NOTE: the `bases` argument is not used as DynamoRIO backend does not allow
        #       for customization of the memory layout
        self._enable_mismatch_check_mode = enable_mismatch_check_mode
        self.is_speculative = True  # may be changed by configure_clauses
        self.poison_value = 0  # may be changed later
        self._files = _DRFileManager()

    def __del__(self) -> None:
        # `_files` is missing if the constructor did not run to completion
        files = getattr(self, "_files", None)
        if files is not None:
            files.delete_temp_files()

    # ----------------------------------------------------------------------------------------------
    # Public Interfaces
    def load_test_case(self, test_case: TestCaseProgram) -> None:
        """
        Prepare the test case to be traced by the DynamoRIO backend.
        This means creating a binary in the RCBF format so that it can be parsed by the backend.
        :param test_case: the test case to load
        :return: None
        """
        self._test_case = test_case

        # empty the RCBF and RDBF files left over from the previous test case
        self._files.cleanup_on_load_test_case()

        # store the test case in the RCBF format
        test_case.get_obj().save_rcbf(self._files.rcbf)

    def trace_test_case(self, inputs: List[InputData], nesting: int) -> List[CTrace]:
        """ Implementation of Model.trace_test_case using the DynamoRIO backend. """
        trace = self._trace_test_case_common(inputs, nesting, enable_taints=False)
        self._files.cleanup_after_tracing()
        return trace

    def trace_test_case_with_taints(self, inputs: List[InputData],
                                    nesting: int) -> Tuple[List[CTrace], List[InputTaint]]:
        """
        Implementation of Model.trace_test_case_with_taints using the DynamoRIO backend.
        :param inputs: input sequence to trace
        :param nesting: maximum nesting level to emulate in the model
        :return: the contract traces and the input taints; both are empty for an empty
                 input sequence
        """
        traces = self._trace_test_case_common(inputs, nesting, enable_taints=True)
        assert self._test_case is not None, "Test case must be loaded before tracing"

        if not inputs:
            # The backend was not executed: no taint file was produced and the layout
            # may never have been set, so there is nothing to decode
            self._files.cleanup_after_tracing()
            return traces, []

        taint_reader = _TaintReader(self.layout, self._test_case)
        taints = taint_reader.decode_taints(self._files.taints)
        self._files.cleanup_after_tracing()
        return traces, taints

    def report_coverage(self, path: str) -> None:
        """ Not implemented by the DynamoRIO backend. """
        raise NotImplementedError()

    def configure_clauses(self, obs_clause_name: str, exec_clause_name: str) -> None:
        """
        Configure the backend to use the given observation and execution clauses.
        Also check if the given clauses are supported.
        :param obs_clause_name: the name of the observation clause
        :param exec_clause_name: the name of the execution clause
        :return: None
        :raises: ValueError if the given clauses are not supported
        """
        assert self._obs_clause_name is None and self._exec_clause_name is None, \
            "Cannot reconfigure the observation and execution clauses"

        # ensure that the DynamoRIO backend is installed
        self._check_if_installed()

        # check if the contract is supported
        if obs_clause_name not in self.get_supported_obs_clauses(False):
            raise ValueError(f"Unsupported observation clause {obs_clause_name}")
        self._obs_clause_name = obs_clause_name

        if exec_clause_name not in self.get_supported_exec_clauses(False):
            raise ValueError(f"Unsupported execution clause {exec_clause_name}")
        self._exec_clause_name = exec_clause_name

        # these execution clauses do not model speculation
        if exec_clause_name in ["seq", "no_speculation"]:
            self.is_speculative = False

    @classmethod
    def get_supported_obs_clauses(cls, check_installation: bool = True) -> List[str]:
        """
        Get the list of supported observation clauses.
        :param check_installation: if True, verify first that the backend is installed
        :return: list of supported observation clauses
        :raises: FileNotFoundError if the DynamoRIO backend is not installed
        """
        if check_installation:
            cls._check_if_installed()
        cmd = _DRRUN_CMD.format(flags="--list-tracers", binary="echo", args="''")
        output = check_output(cmd, shell=True).decode("utf-8")
        # one name per line; drop the last element of the split
        return output.split("\n")[:-1]

    @classmethod
    def get_supported_exec_clauses(cls, check_installation: bool = True) -> List[str]:
        """
        Get the list of supported execution clauses.
        :param check_installation: if True, verify first that the backend is installed
        :return: list of supported execution clauses
        :raises: FileNotFoundError if the DynamoRIO backend is not installed
        """
        if check_installation:
            cls._check_if_installed()
        cmd = _DRRUN_CMD.format(flags="--list-speculators", binary="echo", args="''")
        output = check_output(cmd, shell=True).decode("utf-8")
        # one name per line; drop the last element of the split
        return output.split("\n")[:-1]

    # ----------------------------------------------------------------------------------------------
    # Private Methods
    @classmethod
    def _check_if_installed(cls) -> None:
        """
        Ensure that the DynamoRIO backend is installed.
        :return: None
        :raises: FileNotFoundError if the DynamoRIO backend is not installed
        """
        if not cls._installation_checked:  # check only once
            # run `ls /dev/null` under the backend; the output must contain the path
            cmd = _DRRUN_CMD.format(flags="--trace-output /dev/null", binary="ls", args="/dev/null")
            try:
                output = check_output(cmd, shell=True, stderr=STDOUT).decode("utf-8")
            except (FileNotFoundError, CalledProcessError):
                output = ""
            if '/dev/null' not in output:
                raise FileNotFoundError(
                    "DynamoRIO backend is not installed\n\n\n"
                    "Please follow the instructions in "
                    "https://microsoft.github.io/side-channel-fuzzer/quick-start/")
            cls._installation_checked = True

    def _trace_test_case_common(self, inputs: List[InputData], nesting: int,
                                enable_taints: bool) -> List[CTrace]:
        """
        Execute the test case with the given inputs on DR backend and return the traces.
        As a side effect, the sandbox layout is updated from the file written by the adapter.
        :param inputs: input sequence to trace
        :param nesting: maximum nesting level to emulate in the model
        :param enable_taints: if True, the backend also writes taints to the taint file
        :return: list of contract traces, one per input; in the mismatch check mode, the traces
                 contain the register values at the end of the test case instead
        """
        assert self._test_case is not None, "No test case was loaded"
        if len(inputs) == 0:
            return []

        # store the input sequence
        save_input_sequence_as_rdbf(inputs, self._files.rdbf)

        # call the backend
        cmd = self._construct_drrun_cmd(enable_taints, nesting)
        _ = check_output(cmd, shell=True)

        # the execution might have had a different layout than before, update it
        self._update_layout()

        # read traces from the trace files
        reader = _TraceReader(self.layout, self._test_case)
        traces = reader.decode_traces(self._files.traces)
        assert len(traces) > 0, "No traces were retrieved from the DynamoRIO backend"
        assert len(traces) == len(inputs), "Mismatch between the number of inputs and traces"

        if self._enable_mismatch_check_mode:
            # In this mode, the contract trace is the register values at the end of the test case
            dbg_reader = _DbgTraceReader(self.layout, self._test_case)
            dbg_traces = dbg_reader.decode_traces(self._files.dbg_traces)
            arch_traces = [CTrace(t.get_typed()[-_N_REGISTERS_IN_DUMP:]) for t in dbg_traces]
            return arch_traces

        return traces

    def _construct_drrun_cmd(self, enable_taints: bool, nesting: int) -> str:
        """
        Construct a command to call the DynamoRIO backend
        with the given test case and input sequence.
        :param enable_taints: if True, enable the taint tracker and set the taint output file
        :param nesting: value passed to the backend as the maximum nesting
        :return: the complete shell command
        """
        flags = _DRRUN_TRACING_FLAGS + \
            f" --tracer {self._obs_clause_name}" + \
            f" --speculator {self._exec_clause_name}" + \
            f" --max-nesting {nesting}" + \
            f" --max-spec-window {CONF.model_max_spec_window}" \
            f" --trace-output {self._files.traces}"
        if enable_taints:
            flags += f" --taint-output {self._files.taints} --enable-taint-tracker"
        if self._enable_mismatch_check_mode:
            flags += f" --log-level 1 --debug-trace-output {self._files.dbg_traces}"
        if self.poison_value != 0:
            flags += f" --poison-value {self.poison_value}"

        binary = _ADAPTER_PATH
        args = f"{self._files.rcbf} {self._files.rdbf} {self._files.layout}"
        cmd = _DRRUN_CMD.format(flags=flags, binary=binary, args=args)
        # print(cmd)
        return cmd

    def _update_layout(self) -> None:
        """ Update the memory layout based on the addresses communicated by the adapter
        via the bases file. """
        assert self._test_case is not None, "No test case was loaded"
        # the file holds two 8-byte little-endian values: the code base, then the data base
        with open(self._files.layout, 'rb') as f:
            code_base_addr = int.from_bytes(f.read(8), byteorder="little")
            data_base_addr = int.from_bytes(f.read(8), byteorder="little")
        self.layout = SandboxLayout((data_base_addr, code_base_addr), self._test_case.n_actors())


# ==================================================================================================
# Private: File management
# ==================================================================================================
class _DRFileManager:
    """
    Local class responsible for managing temporary files used by the DynamoRIO backend.

    The six files are created on construction and exist until `delete_temp_files` is called;
    the cleanup methods only empty them.
    """

    def __init__(self) -> None:
        self.rcbf: str  # tmp file for current test case in RCBF format
        self.rdbf: str  # tmp file for current input sequence in RDBF format
        self.layout: str  # tmp file for receiving memory layout
        self.traces: str  # tmp file for receiving contract traces
        self.dbg_traces: str  # tmp file for receiving debug traces
        self.taints: str  # tmp file for receiving taint traces
        self._create_temp_files()

    def cleanup_on_load_test_case(self) -> None:
        """ Clean up RCBF and RDBF files when loading a new test case """
        for path in (self.rcbf, self.rdbf):
            self._truncate(path)

    def cleanup_after_tracing(self) -> None:
        """ Clean up the files that will be used by the adapter to store its output """
        for path in (self.traces, self.dbg_traces, self.taints, self.layout):
            self._truncate(path)

    def _create_temp_files(self) -> None:
        """ Create one persistent temporary file per attribute and remember its path """
        for attr in ("rcbf", "rdbf", "traces", "dbg_traces", "taints", "layout"):
            # delete=False keeps the file on disk after the handle is closed
            with tempfile.NamedTemporaryFile("wb", delete=False) as tmp_file:
                setattr(self, attr, tmp_file.name)

    def delete_temp_files(self) -> None:
        """ Delete all temporary files created for the DynamoRIO backend """
        all_paths = (self.rcbf, self.rdbf, self.traces, self.dbg_traces, self.taints, self.layout)
        for path in all_paths:
            if os.path.exists(path):
                os.unlink(path)

    @staticmethod
    def _truncate(path: str) -> None:
        """ Empty the file at the given path (the file is created if it does not exist) """
        with open(path, 'wb') as f:
            f.truncate()


# ==================================================================================================
# Private: Decoding of Traces
# ==================================================================================================
class _TraceReader:
    """
    Local class responsible for reading traces produced by DynamoRIO backend,
    removing irrelevant information from them, and converting them to the
    format that is expected by the contract model.
    """

    def __init__(self, layout: SandboxLayout, test_case: TestCaseProgram) -> None:
        """
        :param layout: sandbox layout used to translate absolute addresses into offsets
        :param test_case: the test case program whose traces are decoded
        """
        self._layout = layout
        self._test_case = test_case
        self._decoder = TraceDecoder()

    def decode_traces(self, trace_path: str) -> List[CTrace]:
        """
        Read the traces produced by the DynamoRIO backend and return them in the format
        that is expected by the contract model.
        :param trace_path: path to the binary trace file
        :return: list of contract traces
        """
        traces: List[CTrace] = []

        # iterate over the binary trace and parse the entries
        raw_traces: List[_RawTrace] = self._decoder.decode_trace_file(trace_path)
        for raw_trace in raw_traces:
            converted = self._raw_to_ctrace(raw_trace)
            # traces that evaluate as falsy are skipped
            if converted:
                traces.append(converted)

        # trim non relevant entries
        return self._trim_traces(traces)

    def _raw_to_ctrace(self, raw_trace: _RawTrace) -> CTrace:
        """
        Convert one raw trace into a contract trace.

        Memory accesses become "mem" entries (data address -> offset), instructions become "pc"
        entries and ENTRY_IND entries become "ind" entries (code address -> offset).
        Entries of any other type (e.g., ENTRY_EOT, ENTRY_EXCEPTION) are dropped.
        :param raw_trace: entries of a single trace as returned by the trace decoder
        :return: the converted trace
        """
        trace: List[CTraceEntry] = []

        for entry in raw_trace:
            type_ = TraceEntryType(entry.type)
            if type_ in (TraceEntryType.ENTRY_READ, TraceEntryType.ENTRY_WRITE):
                val = self._layout.data_addr_to_offset(entry.addr)
                trace.append(CTraceEntry(type_="mem", value=val))
            elif type_ == TraceEntryType.ENTRY_PC:
                val = self._layout.code_addr_to_offset(entry.addr)
                trace.append(CTraceEntry(type_="pc", value=val))
            elif type_ == TraceEntryType.ENTRY_IND:
                val = self._layout.code_addr_to_offset(entry.addr)
                trace.append(CTraceEntry(type_="ind", value=val))

        return CTrace(trace)

    def _trim_traces(self, traces: List[CTrace]) -> List[CTrace]:
        """
        Last instruction of the trace is the return instruction, which is inserted automatically
        by the model and thus does not belong to the test case. We remove the corresponding entries
        from the traces.

        Traces that are empty (or become empty while the trailing entries are removed) are
        handled gracefully instead of raising IndexError.
        :param traces: the converted traces
        :return: the traces with the irrelevant entries removed
        """
        new_traces: List[CTrace] = []
        for trace in traces:
            # NOTE(review): the list is modified in place below; confirm that get_typed()
            # hands out a list that is safe to mutate
            entry_list = trace.get_typed()

            # Identify observations that belong to the return instruction
            last_mem = None
            last_pc = None
            if entry_list and entry_list[-1].type_ == "mem":
                last_mem = entry_list[-1].value
                entry_list.pop()
            # re-check for emptiness: the pop above may have removed the only entry
            if entry_list and entry_list[-1].type_ == "pc":
                last_pc = entry_list[-1].value
                entry_list.pop()

            # In case the return happened multiple times (e.g., due to speculation),
            # remove all corresponding entries
            filtered_list = []
            for entry in entry_list:
                if last_pc is not None and entry.type_ == "pc" and entry.value == last_pc:
                    continue
                if last_mem is not None and entry.type_ == "mem" and entry.value == last_mem:
                    continue
                filtered_list.append(entry)

            new_traces.append(CTrace(filtered_list))

        return new_traces


class _DbgTraceReader:
    """
    Local class responsible for reading debug traces produced by DynamoRIO backend.
    """

    def __init__(self, layout: SandboxLayout, test_case: TestCaseProgram) -> None:
        """
        :param layout: sandbox layout used to translate absolute addresses into offsets
        :param test_case: the test case program whose debug traces are decoded
        """
        self._layout = layout
        self._test_case = test_case
        self._decoder = TraceDecoder()

    def decode_traces(self, dbg_path: str) -> List[CTrace]:
        """
        Read the debug traces produced by the DynamoRIO backend and return them in the format
        that is expected by the contract model.
        :param dbg_path: path to the binary debug trace file
        :return: list of debug traces
        """
        dbg_traces: List[CTrace] = []

        # decode the binary debug trace and convert every trace in it
        raw_dbg_traces: List[_RawDebugTrace] = self._decoder.decode_debug_trace_file(dbg_path)
        for raw_dbg_trace in raw_dbg_traces:
            converted = self._raw_dbg_to_ctrace(raw_dbg_trace)
            # traces that evaluate as falsy are skipped
            if converted:
                dbg_traces.append(converted)

        # trim non relevant entries
        if dbg_traces:
            dbg_traces = self._trim_dbg_traces(dbg_traces)

        return dbg_traces

    def _raw_dbg_to_ctrace(self, raw_dbg_trace: _RawDebugTrace) -> CTrace:
        """
        Convert one raw debug trace into a contract trace.

        Every ENTRY_REG_DUMP entry is expanded into one "pc" entry followed by six "reg" entries
        (xax, xbx, xcx, xdx, xsi, xdi). All other entry types are dropped.
        :param raw_dbg_trace: entries of a single debug trace as returned by the trace decoder
        :return: the converted trace
        """
        trace: List[CTraceEntry] = []

        for entry in raw_dbg_trace:
            type_ = DebugTraceEntryType(entry.type)
            if type_ == DebugTraceEntryType.ENTRY_REG_DUMP:
                val = self._layout.code_addr_to_offset(entry.regs.pc)
                trace.append(CTraceEntry(type_="pc", value=val))
                trace.append(CTraceEntry(type_="reg", value=entry.regs.xax))
                trace.append(CTraceEntry(type_="reg", value=entry.regs.xbx))
                trace.append(CTraceEntry(type_="reg", value=entry.regs.xcx))
                trace.append(CTraceEntry(type_="reg", value=entry.regs.xdx))
                trace.append(CTraceEntry(type_="reg", value=entry.regs.xsi))
                trace.append(CTraceEntry(type_="reg", value=entry.regs.xdi))

        return CTrace(trace)

    def _trim_dbg_traces(self, dbg_traces: List[CTrace]) -> List[CTrace]:
        """
        Same as _trim_traces, but for debug traces: remove the register dumps that belong to
        the final (return) instruction.

        Traces shorter than one register dump are left untouched instead of raising IndexError.
        :param dbg_traces: the converted debug traces
        :return: the debug traces with the irrelevant register dumps removed
        """
        # Each register dump consists of 1 PC + N register values
        # NOTE(review): _N_REGISTERS_IN_DUMP is expected to match the number of "reg" entries
        # emitted per dump by _raw_dbg_to_ctrace
        dump_size = 1 + _N_REGISTERS_IN_DUMP

        new_dbg_traces = []
        for dbg_trace in dbg_traces:
            entry_list = dbg_trace.get_typed()

            # Remove the last register dump (corresponding to the return instruction);
            # the length check protects against traces without a complete dump
            last_pc = None
            if len(entry_list) >= dump_size and entry_list[-dump_size].type_ == "pc":
                last_pc = entry_list[-dump_size].value
                entry_list = entry_list[:-dump_size]

            # Remove all register dumps corresponding to the return instruction
            filtered_list = []
            skip_count = 0
            for entry in entry_list:
                if skip_count > 0:
                    skip_count -= 1
                    continue
                if last_pc is not None and entry.type_ == "pc" and entry.value == last_pc:
                    skip_count = _N_REGISTERS_IN_DUMP  # skip the register entries as well
                    continue
                filtered_list.append(entry)

            new_dbg_traces.append(CTrace(filtered_list))

        return new_dbg_traces


# ==================================================================================================
# Private: Decoding of Input Taints
# ==================================================================================================
class _TaintReader:
    """
    Local class responsible for reading input taints produced by DynamoRIO backend.

    Taint output format:
    - Input 1:
        [taint_value (8 bytes)]
        ... repeated for each tainted value
        [end_marker (8 bytes)] (the marker is max_uint64)
    - Input 2:
        ...
    """

    def __init__(self, layout: SandboxLayout, test_case: TestCaseProgram) -> None:
        self._layout = layout
        self._n_actors = test_case.n_actors()

    def decode_taints(self, taint_path: str) -> List[InputTaint]:
        """
        Parse the taint file written by the DynamoRIO backend into one InputTaint per input.
        :param taint_path: path to the binary taint file
        :return: list of input taints, in the order in which they appear in the file
        """
        # the whole file is loaded at once as an array of uint64 values
        raw_entries: NDArray[np.uint64] = self._file_to_ndarray(taint_path)
        max_offset: int = self._layout.data_area_offset(DataArea.OVERFLOW_PAD)

        decoded: List[InputTaint] = []
        current = InputTaint(self._n_actors)
        view = current.full_linear_view()
        pending = False  # True while the current input has entries but no end marker yet
        for raw in raw_entries:
            offset = int(raw)

            # an end marker closes the current input taint and opens a fresh one
            if offset == _EOT_MARKER:
                decoded.append(current)
                current = InputTaint(self._n_actors)
                view = current.full_linear_view()
                pending = False
                continue
            pending = True

            # values beyond the sandbox are ignored
            # (may happen because some of the adapter code was tainted)
            if offset <= max_offset:
                view[offset // _BYTES_PER_TAINT_ENTRY] = True

        assert not pending, "Taint file ended unexpectedly without end marker"
        return decoded

    def _file_to_ndarray(self, path: str) -> NDArray[np.uint64]:
        """
        Load the taint file as a flat array of uint64 values; trailing bytes that do not
        form a complete entry are not included.
        :param path: path to the binary taint file
        :return: numpy array containing the taint entries (uint64 values)
        """
        with open(path, 'rb') as taint_file:
            raw = taint_file.read()
        return np.frombuffer(raw, dtype=np.uint64, count=len(raw) // _BYTES_PER_TAINT_ENTRY)


================================================
FILE: rvzr/model_dynamorio/trace_decoder.py
================================================
"""
File: This module provides a decoder for the binary traces generated by the DynamoRIO backend

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""

from enum import Enum
from typing import Any, Final, List, Literal, Union, cast
from io import BufferedReader
import sys
import os

from cffi import FFI
from typing_extensions import get_args, assert_never

# Marker read from the first byte of a trace file:
# "T" identifies a normal (leakage) trace file, "D" identifies a debug trace file
_MarkerType = Literal["T", "D"]

# ==================================================================================================
# Trace types
# ==================================================================================================
# TODO: autogenerate from trace.hpp
# NOTE: cffi cannot parse C++ constructs (e.g. enum classes, std::array) so we
#       need to manually adjust some of the fields.


class TraceEntryType(Enum):
    """
    Enum used for the trace entry type, copied from trace.hpp
    TODO: Cffi cannot parse enum classes, find a way to autogenerate from the header file

    The values are matched against the `type` field of `struct trace_entry_t`.
    """
    ENTRY_EOT = 0  # end of trace
    ENTRY_PC = 1  # instruction; `addr` holds its pc
    ENTRY_READ = 2  # memory access (read); `addr` holds the accessed address
    ENTRY_WRITE = 3  # memory access (write); `addr` holds the accessed address
    ENTRY_EXCEPTION = 4  # NOTE(review): field semantics for this type are not visible here
    ENTRY_IND = 5  # presumably an indirect call; `addr` would then hold the target - confirm


# C type name and C definition of a single (leakage) trace entry.
# TraceDecoder passes the definition to cffi and uses the type name to size and allocate entries.
_TRACE_ENTRY_T: Final[str] = "struct trace_entry_t"
_TRACE_ENTRY_DEF: Final[str] = """
struct trace_entry_t {
    // pc for instructions; address for memory accesses; target for indirect calls
    uint64_t addr;
    // instruction size for instructions; memory access size for memory accesses
    uint32_t size;
    // see trace_entry_type_t
    uint8_t type;
    // unused for now
    uint8_t padding[3]; // NOLINT
};
"""

# ==================================================================================================
# Debug Trace types
# ==================================================================================================
# TODO: autogenerate from debug_trace.hpp
# NOTE: cffi cannot parse C++ constructs (e.g. enum classes, std::array) so we
#       need to manually adjust some of the fields.


class DebugTraceEntryType(Enum):
    """
    Enum used for the debug trace entry type, copied from debug_trace.hpp
    TODO: Cffi cannot parse enum classes, find a way to autogenerate from the header file

    The values are matched against the `type` field of `struct debug_trace_entry_t`;
    the comments below name the union member annotated for each type in that struct.
    """
    ENTRY_EOT = 0  # end of trace
    ENTRY_REG_DUMP = 1  # payload: `regs`
    ENTRY_READ = 2  # payload: `mem`
    ENTRY_WRITE = 3  # payload: `mem`
    ENTRY_LOC = 4  # payload: `loc`
    ENTRY_EXCEPTION = 5  # payload: `xcpt`
    ENTRY_CHECKPOINT = 6  # payload: `checkpoint`
    ENTRY_ROLLBACK = 7  # payload: `rollback`
    ENTRY_ROLLBACK_STORE = 8  # payload: `rollback_store`
    ENTRY_REG_DUMP_EXTENDED = 9  # payload: presumably `regs_2` - confirm against debug_trace.hpp


# C type name and C definition of a single debug trace entry.
# TraceDecoder passes the definition to cffi and uses the type name to size and allocate entries.
_DEBUG_TRACE_ENTRY_T: Final[str] = "struct debug_trace_entry_t"
_DEBUG_TRACE_ENTRY_DEF: Final[str] = """
struct debug_trace_entry_t {
    // What does this entry contain
    uint8_t type;
    // Nested speculation (0 is architectural)
    uint8_t nesting_level;
    // Unused for now
    uint8_t padding[6]; // NOLINT

    // Union of all possible entry types
    union {
        // ENTRY_REG_DUMP
        struct {
            uint64_t xax;
            uint64_t xbx;
            uint64_t xcx;
            uint64_t xdx;
            uint64_t xsi;
            uint64_t xdi;
            uint64_t pc;
        } regs;
        // ENTRY_REG_EXTENDED
        struct {
            uint64_t rsp;
            uint64_t rbp;
            uint64_t flags;
            uint64_t r8;
            uint64_t r9;
            uint64_t r10;
            uint64_t r11;
        } regs_2;
        // ENTRY_MEM (read or write)
        struct {
            uint64_t address;
            uint64_t value;
            uint64_t size;
        } mem;
        // ENTRY_LOC (module name and offset, for disassembly)
        struct {
            uint64_t offset;
            char module_name[48]; // NOLINT
        } loc;
        // ENTRY_EXCEPTION
        struct {
            int signal;
            uint64_t address;
        } xcpt;
        // ENTRY_CHECKPOINT
        struct {
            uint64_t rollback_pc;
            uint64_t cur_window_size;
            size_t cur_store_log_size;
        } checkpoint;
        // ENTRY_ROLLBACK
        struct {
            unsigned nesting;
            uint64_t rollback_pc;
        } rollback;
        // ENTRY_ROLLBACK_STORE
        struct {
            uint64_t addr;
            uint64_t val;
            size_t size;
            uint64_t nesting_level;
        } rollback_store;
    };
};
"""


# ==================================================================================================
# Decoder
# ==================================================================================================
class TraceDecoder:
    """
    This class provides a unified API for decoding trace entries

    File layout handled by this class: an 8-byte header (1 marker byte, "T" or "D", followed by
    7 padding bytes) and then a sequence of fixed-size entries. Every trace in the file is
    terminated by an EOT entry.
    """

    _ffi: FFI
    _trace_entry_size: int
    _debug_trace_entry_size: int

    # size of the file header: 1 marker byte + 7 padding bytes
    _MARKER_SIZE: int = 8

    def __init__(self) -> None:
        self._ffi = FFI()
        # Parse trace defs
        self._ffi.cdef(_TRACE_ENTRY_DEF)
        self._trace_entry_size = self._ffi.sizeof(_TRACE_ENTRY_T)
        # Parse debug trace defs
        self._ffi.cdef(_DEBUG_TRACE_ENTRY_DEF)
        self._debug_trace_entry_size = self._ffi.sizeof(_DEBUG_TRACE_ENTRY_T)

    # ----------------------------------------------------------------------------------------------
    # Public API
    # ----------------------------------------------------------------------------------------------
    def read_trace_marker(self, f: BufferedReader) -> Union[_MarkerType, Literal[""]]:
        """
        Get the type of the trace file and advance the reader past the file header.
        :param f: trace file opened in binary mode, positioned at its beginning
        :return: "T" for a normal trace, "D" for a debug trace, "" if the file is empty
        """
        marker = f.read(1).decode('utf-8')
        if len(marker) == 0:
            return ""
        assert marker in get_args(_MarkerType), f"Unknown trace type marker: {marker}"
        f.read(self._MARKER_SIZE - 1)  # skip padding bytes
        return cast(_MarkerType, marker)

    def decode_trace_file(self, file: str) -> List[List[Any]]:
        """
        Read a set of traces from a file.
        :param file: path to a normal ("T") trace file
        :return: one list of decoded entries per trace (each including its EOT entry);
                 an empty list if the file is empty
        :raises ValueError: if an entry has an unknown type or the last trace has no EOT entry
        """
        with open(file, "rb") as f:
            marker = self.read_trace_marker(f)
            if marker == "":  # empty file
                return []
            assert marker == "T", f"Expected Normal trace (T), got {marker}"
            return self._read_traces(f, debug=False)

    def decode_debug_trace_file(self, file: str) -> List[List[Any]]:
        """
        Read a debug trace from a file.
        :param file: path to a debug ("D") trace file
        :return: one list of decoded entries per trace (each including its EOT entry);
                 an empty list if the file is empty
        :raises ValueError: if an entry has an unknown type or the last trace has no EOT entry
        """
        with open(file, "rb") as f:
            marker = self.read_trace_marker(f)
            if marker == "":  # empty file
                return []
            assert marker == "D", f"Expected Debug trace (D), got {marker}"
            return self._read_traces(f, debug=True)

    def is_trace_corrupted(self, trace_path: str) -> bool:
        """
        Check whether a trace file is unusable, i.e., it is missing, empty, too short to hold
        a complete entry, or its last entry is not an EOT entry.
        :param trace_path: path to a normal or debug trace file
        :return: True if the trace is considered corrupted
        :raises ValueError: if the last entry has an unknown type
        """
        # Handle empty and non-existing traces as corrupted
        if not os.path.exists(trace_path):
            return True
        file_size = os.stat(trace_path).st_size
        if file_size == 0:
            return True

        with open(trace_path, "rb") as f:
            trace_type = self.read_trace_marker(f)
            if trace_type == "":
                return True

            # Decode based on the type
            if trace_type == "T":
                entry_sz = self._trace_entry_size
                # the file must hold the header plus at least one complete entry; otherwise
                # the bytes read below would overlap with the header
                if file_size < self._MARKER_SIZE + entry_sz:
                    return True

                # Decode last entry
                f.seek(-entry_sz, os.SEEK_END)
                last_entry = self._decode_trace_entry(f.read(entry_sz))

                # Check its type
                return TraceEntryType(last_entry.type) != TraceEntryType.ENTRY_EOT

            if trace_type == "D":
                entry_sz = self._debug_trace_entry_size
                if file_size < self._MARKER_SIZE + entry_sz:
                    return True

                # Decode last entry
                f.seek(-entry_sz, os.SEEK_END)
                last_dbg_entry = self._decode_debug_trace_entry(f.read(entry_sz))

                # Check its type
                return DebugTraceEntryType(last_dbg_entry.type) != DebugTraceEntryType.ENTRY_EOT

            assert_never(trace_type)

    # ----------------------------------------------------------------------------------------------
    # Private API
    # ----------------------------------------------------------------------------------------------
    def _read_traces(self, f: BufferedReader, debug: bool) -> List[List[Any]]:
        """
        Read all traces from a file whose header has already been consumed.
        :param f: trace file positioned right after the header
        :param debug: True to decode debug trace entries, False to decode normal trace entries
        :return: one list of decoded entries per trace
        :raises ValueError: if the file ends in the middle of a trace (no closing EOT entry)
        """
        if debug:
            entry_size = self._debug_trace_entry_size
            decode = self._decode_debug_trace_entry
            eot = DebugTraceEntryType.ENTRY_EOT.value
        else:
            entry_size = self._trace_entry_size
            decode = self._decode_trace_entry
            eot = TraceEntryType.ENTRY_EOT.value

        traces: List[List[Any]] = []
        entries: List[Any] = []  # entries of the trace that is currently being read
        while True:
            # Read one entry
            chunk = f.read(entry_size)
            if len(chunk) < entry_size:
                break  # no more complete entries to read

            # Decode it
            entry = decode(chunk)
            entries.append(entry)

            # If we reached EOT, move on to the next trace
            if entry.type == eot:
                traces.append(entries)
                entries = []

        # Leftover entries mean that the last trace was not closed by an EOT entry
        if entries:
            raise ValueError("Trace file does not end with an EOT entry")

        return traces

    def _decode_trace_entry(self, chunk: bytes) -> Any:
        """
        Decode a single entry from a chunk of bytes
        :param chunk: raw bytes of one entry (at least the size of `struct trace_entry_t`)
        :return: cffi object of type `struct trace_entry_t *`
        :raises ValueError: if the entry type is not a member of TraceEntryType
        """
        # Decode it with ffi
        entry: Any = self._ffi.new(_TRACE_ENTRY_T + "*")
        self._ffi.memmove(entry, chunk, self._trace_entry_size)

        # Check that the entry type is valid
        try:
            TraceEntryType(entry.type)
        except ValueError as err:
            raise ValueError(f"Error: Unknown trace entry type {str(entry.type)}") from err

        return entry

    def _decode_debug_trace_entry(self, chunk: bytes) -> Any:
        """
        Decode a single debug entry from a chunk of bytes
        :param chunk: raw bytes of one entry (at least the size of `struct debug_trace_entry_t`)
        :return: cffi object of type `struct debug_trace_entry_t *`
        :raises ValueError: if the entry type is not a member of DebugTraceEntryType
        """
        # Decode it with ffi
        entry: Any = self._ffi.new(_DEBUG_TRACE_ENTRY_T + "*")
        self._ffi.memmove(entry, chunk, self._debug_trace_entry_size)

        # Check that the entry type is valid
        try:
            DebugTraceEntryType(entry.type)
        except ValueError as err:
            raise ValueError(f"Error: Unknown debug entry type {str(entry.type)}") from err

        return entry


def main() -> None:
    """
    Standalone decoding interface: pretty-print trace entries from a file

    Expects exactly one command-line argument: the path to a normal ("T") trace file.
    Exits with status 1 on wrong usage, on an empty file, on a debug trace file,
    and when the file contains no traces.
    """
    if len(sys.argv) != 2:
        print(f"Usage {sys.argv[0]} <TRACE_PATH>")
        sys.exit(1)
    trace_path = sys.argv[1]

    # 1. Create decoder
    decoder = TraceDecoder()

    # 2. Decode file
    with open(trace_path, "rb") as f:
        trace_type = decoder.read_trace_marker(f)
    if trace_type == "":
        print(f"Empty trace file: {sys.argv[1]}")
        sys.exit(1)
    if trace_type == "T":
        parsed_traces = decoder.decode_trace_file(trace_path)
    elif trace_type == "D":
        # debug files have to go through the debug decoder: decode_trace_file asserts
        # a "T" marker and would fail before the message below is printed
        n_debug_traces = len(decoder.decode_debug_trace_file(trace_path))
        print(f"Only leakage traces allowed: found {n_debug_traces} debug traces instead")
        sys.exit(1)
    else:
        assert_never(trace_type)

    # Check that the input contains leakage traces
    if len(parsed_traces) == 0:
        print(f"No traces found in {sys.argv[1]}")
        sys.exit(1)

    # 3. Print all entries
    for nt, trace_ in enumerate(parsed_traces):
        print("-------- TRACE --------")
        for ne, e in enumerate(trace_):
            # Parse the entry type
            try:
                type_ = TraceEntryType(e.type)
            except ValueError as err:
                raise ValueError(f"Failed to decode entry {ne} of trace {nt}") from err
            print(f"[{type_.name}] {hex(e.addr)}")


if __name__ == '__main__':
    main()


================================================
FILE: rvzr/model_unicorn/__init__.py
================================================


================================================
FILE: rvzr/model_unicorn/coverage.py
================================================
"""
File: Class for tracking instruction coverage in fuzzing campaigns with Unicorn backend.

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from __future__ import annotations
from collections import defaultdict

from typing import Dict, Optional
from typing_extensions import assert_never

from ..tc_components.instruction import Instruction, RegisterOp, MemoryOp, \
    ImmediateOp, LabelOp, AgenOp, FlagsOp, CondOp
from ..config import CONF

# NOTE: no longer used by _get_instruction_signature (see its docstring);
# left in place in case other modules still reference the name
_SIGNATURE_CACHE: Dict[int, str] = {}


def _get_instruction_signature(instruction: Instruction) -> str:
    """
    Get a brief string representation of the instruction.
    Used as a unique identifier for the instruction when tracking coverage.

    The signature is the instruction name followed by one token per operand
    (e.g., "R64" for a 64-bit register operand, "L" for a label).

    The result is intentionally not memoized by `id(instruction)`: an id is only unique
    while the object is alive, so an instruction created after an older one has been freed
    may get the same id and would then receive the signature of the dead instruction.

    :param instruction: the instruction to describe
    :return: the signature string
    """
    parts = [instruction.name]
    for o in instruction.operands:
        if isinstance(o, RegisterOp):
            parts.append(f"R{o.width}")
        elif isinstance(o, MemoryOp):
            parts.append(f"M{o.width}")
        elif isinstance(o, ImmediateOp):
            parts.append(f"I{o.width}")
        elif isinstance(o, LabelOp):
            parts.append("L")
        elif isinstance(o, AgenOp):
            parts.append(f"A{o.width}")
        elif isinstance(o, FlagsOp):
            parts.append("F")
        elif isinstance(o, CondOp):
            parts.append("C")
        else:
            assert_never(o)

    return " ".join(parts)


class InstructionCoverage:
    """
    Tracks coverage of instructions executed on the model during a fuzzing campaign.

    The campaign-wide counter stores, for every instruction signature, the number of
    test cases in which an instruction with that signature was recorded.
    """
    _cov: Dict[str, int]
    """ instruction coverage of the entire campaign """

    _local_cov: Optional[Dict[str, int]] = None
    """ instruction coverage of the current test case """

    def __init__(self) -> None:
        self._cov = defaultdict(int)

    def start_test_case(self) -> None:
        """
        Start tracking coverage for a new test case when CONF.coverage_type == "model_instructions".
        Otherwise, disable coverage tracking.
        """

        if CONF.coverage_type == "model_instructions":
            self._local_cov = defaultdict(int)
            return

        self._local_cov = None

    def add_instruction(self, inst: Instruction) -> None:
        """ Record the given instruction as covered (if coverage tracking is enabled) """
        if self._local_cov is None:
            return
        if inst.is_instrumentation:
            return
        self._local_cov[_get_instruction_signature(inst)] += 1

    def finish_test_case(self) -> None:
        """
        Finish tracking coverage for the current test case: every signature recorded since the
        last start/finish increments the campaign-wide counter by one.

        The recorded data is discarded afterwards, which makes repeated calls harmless
        (report() calls this method as well).
        """
        if self._local_cov is None:
            return

        for inst_name in self._local_cov:
            self._cov[inst_name] += 1

        # forget what was just merged; otherwise the next call would count it again
        self._local_cov.clear()

    def report(self, path: str) -> None:
        """
        Write the coverage data to a file, one line per signature, sorted by count (descending)
        :param path: path of the report file (overwritten if it exists)
        """
        # Ensure that the last test case is included in the coverage report
        self.finish_test_case()

        # Sort the instructions by coverage count and write them to the file
        inst_names = sorted(self._cov.items(), key=lambda x: x[1], reverse=True)
        with open(path, "w", encoding="utf-8") as f:
            for inst_name, count in inst_names:
                f.write(f"{inst_name:<20} {count}\n")
            if not inst_names:
                f.write("    No coverage data available")


================================================
FILE: rvzr/model_unicorn/execution_context.py
================================================
"""
File: Execution state of the model during a single test case execution

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from __future__ import annotations
from typing import TYPE_CHECKING, Final, Optional, Dict, Tuple

from unicorn import Uc
from ..sandbox import SandboxLayout, CodeArea
from ..tc_components.actor import ActorID

if TYPE_CHECKING:
    from ..tc_components.test_case_code import TestCaseProgram
    from ..tc_components.instruction import Instruction
    from ..tc_components.actor import Actor
    from ..target_desc import TargetDesc

PAGE_PERMISSION_MAP = Dict[ActorID, Tuple[bool, bool]]
""" Data type for storing page permissions for actors """


class ModelExecutionState:
    """
    State variables describing one execution of a test case program
    with a given input on the model
    """

    current_instruction: Instruction
    """ The instruction currently being executed by the model """

    current_actor: Actor
    """ The actor whose code is currently being executed by the model """

    exit_addr: int
    """ The address of the exit instruction in the current test case """

    fault_handler_addr: int
    """ The address of the fault handler in the current test case """

    pending_fault: int = 0
    """ Interface to signal pending soft faults to the model;
    If a fault was triggered but not handled yet, its ID is stored here """

    previous_context: Optional[object] = None
    """ Context of the emulator before the current instruction was executed;
    used to patch a bug in Unicorn """

    had_arch_fault: bool = False
    """ Indicates whether the model has already had a non-speculative fault in the current run """

    page_permissions: Optional[PAGE_PERMISSION_MAP] = None
    """ Dictionary of the page permissions for each actor at the start of execution.
    Only contains permissions on the faulty area, as all other areas are always RW."""

    _test_case: Final[TestCaseProgram]  # The test case being currently executed by the model
    _layout: Final[SandboxLayout]  # The layout of the sandbox

    def __init__(self, test_case: TestCaseProgram, layout: SandboxLayout, target_desc: TargetDesc):
        self._test_case = test_case
        self._layout = layout

        self.exit_addr = self._layout.get_exit_addr(test_case)
        fault_handler_macro = target_desc.macro_specs["fault_handler"]
        self._set_fault_handler_addr(fault_handler_macro.type_)
        self.full_reset()

    def full_reset(self) -> None:
        """ Bring the state back to its initial values; has to be called before each test case """
        self.had_arch_fault = False
        self.pending_fault = 0
        # execution always (re)starts in the actor named "main"
        self.current_actor = self._test_case.find_actor(name="main")

    def reset_after_em_stop(self, start_pc: int) -> None:
        """
        Prepare the state for the next emulator iteration;
        has to be called before each start of the emulator iteration
        :param start_pc: the address where the emulator will start execution
        :return: None
        """
        self.pending_fault = 0
        # the actor is derived from the code address at which execution resumes
        owner_id = self._layout.code_addr_to_actor_id(start_pc)
        self.current_actor = self._test_case.find_actor(actor_id=owner_id)

    def is_exit_addr(self, address: int) -> bool:
        """
        Check if the given address is the exit address; for the main actor,
        any address past the exit address counts as well
        """
        if address == self.exit_addr:
            return True
        return self.current_actor.is_main and address > self.exit_addr

    def update_context(self, em: Uc, address: int) -> None:
        """
        Update the state of the model after each instruction
        :param em: the emulator whose context is saved
        :param address: address of the instruction that becomes the current instruction
        """
        self.previous_context = em.context_save()

        # look up the instruction by its offset within the main code area of the current actor
        actor_id = self.current_actor.get_id()
        area_base = self._layout.get_code_addr(CodeArea.MAIN, actor_id)
        actor_instructions = self._test_case.get_obj().instruction_map()[actor_id]
        self.current_instruction = actor_instructions[address - area_base]

    def current_test_case(self) -> TestCaseProgram:
        """ Return the test case this state belongs to """
        return self._test_case

    def _set_fault_handler_addr(self, fh_id: int) -> None:
        """
        Resolve the address of the fault handler from the offset of the given macro
        :param fh_id: identifier passed to get_macro_offset to locate the fault handler
        """
        binary = self._test_case.get_obj()
        code_base = self._layout.code_start()
        macro_offset = binary.get_macro_offset(fh_id)

        # an offset of -1 makes the handler default to the exit address
        # (presumably: the macro is not present in the test case)
        if macro_offset == -1:
            self.fault_handler_addr = self.exit_addr
        else:
            self.fault_handler_addr = code_base + macro_offset


================================================
FILE: rvzr/model_unicorn/interpreter.py
================================================
"""
File: Abstract interface and architecture-specific implementation of the extra interpreter logic.

      The extra interpreter is a component that provides additional interpretation
      logic over the one provided by Unicorn.

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from __future__ import annotations
from abc import ABC, abstractmethod
from typing import TYPE_CHECKING, Tuple, Dict, Callable, Set, Optional, List, Final

from unicorn import UC_ERR_NOMEM, UcError, UC_ERR_EXCEPTION, UC_MEM_WRITE, UC_ERR_INSN_INVALID, \
    UC_ERR_READ_PROT, UC_ERR_WRITE_PROT
import unicorn.x86_const as x86ucc  # type: ignore  # no type hints available

from ..tc_components.actor import ActorMode, ActorPL, Actor, ActorID, PTEMask
from ..sandbox import CodeArea, DataArea
from ..logs import warning

if TYPE_CHECKING:
    from .model import UnicornModel
    from .execution_context import ModelExecutionState
    from ..target_desc import TargetDesc, UnicornTargetDesc
    from ..tc_components.instruction import Instruction
    from ..tc_components.test_case_code import TestCaseProgram
    from ..tc_components.test_case_binary import SymbolTableEntry
    from ..tc_components.test_case_data import InputData

CRITICAL_ERROR = UC_ERR_NOMEM  # the model never handles this error, hence it will always crash


# ==================================================================================================
# Public Interface
# ==================================================================================================
class ExtraInterpreter(ABC):
    """
    Interpretation layer on top of Unicorn that supplies the logic Unicorn does not provide,
    for example, the interpretation of macros and the emulation of CPU modes.

    This class defines the generic interface and the dispatch logic only; the ISA-specific
    subclasses provide the actual implementations.
    """
    _model: Final[UnicornModel]
    _target_desc: Final[TargetDesc]
    _uc_target_desc: Final[UnicornTargetDesc]

    def __init__(self, target_desc: TargetDesc, model: UnicornModel):
        self._model = model
        self._target_desc = target_desc
        self._uc_target_desc = target_desc.uc_target_desc

    @abstractmethod
    def load_test_case(self, test_case: TestCaseProgram) -> None:
        """ Prepare the interpreter for executing the given test case """

    @abstractmethod
    def load_input(self, input_: InputData) -> None:
        """ Prepare the interpreter for executing the loaded test case with the given input """

    def interpret_instruction(self, address: int, state: ModelExecutionState) -> None:
        """
        Apply the extra interpretation logic to the instruction in `state.current_instruction`,
        which is located at `address`
        """
        inst = state.current_instruction

        # macros are pseudo-instructions and are executed by the ISA-specific interpreter
        if inst.name == "macro":
            self._interpret_macro(inst, address)

        # the actor is read only now because a macro may have switched it;
        # guest mode takes precedence over the privilege level
        actor = state.current_actor
        if actor.mode == ActorMode.GUEST:
            self._emulate_vm_execution(address)
            return
        if actor.privilege_level == ActorPL.USER:
            self._emulate_userspace_execution(address)

    def interpret_mem_access(self, access: int, address: int, size: int, value: int) -> None:
        """ Hook for memory accesses; does nothing by default and may be extended by subclasses """

    @abstractmethod
    def _interpret_macro(self, macro: Instruction, pc: int) -> None:
        """ Emulate the execution of the macro instruction `macro` located at `pc` """

    @abstractmethod
    def _emulate_vm_execution(self, address: int) -> None:
        """ Emulate the execution of the instruction at `address` in VM guest mode """

    @abstractmethod
    def _emulate_userspace_execution(self, address: int) -> None:
        """ Emulate the execution of the instruction at `address` in userspace mode """


# ==================================================================================================
# Architecture-specific Implementations
# ==================================================================================================
class X86ExtraInterpreter(ExtraInterpreter):
    """
    ExtraInterpreter implementation for the x86 architecture.

    Every task is delegated to a dedicated helper: macro interpretation, VM guest emulation,
    userspace emulation, and page-permission (fault) handling.
    """

    _macro_interpreter: _X86MacroInterpreter
    _vm_interpreter: _X86VMInterpreter
    _userspace_interpreter: _X86UserspaceInterpreter
    _fault_interpreter: _X86FaultInterpreter

    def __init__(self, target_desc: TargetDesc, model: UnicornModel):
        super().__init__(target_desc, model)
        self._macro_interpreter = _X86MacroInterpreter(model, target_desc)
        self._vm_interpreter = _X86VMInterpreter(model, target_desc)
        self._userspace_interpreter = _X86UserspaceInterpreter(model, target_desc)
        self._fault_interpreter = _X86FaultInterpreter(model, target_desc)

    def load_test_case(self, test_case: TestCaseProgram) -> None:
        """ Pass the test case to the macro and fault helpers; reset the mode emulators """
        self._macro_interpreter.load_test_case(test_case)
        self._fault_interpreter.load_test_case(test_case)

        # the mode emulators cache per-address results, which are stale for a new test case
        for mode_emulator in (self._vm_interpreter, self._userspace_interpreter):
            mode_emulator.reset()

    def load_input(self, input_: InputData) -> None:
        """ Let the fault helper set up the memory permissions for the given input """
        self._fault_interpreter.load_input(input_)

    def interpret_mem_access(self, access: int, address: int, size: int, value: int) -> None:
        """ Induce user/kernel permission faults for the accessed address, if applicable """
        super().interpret_mem_access(access, address, size, value)
        accessing_actor = self._model.state.current_actor
        self._fault_interpreter.induce_user_faults(accessing_actor, address)

    def _interpret_macro(self, macro: Instruction, pc: int) -> None:
        self._macro_interpreter.interpret(macro, pc)

    def _emulate_vm_execution(self, address: int) -> None:
        current_inst = self._model.state.current_instruction
        self._vm_interpreter.interpret(current_inst, address)

    def _emulate_userspace_execution(self, address: int) -> None:
        current_inst = self._model.state.current_instruction
        self._userspace_interpreter.interpret(current_inst, address)


class ARMExtraInterpreter(ExtraInterpreter):
    """
    ExtraInterpreter implementation for the arm architecture.

    Macros and faults are delegated to dedicated helpers; VM guest and userspace emulation
    are no-ops in this implementation.
    """

    _macro_interpreter: _ARM64MacroInterpreter
    _fault_interpreter: _ARM64FaultInterpreter

    def __init__(self, target_desc: TargetDesc, model: UnicornModel):
        super().__init__(target_desc, model)
        self._macro_interpreter = _ARM64MacroInterpreter(model, target_desc)
        self._fault_interpreter = _ARM64FaultInterpreter(model, target_desc)

    def load_test_case(self, test_case: TestCaseProgram) -> None:
        """ Pass the test case to the macro helper first, then to the fault helper """
        self._macro_interpreter.load_test_case(test_case)
        self._fault_interpreter.load_test_case(test_case)

    def load_input(self, input_: InputData) -> None:
        """ Let the fault helper set up the memory permissions for the given input """
        self._fault_interpreter.load_input(input_)

    def interpret_mem_access(self, access: int, address: int, size: int, value: int) -> None:
        """ Emulate the fault for page-crossing accesses that end in the faulty area """
        super().interpret_mem_access(access, address, size, value)
        self._fault_interpreter.emulate_crossing_fault(access, address, size)

    def _interpret_macro(self, macro: Instruction, pc: int) -> None:
        self._macro_interpreter.interpret(macro, pc)

    def _emulate_vm_execution(self, address: int) -> None:
        """ Nothing to emulate: no VM guest logic is implemented for this architecture """

    def _emulate_userspace_execution(self, address: int) -> None:
        """ Nothing to emulate: no userspace logic is implemented for this architecture """


# ==================================================================================================
# Private: Macro Interpretation
# ==================================================================================================

# Signature shared by all macro handlers: four integer arguments, each one a 16-bit field
# unpacked from the macro's symbol-table entry (see _MacroInterpreterCommon._get_macro_args).
_MacroCallback = Callable[[int, int, int, int], None]


class _MacroInterpreterCommon:
    """
    Architecture-independent part of the macro interpreter: symbol table bookkeeping,
    macro dispatch, and the macros available on every architecture.
    """
    _model: UnicornModel
    _uc_target_desc: UnicornTargetDesc

    _test_case: Optional[TestCaseProgram] = None
    _function_table: List[SymbolTableEntry]
    _macro_table: List[SymbolTableEntry]
    _macro_callbacks: Dict[str, _MacroCallback]

    _curr_targets: Dict[str, int]
    _sid_to_actor: Dict[int, Actor]

    def __init__(self, model: UnicornModel, target_desc: TargetDesc):
        self._model = model
        self._uc_target_desc = target_desc.uc_target_desc

        # symbol tables stay empty until a test case is loaded
        self._function_table = []
        self._macro_table = []

        # jump targets of the transition macros, keyed by the transition name
        self._curr_targets = dict.fromkeys(("h2g", "g2h", "k2u", "u2k"), 0)

        # macro name -> handler; subclasses register their own macros on top of these
        self._macro_callbacks = {
            "measurement_start": self._macro_measurement_start,
            "measurement_end": self._macro_measurement_end,
            "switch": self._macro_switch,
            "fault_handler": lambda *_: None,
        }

    def load_test_case(self, test_case: TestCaseProgram) -> None:
        """
        Remember the test case and rebuild the function table, the macro table,
        and the section ID -> actor map from it
        """
        self._test_case = test_case
        symbols = test_case.get_obj().symbol_table()

        # entries with type 0 are functions; they are kept ordered by their `arg` field
        # because functions are later looked up by their index in this table
        self._function_table = sorted(
            (entry for entry in symbols if entry.type_ == 0), key=lambda entry: entry.arg)

        # all other entries are macros
        self._macro_table = [entry for entry in symbols if entry.type_ != 0]

        actor_map: Dict[int, Actor] = {}
        for actor in test_case.get_actors():
            actor_map[actor.get_id()] = actor
        self._sid_to_actor = actor_map

    def interpret(self, macro: Instruction, pc: int) -> None:
        """
        Execute the logic of the macro instruction `macro` located at address `pc`.
        Raises UcError(CRITICAL_ERROR) if the macro is unknown or has no symbol table entry.
        """
        state = self._model.state
        sid = state.current_actor.get_id()

        # macros are identified by their offset within the main code area of the current actor
        offset = pc - self._model.layout.get_code_addr(CodeArea.MAIN, sid)
        args = self._get_macro_args(sid, offset)

        # the first operand holds the macro name; its first character is skipped
        name = macro.operands[0].value.lower()[1:]
        handler = self._macro_callbacks.get(name)
        if handler is None:
            warning("interpret", f"unknown macro: {name}")
            raise UcError(CRITICAL_ERROR)

        handler(*args)

    def _get_macro_args(self, section_id: int, section_offset: int) -> Tuple[int, int, int, int]:
        """
        Find the macro at the given section and offset, and unpack its `arg` field
        into four 16-bit values (lowest bits first)
        """
        for entry in self._macro_table:
            if entry.sid != section_id or entry.offset != section_offset:
                continue
            packed = entry.arg
            arg1 = packed & 0xFFFF
            arg2 = (packed >> 16) & 0xFFFF
            arg3 = (packed >> 32) & 0xFFFF
            arg4 = (packed >> 48) & 0xFFFF
            return arg1, arg2, arg3, arg4

        warning("get_macro_args", "macro not found in symbol table")
        raise UcError(CRITICAL_ERROR)

    def _find_function_by_id(self, function_id: int) -> SymbolTableEntry:
        """ Return the function table entry at index `function_id`; crash if out of range """
        if not 0 <= function_id < len(self._function_table):
            warning("find_function_by_id", "function not found in symbol table")
            raise UcError(CRITICAL_ERROR)
        return self._function_table[function_id]

    def _macro_measurement_start(self, _: int, __: int, ___: int, ____: int) -> None:
        """ Enable tracing, unless the model is currently speculating """
        if self._model.speculator.in_speculation():
            return
        self._model.tracer.enable_tracing = True

    def _macro_measurement_end(self, _: int, __: int, ___: int, ____: int) -> None:
        """ Disable tracing, unless the model is currently speculating """
        if self._model.speculator.in_speculation():
            return
        self._model.tracer.enable_tracing = False

    def _macro_switch(self, section_id: int, function_id: int, _: int, __: int) -> None:
        """
        Jump to function `function_id` in section `section_id`, point the actor base register
        and the SP at the data area of that section, and make its actor the current one
        """
        emulator = self._model.emulator
        layout = self._model.layout
        regs = self._uc_target_desc

        # new PC: base of the section's main code area + offset of the function
        code_base = layout.get_code_addr(CodeArea.MAIN, section_id)
        target = code_base + self._find_function_by_id(function_id).offset
        emulator.reg_write(regs.pc_register, target)

        # new data area base and stack pointer
        data_base = layout.get_data_addr(DataArea.MAIN, section_id)
        stack_init = layout.get_data_addr(DataArea.RSP_INIT, section_id)
        emulator.reg_write(regs.actor_base_register, data_base)
        emulator.reg_write(regs.sp_register, stack_init)

        # new current actor
        self._model.state.current_actor = self._sid_to_actor[section_id]


class _X86MacroInterpreter(_MacroInterpreterCommon):
    """
    Interpreter of the x86-specific macros: kernel<->user and host<->guest transitions,
    their target setters and landing pads, and the data permission macro
    """
    _pseudo_lstar: int
    _is_amd: bool

    def __init__(self, model: UnicornModel, target_desc: TargetDesc):
        super().__init__(model, target_desc)
        self._is_amd = target_desc.cpu_desc.vendor == "AMD"
        self._macro_callbacks.update(
            switch_k2u=self._macro_switch_k2u,
            switch_u2k=self._macro_switch_u2k,
            set_k2u_target=self._macro_set_k2u_target,
            set_u2k_target=self._macro_set_u2k_target,
            switch_h2g=self._macro_switch_h2g,
            switch_g2h=self._macro_switch_g2h,
            set_h2g_target=self._macro_set_h2g_target,
            set_g2h_target=self._macro_set_g2h_target,
            landing_k2u=self._macro_landing_k2u,
            landing_u2k=self._macro_landing_u2k,
            landing_h2g=self._macro_landing_h2g,
            landing_g2h=self._macro_landing_g2h,
            set_data_permissions=self._macro_set_data_permissions,
        )

    def load_test_case(self, test_case: TestCaseProgram) -> None:
        """ Load the test case and reset the emulated LSTAR to the exit address """
        super().load_test_case(test_case)
        self._pseudo_lstar = self._model.state.exit_addr

    # ----------------------------------------------------------------------------------------------
    # Helpers shared by the macro handlers
    def _function_addr(self, section_id: int, function_id: int) -> int:
        """ Address of function `function_id` relative to the main code area of `section_id` """
        section_addr = self._model.layout.get_code_addr(CodeArea.MAIN, section_id)
        return section_addr + self._find_function_by_id(function_id).offset

    def _jump_and_rebase(self, target_addr: int, section_id: int) -> None:
        """
        Write `target_addr` to the PC, then point the actor base register and RSP
        at the data area of section `section_id`
        """
        emulator = self._model.emulator
        layout = self._model.layout

        # PC update
        emulator.reg_write(self._uc_target_desc.pc_register, target_addr)

        # data area base and SP update
        data_base = layout.get_data_addr(DataArea.MAIN, section_id)
        stack_init = layout.get_data_addr(DataArea.RSP_INIT, section_id)
        emulator.reg_write(self._uc_target_desc.actor_base_register, data_base)
        emulator.reg_write(x86ucc.UC_X86_REG_RSP, stack_init)

    def _activate_actor(self, section_id: int) -> None:
        """ Make the actor of section `section_id` the current actor of the model """
        self._model.state.current_actor = self._sid_to_actor[section_id]

    def _clobber_rax_on_amd(self) -> None:
        """ Model the RAX clobbering of AMD VM transitions as a zero write to RAX """
        if self._is_amd:
            self._model.emulator.reg_write(x86ucc.UC_X86_REG_RAX, 0)

    # ----------------------------------------------------------------------------------------------
    # Kernel <-> user transitions
    def _macro_set_k2u_target(self, section_id: int, function_id: int, _: int, __: int) -> None:
        """ Decode the arguments into an address and store it as the k2u target """
        self._curr_targets["k2u"] = self._function_addr(section_id, function_id)

    def _macro_switch_k2u(self, section_id: int, _: int, __: int, ___: int) -> None:
        """
        Jump to the stored k2u target, update the data area base and SP,
        and switch the current actor
        """
        self._jump_and_rebase(self._curr_targets["k2u"], section_id)

        # side effects (currently disabled)
        # flags = model.emulator.reg_read(x86ucc.UC_X86_REG_EFLAGS)
        # rsp = model.emulator.reg_read(x86ucc.UC_X86_REG_RSP)
        # model.emulator.mem_write(rsp - 8, flags.to_bytes(8, byteorder='little'))  # type: ignore

        self._activate_actor(section_id)

    def _macro_set_u2k_target(self, section_id: int, function_id: int, _: int, __: int) -> None:
        """
        Store the target address in the emulated LSTAR if the current actor runs in kernel mode;
        otherwise, trigger a soft fault and leave the emulated LSTAR untouched
        """
        if self._model.state.current_actor.privilege_level != ActorPL.KERNEL:
            self._model.do_soft_fault(UC_ERR_EXCEPTION)
            return

        self._pseudo_lstar = self._function_addr(section_id, function_id)

    def _macro_switch_u2k(self, section_id: int, _: int, __: int, ___: int) -> None:
        """
        Jump to the emulated LSTAR, update the data area base and SP,
        and switch the current actor
        """
        self._jump_and_rebase(self._pseudo_lstar, section_id)
        self._activate_actor(section_id)

    # ----------------------------------------------------------------------------------------------
    # Host <-> guest transitions
    def _macro_switch_h2g(self, section_id: int, _: int, __: int, ___: int) -> None:
        """
        Jump to the stored h2g target, update the data area base and SP, reset the flags,
        and switch the current actor; on AMD, RAX is zeroed as well
        """
        self._jump_and_rebase(self._curr_targets["h2g"], section_id)

        # reset flags
        self._model.emulator.reg_write(x86ucc.UC_X86_REG_EFLAGS, 0b10)

        self._activate_actor(section_id)

        # AMD VMRUN clobbers RAX
        self._clobber_rax_on_amd()

    def _macro_switch_g2h(self, section_id: int, _: int, __: int, ___: int) -> None:
        """
        Jump to the stored g2h target, update the data area base and SP,
        and switch the current actor; on AMD, RAX is zeroed as well
        """
        self._jump_and_rebase(self._curr_targets["g2h"], section_id)
        self._activate_actor(section_id)

        # AMD VMEXIT clobbers RAX
        self._clobber_rax_on_amd()

    def _macro_set_h2g_target(self, section_id: int, function_id: int, _: int, __: int) -> None:
        """ Decode the arguments into an address and store it as the h2g target """
        self._curr_targets["h2g"] = self._function_addr(section_id, function_id)

    def _macro_set_g2h_target(self, section_id: int, function_id: int, _: int, __: int) -> None:
        """ Decode the arguments into an address and store it as the g2h target """
        self._curr_targets["g2h"] = self._function_addr(section_id, function_id)

    # ----------------------------------------------------------------------------------------------
    # Landing pads
    def _macro_landing_k2u(self, _: int, __: int, ___: int, ____: int) -> None:
        """ Landing for the k2u switch: zeroes RCX """
        self._model.emulator.reg_write(x86ucc.UC_X86_REG_RCX, 0)

    def _macro_landing_u2k(self, _: int, __: int, ___: int, ____: int) -> None:
        """ Landing for the u2k switch: zeroes RCX """
        self._model.emulator.reg_write(x86ucc.UC_X86_REG_RCX, 0)

    def _macro_landing_h2g(self, _: int, __: int, ___: int, ____: int) -> None:
        """ Landing for the h2g switch: no effect on the model """

    def _macro_landing_g2h(self, _: int, __: int, ___: int, ____: int) -> None:
        """ Landing for the g2h switch: no effect on the model """

    # ----------------------------------------------------------------------------------------------
    # Permissions
    def _macro_set_data_permissions(self, actor_id: int, must_set: int, must_clear: int,
                                    _: int) -> None:
        """ Manual setting of data permissions for the actor: no effect on the model """


class _ARM64MacroInterpreter(_MacroInterpreterCommon):
    """
    Implements the interpretation of ARM64-specific macros.

    No ARM64-only macro has real logic at the moment: the only handler registered here is a
    no-op for `fault_handler`.
    """

    def __init__(self, model: UnicornModel, target_desc: TargetDesc):
        super().__init__(model, target_desc)
        # `fault_handler` has no effect on the model; ARM64-specific handlers are registered here
        self._macro_callbacks.update({
            "fault_handler": lambda *_: None,
        })


# ==================================================================================================
# Private: VM mode and Userspace Emulation
# ==================================================================================================
class _X86VMInterpreter:
    """ Adds the ability to emulate VM guest execution to the Unicorn emulator """

    safe_address_cache: Set[int]
    always_exit_instructions: Set[str] = {
        "cpuid", "getsec", "xgetbv", "xsetbv", "xrstors", "xsaves", "invd", "invept", "invvpid",
        "vmptrld", "vmptrst", "vmclear", "vmxon", "vmxoff", "vmlaunch", "vmresume", "vmcall",
        "vmfunc", "hlt", "invlpg", "invpcid", "lgdt", "lidt", "lldt", "ltr", "sgdt", "sidt", "sldt",
        "str", "loadiwkey", "monitor", "mwait", "rdpmc", "rdrand", "rdseed", "rdtsc", "rdtscp",
        "rsm", "tpause", "umwait", "vmread", "vmwrite", "wbinvd", "wbnoinvd", "wrmsr", "fxsave",
        "fxsave64", "in", "ins", "insb", "insw", "insd", "out", "outs", "outsb", "outsw", "outsd",
        "pause", "rdmsr", "swapgs"
    }
    always_exiting_registers = ["cr0", "cr3", "cr8", "dr0", "dr1", "dr2", "dr3", "dr6", "dr7"]

    def __init__(self, model: UnicornModel, target_desc: TargetDesc) -> None:
        self._model = model
        self._uc_target_desc = target_desc.uc_target_desc
        self.safe_address_cache = set()

    def reset(self) -> None:
        """ Reset the state of the interpreter; MUST be called for every new test case """
        self.safe_address_cache.clear()

    def interpret(self, inst: Instruction, address: int) -> None:
        """ Interpret the given instruction """

        if address in self.safe_address_cache:
            return
        stripped_name = inst.name.split()[-1]

        # always-exiting instruction
        if stripped_name in self.always_exit_instructions:
            # make sure that the memory accesses get exposed
            if inst.has_mem_operand(True):
                ops = inst.get_mem_operands(True)
                for op in ops:
                    words = op.value.split("+")
                    for word in words:
                        reg = self._uc_target_desc.reg_str_to_constant.get(word.lower(), 0)
                        if reg:
                            value = int(self._model.emulator.reg_read(reg))  # type: ignore
                            self._model.tracer.observe_mem_access(UC_MEM_WRITE, value, 8, 0)
            self._model.do_soft_fault(UC_ERR_INSN_INVALID)
            return

        # conditional exit
        if stripped_name == "mov":
            if not self._emulate_move(inst, address):
                return

        # safe instruction
        self.safe_address_cache.add(address)

    def _emulate_move(self, inst: Instruction, _: int) -> bool:
        for operand in inst.operands:
            if operand.value in self.always_exiting_registers:
                self._model.do_soft_fault(UC_ERR_INSN_INVALID)
                return False
        return True


class _X86UserspaceInterpreter(_X86VMInterpreter):
    """
    Adds the ability to emulate user-space execution to the Unicorn emulator.

    Reuses the checking logic of the VM interpreter; only the lists of faulting instructions
    and registers are replaced with the ones that apply to user-space execution.
    """
    always_exit_instructions: Set[str] = {
        "cpuid", "rdmsr", "wrmsr", "rdtsc", "rdtscp", "clac", "stac", "clgi", "stgi", "clts",
        "invd", "invlpg", "invlpga", "invlpgb", "invpcid", "lgdt", "lldt", "lidt", "ltr", "sgdt",
        "sidt", "sldt", "str", "psmash", "pvalidate", "rmpadjust", "rmpquery", "rmpupdate",
        "skinit", "sysretq", "sysexitq", "tlbsync", "vmmcall", "vmload", "vmsave", "vmrun",
        "wbinvd", "wbnoinvd", "smsw", "lmsw", "rdfsbase", "rdgsbase", "wrfsbase", "wrgsbase",
        "swapgs", "vmclear", "vmlaunch", "vmptrld", "vmptrst", "vmread", "vmresume", "vmwrite",
        "vmxoff", "invvpid", "getsec", "loadiwkey", "pconfig", "encls", "enclv", "hlt", "xgetbv",
        "xsetbv"
    }
    always_exiting_registers = [
        "cr0", "cr2", "cr3", "cr8", "dr0", "dr1", "dr2", "dr3", "dr6", "dr7"
    ]


# ==================================================================================================
# Private: Fault Handling and Permissions
# ==================================================================================================
class _FaultInterpreterCommon(ABC):
    """
    Architecture-independent handling of page permissions and permission faults.
    The decoding of the (extended) page table entry bits is left to the subclasses.
    """
    _model: UnicornModel
    _target_desc: TargetDesc
    _uc_target_desc: UnicornTargetDesc
    _test_case: Optional[TestCaseProgram] = None

    # per-actor permissions, rebuilt for every test case
    _faulty_page_readable: Dict[ActorID, bool]
    _faulty_page_writable: Dict[ActorID, bool]
    _faulty_page_user_accessible: Dict[ActorID, bool]
    _main_page_user_accessible: Dict[ActorID, bool]

    def __init__(self, model: UnicornModel, target_desc: TargetDesc):
        self._model = model
        self._target_desc = target_desc
        self._uc_target_desc = target_desc.uc_target_desc

    def load_test_case(self, test_case: TestCaseProgram) -> None:
        """
        Recompute the per-actor page permissions from the actors of the given test case
        and publish the read/write permissions of the faulty pages in the model state
        """
        self._test_case = test_case
        self._faulty_page_readable = {}
        self._faulty_page_writable = {}
        self._faulty_page_user_accessible = {}
        self._main_page_user_accessible = {}

        for actor in test_case.get_actors(sorted_=True):
            aid = actor.get_id()

            # permissions encoded in the page table entry of the actor's data
            pte: PTEMask = actor.data_properties
            readable = self._page_is_readable(pte)
            writable = self._page_is_writable(pte)
            user_accessible = self._page_is_user_accessible(pte)
            main_is_user = actor.privilege_level == ActorPL.USER

            # guests are additionally restricted by the extended page table entry
            # NOTE: EPT user-accessible bit is not supported yet
            if actor.mode == ActorMode.GUEST:
                epte: PTEMask = actor.data_ept_properties
                readable &= self._extended_page_is_readable(epte)
                writable &= self._extended_page_is_writable(epte)

            self._faulty_page_readable[aid] = readable
            self._faulty_page_writable[aid] = writable
            self._faulty_page_user_accessible[aid] = user_accessible
            self._main_page_user_accessible[aid] = main_is_user

        # make the permissions available to other components of the model;
        # NOTE: this indexing relies on the actor IDs being 0..n_actors-1
        self._model.state.page_permissions = {}
        permissions = self._model.state.page_permissions
        for actor_id in range(test_case.n_actors()):
            permissions[actor_id] = (self._faulty_page_readable[actor_id],
                                     self._faulty_page_writable[actor_id])

    def load_input(self, _: InputData) -> None:
        """
        Apply the permissions of the faulty areas to the model memory.
        Areas that are both readable and writable are left untouched.
        """
        assert self._test_case is not None

        for actor_id in range(self._test_case.n_actors()):
            if not self._faulty_page_readable[actor_id]:
                # non-readable area: neither reads nor writes are permitted
                self._model.set_faulty_area_rw(actor_id, False, False)
                continue
            if not self._faulty_page_writable[actor_id]:
                # read-only area
                self._model.set_faulty_area_rw(actor_id, True, False)

    def induce_user_faults(self, current_actor: Actor, address: int) -> None:
        """
        Trigger a soft fault if `current_actor` accesses a data page whose user/kernel
        accessibility does not match the actor's privilege level.
        Addresses outside of the data areas are ignored.
        """
        layout = self._model.layout
        if not layout.is_data_addr(address):
            return

        # identify the target page privilege level; the faulty page has its own
        # user-accessible flag, all other pages follow the privilege level of their owner
        owner_id = layout.data_addr_to_actor_id(address)
        faulty_start = layout.get_data_addr(DataArea.FAULTY, owner_id)
        page_base = address & 0xFFFFFFFFFFFFF000
        if page_base == faulty_start:
            page_is_user = self._faulty_page_user_accessible[owner_id]
        else:
            page_is_user = self._main_page_user_accessible[owner_id]

        level = current_actor.privilege_level

        # user actors produce faults when accessing data from kernel space
        user_hits_kernel_page = level == ActorPL.USER and not page_is_user

        # kernel actors produce faults when accessing data of user actors
        # NOTE: this code assumes that SMAP is enabled, which may or may not be the case in practice
        kernel_hits_user_page = level == ActorPL.KERNEL and page_is_user

        # NOTE(review): 13 looks like Unicorn's UC_ERR_READ_PROT - confirm and consider
        # using the named constant
        if user_hits_kernel_page or kernel_hits_user_page:
            self._model.do_soft_fault(13)

    @abstractmethod
    def _page_is_readable(self, pet: PTEMask) -> bool:
        """ Tell whether the PTE bits in `pet` describe a readable page """

    @abstractmethod
    def _page_is_writable(self, pet: PTEMask) -> bool:
        """ Tell whether the PTE bits in `pet` describe a writable page """

    @abstractmethod
    def _page_is_user_accessible(self, pet: PTEMask) -> bool:
        """ Tell whether the PTE bits in `pet` describe a user-accessible page """

    @abstractmethod
    def _extended_page_is_readable(self, epet: PTEMask) -> bool:
        """ Tell whether the EPTE bits in `epet` describe a readable page """

    @abstractmethod
    def _extended_page_is_writable(self, epet: PTEMask) -> bool:
        """ Tell whether the EPTE bits in `epet` describe a writable page """


class _X86FaultInterpreter(_FaultInterpreterCommon):
    """
    x86 decoding of the page permissions: the bit positions are taken from the target
    description (`pte_bits` for regular entries, `vm_pte_bits` for extended ones)
    """

    @staticmethod
    def _bit_is_set(mask: PTEMask, bit_index: int) -> bool:
        """ Tell whether the bit number `bit_index` is set in `mask` """
        return bool(mask & (1 << bit_index))

    def _page_is_readable(self, pet: PTEMask) -> bool:
        """ Readable: present and accessed bits are set, and the reserved bit is clear """
        bits = self._target_desc.pte_bits
        return (self._bit_is_set(pet, bits["present"][0])
                and self._bit_is_set(pet, bits["accessed"][0])
                and not self._bit_is_set(pet, bits["reserved_bit"][0]))

    def _page_is_writable(self, pet: PTEMask) -> bool:
        """ Writable: both the writable and the dirty bits are set """
        bits = self._target_desc.pte_bits
        return (self._bit_is_set(pet, bits["writable"][0])
                and self._bit_is_set(pet, bits["dirty"][0]))

    def _page_is_user_accessible(self, pet: PTEMask) -> bool:
        """ User-accessible: the user bit is set """
        bits = self._target_desc.pte_bits
        return self._bit_is_set(pet, bits["user"][0])

    def _extended_page_is_readable(self, epet: PTEMask) -> bool:
        """ Same rule as for the regular entries, applied to the extended entry bits """
        bits = self._target_desc.vm_pte_bits
        return (self._bit_is_set(epet, bits["present"][0])
                and self._bit_is_set(epet, bits["accessed"][0])
                and not self._bit_is_set(epet, bits["reserved_bit"][0]))

    def _extended_page_is_writable(self, epet: PTEMask) -> bool:
        """ Same rule as for the regular entries, applied to the extended entry bits """
        bits = self._target_desc.vm_pte_bits
        return (self._bit_is_set(epet, bits["writable"][0])
                and self._bit_is_set(epet, bits["dirty"][0]))


class _ARM64FaultInterpreter(_FaultInterpreterCommon):
    """ Implements page fault handling and permission checking for the ARM64 architecture """

    def _page_is_readable(self, pet: PTEMask) -> bool:
        """ Readable: the `valid` bit is set """
        pte_desc = self._target_desc.pte_bits
        if (pet & (1 << pte_desc["valid"][0])) == 0:
            return False
        return True

    def _page_is_writable(self, pet: PTEMask) -> bool:
        """ Writable: the `non_writable` bit is clear """
        pte_desc = self._target_desc.pte_bits
        if (pet & (1 << pte_desc["non_writable"][0])) != 0:
            return False
        return True

    def _page_is_user_accessible(self, pet: PTEMask) -> bool:
        return True  # FIXME: implement user/supervisor bit check

    def _extended_page_is_readable(self, epet: PTEMask) -> bool:
        """ Extended page table entries are not checked on ARM64: always readable """
        return True

    def _extended_page_is_writable(self, epet: PTEMask) -> bool:
        """ Extended page table entries are not checked on ARM64: always writable """
        return True

    def emulate_crossing_fault(self, access: int, address: int, size: int) -> None:
        """
        Workaround: Unicorn does not trigger a fault if the memory access crosses a page
        boundary and the first page is accessible but the second is not.

        A soft fault is triggered when the access crosses a page boundary, its last byte falls
        into the faulty area of the actor that owns `address`, and the permissions of that
        area forbid the access.
        """
        # No need for the workaround if the access is within a page. The last accessed byte
        # is at page offset (offset + size - 1), hence the access stays within the page
        # as long as (offset + size) does not exceed the page size
        if address % 0x1000 + size <= 0x1000:
            return

        # Also does not apply if the crossing goes to any other page than the faulty area
        layout = self._model.layout
        access_end = address + size - 1
        actor_id = layout.data_addr_to_actor_id(address)
        if actor_id == -1:  # the address does not belong to any actor
            return
        faulty_base = layout.get_data_addr(DataArea.FAULTY, actor_id)
        faulty_end = faulty_base + layout.data_area_size(DataArea.FAULTY)
        if access_end < faulty_base or access_end >= faulty_end:
            return

        # Emulate a fault if the faulty area is non-readable/non-writable;
        # a non-readable area faults regardless of the access type
        if not self._faulty_page_readable[actor_id]:
            self._model.do_soft_fault(UC_ERR_READ_PROT)
            return
        if access == UC_MEM_WRITE and not self._faulty_page_writable[actor_id]:
            self._model.do_soft_fault(UC_ERR_WRITE_PROT)
            return


================================================
FILE: rvzr/model_unicorn/model.py
================================================
"""
File: Unicorn-based backend to the contract model.

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""

from __future__ import annotations
from abc import ABC, abstractmethod
from typing import List, Tuple, Optional, Set, TYPE_CHECKING, Final, Dict, Type

import numpy as np

import unicorn as uc
import unicorn.x86_const as x86ucc  # type: ignore # no type hints for unicorn.x86_const
import unicorn.arm64_const as armucc  # type: ignore # no type hints for unicorn.arm_const
from unicorn import Uc, UC_HOOK_CODE, UC_HOOK_MEM_READ, UC_HOOK_MEM_WRITE, \
    UC_HOOK_MEM_UNMAPPED, UcError, UC_MEM_WRITE, UC_PROT_NONE, UC_PROT_READ

from ..model import Model
from ..sandbox import SandboxLayout, DataArea
from ..config import CONF
from ..logs import ModelLogger, BLUE, COL_RESET, error
from ..traces import CTraceEntry

from .taint_tracker import UnicornTaintTracker
from .coverage import InstructionCoverage
from .execution_context import ModelExecutionState

if TYPE_CHECKING:
    from ..tc_components.test_case_data import InputData
    from ..tc_components.test_case_data import InputTaint
    from ..tc_components.test_case_code import TestCaseProgram
    from ..traces import CTrace
    from .tracer import UnicornTracer
    from .speculator_abc import UnicornSpeculator
    from .interpreter import ExtraInterpreter
    from ..target_desc import TargetDesc, UnicornTargetDesc
    from ..sandbox import BaseAddrTuple


# Translation table from the fault names accepted in the configuration (CONF._handled_faults)
# to the Unicorn error codes (the integer `errno` of a UcError) that represent them.
# It is consumed by UnicornModel.__init__ to build the set of faults that are redirected to
# the fault handler instead of terminating the execution.
# NOTE(review): the numbers presumably follow Unicorn's `uc_err` enumeration
# (6/7 = READ/WRITE_UNMAPPED, 10 = INSN_INVALID, 12/13 = WRITE/READ_PROT, 21 = EXCEPTION);
# confirm against the installed Unicorn version before changing them.
_UC_FAULT_MAPPING: Final[Dict[str, List[int]]] = {  # map fault names to Unicorn fault IDs
    "DE": [21],
    "DB": [10],
    "BP": [21],
    "BR": [13],
    "UD": [10],
    "PF": [12, 13],
    "GP": [6, 7],
    "assist": [12, 13],
}


# ==================================================================================================
# Private classes and functions
# ==================================================================================================
class _Dispatcher:
    """
    Event fan-out for the model: every event received from Unicorn is forwarded, in a fixed
    order, to the service objects (taint tracker, tracer, speculator, extra interpreter,
    and coverage collector)
    """
    coverage: InstructionCoverage
    _taint_tracker: UnicornTaintTracker
    _tracer: UnicornTracer
    _speculator: UnicornSpeculator
    _interpreter: ExtraInterpreter

    def __init__(self, taint_tracker: UnicornTaintTracker, speculator: UnicornSpeculator,
                 tracer: UnicornTracer, interpreter: ExtraInterpreter,
                 coverage: InstructionCoverage) -> None:
        self.coverage = coverage
        self._interpreter = interpreter
        self._speculator = speculator
        self._tracer = tracer
        self._taint_tracker = taint_tracker

    def test_case_load_dispatch(self, test_case: TestCaseProgram) -> None:
        """ Notify the services that a new test case was loaded and restart coverage for it """
        self._interpreter.load_test_case(test_case)
        self._tracer.load_test_case(test_case)

        # close the coverage record of the previous test case before opening a new one
        coverage = self.coverage
        coverage.finish_test_case()
        coverage.start_test_case()

    def execution_start_dispatch(self, input_: InputData) -> None:
        """ Bring the services into their initial state before executing with a new input """
        self._tracer.reset(input_)
        self._speculator.reset()
        self._taint_tracker.reset()
        self._interpreter.load_input(input_)

    def instruction_dispatch(self, address: int, size: int, _: UnicornModel,
                             state: ModelExecutionState) -> None:
        """ Forward an executed instruction to every service that observes instructions """

        # Macro placeholders are not real instructions, hence nobody gets to see them
        if not state.current_instruction.is_macro_placeholder:
            # NOTE: the services rely on being called in exactly this order
            self._taint_tracker.track_instruction(state.current_instruction)
            self._tracer.observe_instruction(address, size)
            self._speculator.handle_instruction(address, size)
            self._interpreter.interpret_instruction(address, state)
            self.coverage.add_instruction(state.current_instruction)

    def mem_access_dispatch(self, access: int, address: int, size: int, value: int,
                            state: ModelExecutionState) -> None:
        """ Forward a memory access to every service that observes memory accesses """

        # Accesses made by macro placeholders are ignored, same as the placeholders themselves
        if not state.current_instruction.is_macro_placeholder:
            is_store = access == UC_MEM_WRITE

            # NOTE: the services rely on being called in exactly this order
            self._taint_tracker.track_memory_access(address, size, is_store)
            self._speculator.handle_mem_access(access, address, size, value)
            self._tracer.observe_mem_access(access, address, size, value)
            self._interpreter.interpret_mem_access(access, address, size, value)


def _instruction_hook(_: Uc, address: int, size: int, model: UnicornModel) -> None:
    """
    Dispatch the Unicorn instruction hook to the model.

    Registered by `UnicornModel.load_test_case` for `UC_HOOK_CODE`, with the model itself
    passed as the hook's user data.

    :param _: emulator instance that triggered the hook (unused)
    :param address: address of the instruction
    :param size: size of the instruction
    :param model: the model that receives the event
    :return: None
    """
    model.instruction_callback(address, size)


def _mem_access_hook(_: Uc, access: int, address: int, size: int, value: int,
                     model: UnicornModel) -> None:
    """
    Dispatch the Unicorn memory access hook to the model.

    Registered by `UnicornModel.load_test_case` for `UC_HOOK_MEM_READ | UC_HOOK_MEM_WRITE`,
    with the model itself passed as the hook's user data.

    :param _: emulator instance that triggered the hook (unused)
    :param access: type of the memory access, as reported by Unicorn
    :param address: accessed address
    :param size: size of the access
    :param value: value reported by Unicorn for the access
    :param model: the model that receives the event
    :return: None
    """
    model.mem_access_callback(access, address, size, value)


def _mem_unmapped_hook(_: Uc, access: int, address: int, size: int, value: int,
                       model: UnicornModel) -> None:
    """
    Dispatch the Unicorn memory unmapped hook to the model.

    Registered by `UnicornModel.load_test_case` for `UC_HOOK_MEM_UNMAPPED`; the event is
    forwarded to the same model callback as ordinary memory accesses.

    NOTE(review): the hook returns None; presumably Unicorn interprets a falsy result of an
    invalid-memory hook as "not handled" and raises the fault -- confirm against Unicorn docs.

    :param _: emulator instance that triggered the hook (unused)
    :param access: type of the memory access, as reported by Unicorn
    :param address: accessed address
    :param size: size of the access
    :param value: value reported by Unicorn for the access
    :param model: the model that receives the event
    :return: None
    """
    model.mem_access_callback(access, address, size, value)


# Human-readable descriptions of Unicorn error codes; used by _err_to_str when reporting
# faults. Codes missing from this table are reported as unknown by _err_to_str.
_ERR_DECODE: Final[Dict[int, str]] = {
    uc.UC_ERR_OK: "OK (UC_ERR_OK)",
    uc.UC_ERR_NOMEM: "No memory available or memory not present (UC_ERR_NOMEM)",
    uc.UC_ERR_ARCH: "Invalid/unsupported architecture (UC_ERR_ARCH)",
    uc.UC_ERR_HANDLE: "Invalid handle (UC_ERR_HANDLE)",
    uc.UC_ERR_MODE: "Invalid mode (UC_ERR_MODE)",
    uc.UC_ERR_VERSION: "Different API version between core & binding (UC_ERR_VERSION)",
    uc.UC_ERR_READ_UNMAPPED: "Invalid memory read (UC_ERR_READ_UNMAPPED)",
    uc.UC_ERR_WRITE_UNMAPPED: "Invalid memory write (UC_ERR_WRITE_UNMAPPED)",
    uc.UC_ERR_FETCH_UNMAPPED: "Invalid memory fetch (UC_ERR_FETCH_UNMAPPED)",
    uc.UC_ERR_HOOK: "Invalid hook type (UC_ERR_HOOK)",
    uc.UC_ERR_INSN_INVALID: "Invalid instruction (UC_ERR_INSN_INVALID)",
    uc.UC_ERR_MAP: "Invalid memory mapping (UC_ERR_MAP)",
    uc.UC_ERR_WRITE_PROT: "Write to write-protected memory (UC_ERR_WRITE_PROT)",
    uc.UC_ERR_READ_PROT: "Read from non-readable memory (UC_ERR_READ_PROT)",
    uc.UC_ERR_FETCH_PROT: "Fetch from non-executable memory (UC_ERR_FETCH_PROT)",
    uc.UC_ERR_ARG: "Invalid argument (UC_ERR_ARG)",
    uc.UC_ERR_READ_UNALIGNED: "Read from unaligned memory (UC_ERR_READ_UNALIGNED)",
    uc.UC_ERR_WRITE_UNALIGNED: "Write to unaligned memory (UC_ERR_WRITE_UNALIGNED)",
    uc.UC_ERR_FETCH_UNALIGNED: "Fetch from unaligned memory (UC_ERR_FETCH_UNALIGNED)",
    uc.UC_ERR_RESOURCE: "Insufficient resource (UC_ERR_RESOURCE)",
    uc.UC_ERR_EXCEPTION: "Misc. CPU exception (UC_ERR_EXCEPTION)",
}


def _err_to_str(errno: int) -> str:
    """
    Translate a Unicorn error code into a human-readable message.
    :param errno: the Unicorn error code
    :return: the description from _ERR_DECODE, or a generic message for unlisted codes
    """
    return _ERR_DECODE.get(errno, "Unknown error code")


# ==================================================================================================
# Public Interface: Architecture-independent Model
# ==================================================================================================
class UnicornModel(Model, ABC):
    """
    Basic architecture-independent implementation of a Unicorn-based model.
    This implementation does not support speculative execution; see UnicornSpec for that.
    """

    # pylint: disable=too-many-instance-attributes
    # This is a management class that connects many services together, so having many attributes
    # is a necessary evil

    # Service objects
    emulator: Uc
    tracer: Final[UnicornTracer]
    speculator: Final[UnicornSpeculator]
    _taint_tracker: UnicornTaintTracker
    _log: Final[ModelLogger]
    _dispatcher: Final[_Dispatcher]

    # Model state
    state: ModelExecutionState
    layout: SandboxLayout

    # Descriptors
    _bases: BaseAddrTuple
    _target_desc: Final[TargetDesc]
    _uc_target_desc: Final[UnicornTargetDesc]
    _architecture: Optional[Tuple[int, int]] = None  # (UC_ARCH, UC_MODE)
    _handled_faults: Set[int]  # The set of fault types that do NOT terminate execution

    # ----------------------------------------------------------------------------------------------
    # Constructor and Service Module Initialization
    def __init__(self,
                 bases: BaseAddrTuple,
                 target_desc: TargetDesc,
                 speculator_cls: Type[UnicornSpeculator],
                 tracer_cls: Type[UnicornTracer],
                 interpreter_cls: Type[ExtraInterpreter],
                 enable_mismatch_check_mode: bool = False) -> None:
        """
        Create the emulator and wire together the service modules of the model.
        :param bases: base addresses of the sandbox
        :param target_desc: description of the target architecture
        :param speculator_cls: class of the speculator to instantiate
        :param tracer_cls: class of the tracer to instantiate
        :param interpreter_cls: class of the extra interpreter to instantiate
        :param enable_mismatch_check_mode: if True, register values are recorded
               instead of contract traces
        :raises NotImplementedError: if the configuration requests handling of a fault type
                that has no Unicorn equivalent
        """
        arch = self._architecture
        assert arch is not None, \
            "Subclasses must define the `architecture` attribute before calling super().__init__"

        # Emulator first, then the services; the services receive a reference to the model
        self.emulator = Uc(*arch)
        taint_tracker = UnicornTaintTracker(bases, target_desc)
        self._taint_tracker = taint_tracker
        self.tracer = tracer_cls(target_desc, self, taint_tracker)
        self.speculator = speculator_cls(target_desc, self, taint_tracker)
        interpreter = interpreter_cls(target_desc, self)
        coverage = InstructionCoverage()
        self._dispatcher = _Dispatcher(taint_tracker, self.speculator, self.tracer, interpreter,
                                       coverage)
        self._target_desc = target_desc
        self._uc_target_desc = target_desc.uc_target_desc
        self._log = ModelLogger()

        # Sandbox location and execution mode
        self._bases = bases
        self._enable_mismatch_check_mode = enable_mismatch_check_mode
        self.is_speculative = not self.speculator.is_sequential

        # Translate the configured fault names into the Unicorn error codes to be handled
        self._handled_faults = handled = set()
        for fault_name in CONF._handled_faults:
            if fault_name not in _UC_FAULT_MAPPING:
                raise NotImplementedError(f"Fault type {fault_name} is not supported")
            handled.update(_UC_FAULT_MAPPING[fault_name])

    # ----------------------------------------------------------------------------------------------
    # Default Public Interface
    def load_test_case(self, test_case: TestCaseProgram) -> None:
        """
        Prepare the model for tracing the given test case: build the sandbox layout and
        the execution state, create a fresh emulator, map the code and data regions,
        write the test case binary, and register the Unicorn hooks.
        Has to be called before trace_test_case or trace_test_case_with_taints.
        :param test_case: the test case to load
        :return: None
        :raises UcError: if the emulator cannot be created; errors during memory mapping
                and hook registration are passed to `error` instead
        """
        binary_obj = test_case.get_obj()

        # Per-test-case state of the model and of its services
        layout = SandboxLayout(self._bases, test_case.n_actors())
        self.layout = layout
        self._log.set_model_layout(layout)
        self.state = ModelExecutionState(test_case, layout, self._target_desc)
        self._dispatcher.test_case_load_dispatch(test_case)

        # Every test case runs in a brand-new emulator instance
        assert self._architecture is not None, "_architecture must be set by subclass"
        emulator = Uc(*self._architecture)
        self.emulator = emulator

        # Binary image of the test case; each actor's section is padded to a fixed size
        code_bytes = binary_obj.to_bytes(
            padded_section_size=layout.code_size_per_actor(), padding_byte=b'\x90')

        # Map code and data; only the code is written here, the data comes with the input
        # (see the _load_input method)
        try:
            emulator.mem_map(layout.code_start(), layout.code_size)
            emulator.mem_map(layout.data_start(), layout.data_size)
            emulator.mem_write(layout.code_start(), code_bytes)
        except UcError as e:
            error(f"[UnicornModel:load_test_case] {e}")

        # Register the callbacks; the model itself is the hooks' user data
        hooks = (
            (UC_HOOK_MEM_READ | UC_HOOK_MEM_WRITE, _mem_access_hook),
            (UC_HOOK_MEM_UNMAPPED, _mem_unmapped_hook),
            (UC_HOOK_CODE, _instruction_hook),
        )
        try:
            for hook_type, callback in hooks:
                emulator.hook_add(hook_type, callback, self)
        except UcError as e:
            error(f"[UnicornModel:load_test_case] {e}")

    def trace_test_case(self, inputs: List[InputData], nesting: int) -> List[CTrace]:
        """
        Run the loaded test case once per input, with taint tracking switched off,
        and return the resulting contract traces.
        :param inputs: the inputs to execute the test case with
        :param nesting: upper bound on the number of nested speculation levels to simulate
        :return: the contract traces, one per input
        """
        self._taint_tracker.set_enable_tracking(False)
        self.speculator.set_max_nesting(nesting)
        # the taints produced alongside the traces are of no interest in this mode
        return self._execute_test_case_with_inputs(inputs)[0]

    def trace_test_case_with_taints(self, inputs: List[InputData],
                                    nesting: int) -> Tuple[List[CTrace], List[InputTaint]]:
        """
        Run the loaded test case once per input, with taint tracking switched on,
        and return both the contract traces and the taints.
        :param inputs: the inputs to execute the test case with
        :param nesting: upper bound on the number of nested speculation levels to simulate
        :return: the contract traces and the taints; each list has one element per input
        """
        self._taint_tracker.set_enable_tracking(True)
        self.speculator.set_max_nesting(nesting)
        collected_traces, collected_taints = self._execute_test_case_with_inputs(inputs)
        return collected_traces, collected_taints

    # ----------------------------------------------------------------------------------------------
    # Unicorn-specific Public Interface
    def instruction_callback(self, address: int, size: int) -> None:
        """
        Entry point for Unicorn's per-instruction hook.
        :param address: the address of the instruction
        :param size: the size of the instruction
        :return: None
        """
        state = self.state

        # Reaching the exit instruction ends the emulation; nothing is dispatched for it
        if state.is_exit_addr(address):
            self.emulator.emu_stop()
            return

        # Any other instruction: refresh the execution context and log it ...
        state.update_context(self.emulator, address)
        self._log.dbg_instruction(address, self, state, self.speculator)

        # ... before handing it over to the service modules
        self._dispatcher.instruction_dispatch(address, size, self, state)

    def mem_access_callback(self, access: int, address: int, size: int, value: int) -> None:
        """
        Callback function called when Unicorn accesses memory.
        Passes the access to the debug logger and then to the service modules.

        :param access: type of the memory access (a UC_MEM_* constant), as reported by Unicorn
        :param address: accessed address
        :param size: size of the access
        :param value: value reported by Unicorn for the access
        :return: None
        """
        # `access` is a memory access type (UC_MEM_*), not a hook type (UC_HOOK_*):
        # comparing it with UC_HOOK_MEM_WRITE never matches, so stores would be logged as loads.
        # The check below is the same one used by _Dispatcher.mem_access_dispatch.
        is_store = access == UC_MEM_WRITE
        self._log.dbg_mem_access(is_store, value, address, size, self, self.layout)
        self._dispatcher.mem_access_dispatch(access, address, size, value, self.state)

    def do_soft_fault(self, errno: int) -> None:
        """
        Signal a fault to the model and stop the emulator
        (without raising an exception in the emulator)

        :param errno: code of the fault to record as pending in the model state
        :return: None
        """
        assert self.state, "Function called before load_test_case"
        # the pending fault is examined by _run_state_machine once the emulator has stopped
        self.state.pending_fault = errno
        self.emulator.emu_stop()

    def set_faulty_area_rw(self, actor_id: int, r: bool, w: bool) -> None:
        """
        Change the emulator's access permissions of an actor's faulty data area.
        :param actor_id: ID of the actor owning the area; -1 selects the current actor
        :param r: whether the area is readable; a non-readable area gets no permissions at all
        :param w: whether the area is writable (relevant only if the area is readable)
        :return: None
        """
        target_actor = self.state.current_actor.get_id() if actor_id == -1 else actor_id
        area_base = self.layout.get_data_addr(DataArea.FAULTY, target_actor)
        area_size = self.layout.data_area_size(DataArea.FAULTY)

        if r and w:
            # no explicit permissions: rely on the default of mem_protect
            self.emulator.mem_protect(area_base, area_size)
        elif r:
            self.emulator.mem_protect(area_base, area_size, UC_PROT_READ)
        else:
            self.emulator.mem_protect(area_base, area_size, UC_PROT_NONE)

    def report_coverage(self, path: str) -> None:
        """
        Write the coverage data to a file

        :param path: destination passed on to the coverage collector's `report` method
        :return: None
        """
        # the coverage collector is owned by the dispatcher, which feeds it with instructions
        self._dispatcher.coverage.report(path)

    @abstractmethod
    def print_registers(self, oneline: bool = False) -> None:
        """
        Print the current values of all general-purpose registers

        Architecture-specific; called by _handle_fault before reporting a fatal fault.

        :param oneline: selects the compact output layout instead of the default listing
               (see the x86 implementation for an example of both)
        :return: None
        """

    # ----------------------------------------------------------------------------------------------
    # Private Methods
    def _execute_test_case_with_inputs(
            self, inputs: List[InputData]) -> Tuple[List[CTrace], List[InputTaint]]:
        """
        Run the loaded test case once for every input, in order, and gather the results.
        :param inputs: the inputs to execute the test case with
        :return: the list of traces and the list of taints; one element per input in each
        """
        collected_traces, collected_taints = [], []
        for input_idx, input_ in enumerate(inputs):
            # Start from a clean model state and clean services
            self._log.dbg_header(input_idx)
            self.state.full_reset()
            self._dispatcher.execution_start_dispatch(input_)

            # Run the test case on this input
            self._load_input(input_)
            self._run_state_machine()

            # In mismatch check mode, the trace is replaced with the final register values;
            # in normal mode, the trace recorded by the tracer is stored as is
            if self._enable_mismatch_check_mode:
                checked_regs = self._uc_target_desc.usable_registers[:-2]  # no RSP and EFLAGS
                self.tracer.trace = [
                    CTraceEntry("reg", int(self.emulator.reg_read(reg)))  # type: ignore
                    for reg in checked_regs
                ]
            collected_traces.append(self.tracer.get_trace())

            # The taints are collected in both modes
            actor_count = self.state.current_test_case().n_actors()
            collected_taints.append(self._taint_tracker.get_taint(actor_count))

        return collected_traces, collected_taints

    def _run_state_machine(self) -> None:
        """
        Execute the loaded test case on the model with the loaded input.

        This method implements a state machine that repeatedly executes the test case
        until it reaches the exit instruction while being in a non-speculative state.

        The state machine ensures that:
            - whenever the emulator exits without reaching the exit instruction,
              the model either rolls back (if in speculation) or exits (if not in speculation)
            - whenever a fault is triggered, the model jumps to the corresponding fault handler
              (if not in speculation) or rolls back (if in speculation)
        The complete state machine is shown in:
            `docs/assets/unicorn-model-state-machine.drawio.png`.

        Each loop iteration corresponds to one (re-)start of the emulator at `pc`; `pc` is
        updated by the fault handling and by the speculation rollbacks.

        :return: None
        """
        code_start = self.layout.code_start()
        pc = code_start
        while True:
            self.state.reset_after_em_stop(pc)

            # Handle re-entries after faults and rollbacks
            # (the very first iteration starts at code_start and skips these checks)
            if pc != code_start:
                in_speculation = self.speculator.in_speculation()

                # When entering a new loop iterations, there are the following options:
                # 1. Re-entering after reaching the end and not in speculation
                if self.state.is_exit_addr(pc) and not in_speculation:
                    return

                # 2. Re-entering after reaching the end and in speculation
                if self.state.is_exit_addr(pc) and in_speculation:
                    pc = self.speculator.rollback()
                    self._log.dbg_rollback(pc)
                    continue

                # 3. Re-entering into a fault handler and in speculation
                if pc == self.state.fault_handler_addr and in_speculation:
                    # This case indicates that the rollback was supposed to terminate speculation,
                    # so rollback again
                    pc = self.speculator.rollback()
                    self._log.dbg_rollback(pc)
                    continue
                # 4. In all other cases, continue execution as normal

            # Execute the test case
            # (faults raised by Unicorn are recorded as pending, same as soft faults)
            try:
                self.emulator.emu_start(pc, self.layout.code_end(), timeout=10 * uc.UC_SECOND_SCALE)
            except UcError as e:
                self.state.pending_fault = int(e.errno)  # type: ignore  # missing type annotation

            # Handle faults
            if self.state.pending_fault:
                self._patch_context_after_fault()
                pc = self._handle_fault()
                # a zero address requests a rollback; the exit address falls through to
                # the termination/rollback logic below
                if pc and pc != self.state.exit_addr:
                    continue

            # If the model is in non-speculative state, a fault terminates the execution
            if not self.speculator.in_speculation():
                return

            # Otherwise (in a speculative state), a fault causes a speculation rollback
            pc = self.speculator.rollback()
            self._log.dbg_rollback(pc)
            continue

    def _handle_fault(self) -> int:
        """
        Consume the pending fault and decide how the execution continues.
        :return: the address to resume the execution at,
                 OR zero if the fault has to be resolved by a speculation rollback
        """
        fault_id = self.state.pending_fault
        self._log.dbg_exception(fault_id, _err_to_str(fault_id))

        # the fault is being handled now, so it is no longer pending
        self.state.pending_fault = 0

        # a faulting CPU pushes the PC and the fault type onto the stack;
        # the contract trace has to contain the matching store
        stack_addr = self.layout.get_data_addr(DataArea.RSP_INIT, 0)
        self.tracer.observe_mem_access(UC_MEM_WRITE, stack_addr, 8, fault_id)

        # The fault is resolved by the first matching rule:
        # (a) the speculator implements a speculation mechanism for this fault
        resume_addr = self.speculator.handle_fault(fault_id)
        if resume_addr:
            return resume_addr

        # (b) no such mechanism, and the model is speculating already -> request a rollback
        if self.speculator.in_speculation():
            return 0

        # (c) second architectural fault within the same execution -> report an error
        if self.state.had_arch_fault:
            self.print_registers()
            error(f"Nested fault {fault_id} {_err_to_str(fault_id)}", print_last_tb=True)
        self.state.had_arch_fault = True

        # (d) first architectural fault, of a type that is expected -> go to the handler
        if fault_id in self._handled_faults:
            return self.state.fault_handler_addr

        # (e) first architectural fault, of an unexpected type -> report an error
        self.print_registers()
        error(f"Unexpected exception {fault_id} {_err_to_str(fault_id)}", print_last_tb=True)

    def _patch_context_after_fault(self) -> None:
        """ Repair the emulator state after a fault (workarounds for Unicorn bugs) """
        saved_context = self.state.previous_context
        if not saved_context:
            error("Fault triggered without a previous context")

        # Unicorn bug workaround #1: the emulator gets corrupted after an exception
        # unless a pre-exception context is restored
        self.emulator.context_restore(saved_context)

        # Unicorn bug workaround #2: the flags register has to be re-written with its own value
        flags_reg = self._target_desc.uc_target_desc.reg_norm_to_constant["FLAGS"]
        current_flags = self.emulator.reg_read(flags_reg)
        self.emulator.reg_write(flags_reg, current_flags)

    @abstractmethod
    def _load_input(self, input_: InputData) -> None:
        """
        Load registers and memory with given input: this is architecture specific

        Called by _execute_test_case_with_inputs for every input, right before the test case
        is executed.

        :param input_: the input to load into the emulator
        :return: None
        """


# ==================================================================================================
# Public: x86 implementation of the Unicorn Backend
# ==================================================================================================
class X86UnicornModel(UnicornModel):
    """ Model for x86 architecture """

    def __init__(self,
                 bases: BaseAddrTuple,
                 target_desc: TargetDesc,
                 speculator_cls: Type[UnicornSpeculator],
                 tracer_cls: Type[UnicornTracer],
                 interpreter_cls: Type[ExtraInterpreter],
                 enable_mismatch_check_mode: bool = False) -> None:
        """ Select the x86-64 emulator configuration and initialize the generic model """

        # The architecture has to be known before the base constructor creates the emulator
        self._architecture = (uc.UC_ARCH_X86, uc.UC_MODE_64)
        self._flags_id = x86ucc.UC_X86_REG_EFLAGS

        # Zero-filled buffers, written into the padding areas whenever an input is loaded
        underflow_pad_size = SandboxLayout.data_area_size(DataArea.UNDERFLOW_PAD)
        overflow_pad_size = SandboxLayout.data_area_size(DataArea.OVERFLOW_PAD)
        self.underflow_pad_values = bytes(underflow_pad_size)
        self.overflow_pad_values = bytes(overflow_pad_size)

        super().__init__(bases, target_desc, speculator_cls, tracer_cls, interpreter_cls,
                         enable_mismatch_check_mode)

    def _load_input(self, input_: InputData) -> None:
        """
        Initialize the emulator from an input: the data areas of every actor are filled
        with the corresponding input fragment, and the registers are set from the fragment
        of the main actor (actor 0).

        Note: the flags slot of every fragment's GPR area is patched in place, i.e.,
        the passed input object is modified.

        :param input_: Input object containing the memory and register values for each actor.
        """
        emulator = self.emulator
        layout = self.layout
        gpr_ids = self._uc_target_desc.usable_registers
        flags_mask = np.uint64(0x8D7)  # same value as decimal 2263
        flags_fixed_bits = np.uint64(2)

        def sanitize_flags(raw_flags: np.uint64) -> np.uint64:
            return (raw_flags & flags_mask) | flags_fixed_bits

        def fill_area(area: DataArea, owner_id: int, payload: bytes) -> None:
            emulator.mem_write(layout.get_data_addr(area, owner_id), payload)

        # Memory: every actor has its own set of data areas
        for actor_id in range(self.state.current_test_case().n_actors()):
            fragment = input_[actor_id]

            # padding areas are zeroed
            fill_area(DataArea.OVERFLOW_PAD, actor_id, self.overflow_pad_values)
            fill_area(DataArea.UNDERFLOW_PAD, actor_id, self.underflow_pad_values)

            # sandbox data pages
            fill_area(DataArea.MAIN, actor_id, fragment['main'].tobytes())
            fill_area(DataArea.FAULTY, actor_id, fragment['faulty'].tobytes())

            # GPR area; the executor initializes EFLAGS from this area, hence the flags slot
            # is patched before it is written, to keep the model consistent with the executor
            fragment['gpr'][6] = sanitize_flags(fragment['gpr'][6])
            fill_area(DataArea.GPR, actor_id, fragment['gpr'].tobytes())

            # SIMD area
            fill_area(DataArea.SIMD, actor_id, fragment['simd'].tobytes())

        # Registers: always taken from the main actor
        main_fragment = input_[0]
        for gpr_idx, gpr_value in enumerate(main_fragment['gpr']):
            emulator.reg_write(gpr_ids[gpr_idx], int(gpr_value))

        # Registers with fixed or patched values override the values from the input
        emulator.reg_write(x86ucc.UC_X86_REG_EFLAGS, int(sanitize_flags(main_fragment['gpr'][6])))
        emulator.reg_write(x86ucc.UC_X86_REG_RSP, layout.get_data_addr(DataArea.RSP_INIT, 0))
        emulator.reg_write(x86ucc.UC_X86_REG_RBP, layout.get_data_addr(DataArea.RSP_INIT, 0))
        emulator.reg_write(x86ucc.UC_X86_REG_R14, layout.get_data_addr(DataArea.MAIN, 0))

        # SIMD registers: the input holds four 64-bit words per register, of which only the two
        # lowest are used (Unicorn doesn't properly support YMM, so the upper 128 bits are ignored)
        simd_words = main_fragment['simd']
        n_words = len(simd_words)
        packed_values: List[int] = []
        for first_word in range(0, n_words, 4):
            packed = int(simd_words[first_word])
            if first_word + 1 < n_words:
                packed |= int(simd_words[first_word + 1]) << 64
            packed_values.append(packed)

        for simd_idx, packed in enumerate(packed_values):
            emulator.reg_write(self._uc_target_desc.usable_simd128_registers[simd_idx], packed)

    def print_registers(self, oneline: bool = False) -> None:
        """
        Print the values of RAX, RBX, RCX, RDX, RSI, and RDI; values that are addresses within
        the sandbox data are shown as offsets.
        :param oneline: if False, print one register per line under a header;
               if True, print a compact layout that also includes the flags and XMM0-XMM7
               (colored if CONF.color is set)
        :return: None
        """
        em = self.emulator

        def compressed(val: int) -> str:
            if self.layout.is_data_addr(val):
                return f"base+0x{self.layout.data_addr_to_offset(val):<9x}"
            return f"0x{val:016x}"

        gpr_ids = (
            ("rax", x86ucc.UC_X86_REG_RAX),
            ("rbx", x86ucc.UC_X86_REG_RBX),
            ("rcx", x86ucc.UC_X86_REG_RCX),
            ("rdx", x86ucc.UC_X86_REG_RDX),
            ("rsi", x86ucc.UC_X86_REG_RSI),
            ("rdi", x86ucc.UC_X86_REG_RDI),
        )
        gpr = {name: compressed(em.reg_read(reg_id)) for name, reg_id in gpr_ids}  # type: ignore

        # Default layout: a header followed by one register per line
        if not oneline:
            print("\n\nRegisters:")
            for name, _ in gpr_ids:
                print(f"{name}: {gpr[name]}")
            return

        # Compact layout: several fields per line, each optionally with a colored label
        colored = bool(CONF.color)

        def label(name: str) -> str:
            return f"{BLUE}{name}={COL_RESET}" if colored else f"{name}="

        fields = {name: label(name) + text for name, text in gpr.items()}
        fields["flags"] = f"{label('flags')}0b{em.reg_read(x86ucc.UC_X86_REG_EFLAGS):012b}"

        # the grouping of the fields into lines depends on whether the output is colored
        if colored:
            rows = (("rax", "rbx", "rcx"), ("rdx", "rsi", "rdi"), ("flags",))
        else:
            rows = (("rax", "rbx", "rcx", "rdx"), ("rsi", "rdi", "flags"))
        text = "".join("  " + " ".join(fields[name] for name in row) + "\n" for row in rows)

        # XMM registers are printed in pairs; each of these lines ends with a space
        xmm_ids = (
            x86ucc.UC_X86_REG_XMM0, x86ucc.UC_X86_REG_XMM1,
            x86ucc.UC_X86_REG_XMM2, x86ucc.UC_X86_REG_XMM3,
            x86ucc.UC_X86_REG_XMM4, x86ucc.UC_X86_REG_XMM5,
            x86ucc.UC_X86_REG_XMM6, x86ucc.UC_X86_REG_XMM7,
        )
        for first in range(0, len(xmm_ids), 2):
            pair = []
            for xmm_idx in (first, first + 1):
                xmm_label = label(f"xmm{xmm_idx}")
                pair.append(f"{xmm_label}0x{em.reg_read(xmm_ids[xmm_idx]):032x}")
            text += "  " + " ".join(pair) + " \n"

        print(text)


# ==================================================================================================
# Public: arm64 implementation of the Unicorn Backend
# ==================================================================================================
class ARM64UnicornModel(UnicornModel):
    """ Unicorn-based contract model for the arm64 architecture """

    def __init__(self,
                 bases: BaseAddrTuple,
                 target_desc: TargetDesc,
                 speculator_cls: Type[UnicornSpeculator],
                 tracer_cls: Type[UnicornTracer],
                 interpreter_cls: Type[ExtraInterpreter],
                 enable_mismatch_check_mode: bool = False) -> None:
        # arch-specific settings are assigned before delegating to the parent constructor
        self._architecture = (uc.UC_ARCH_ARM64, uc.UC_MODE_ARM)
        self._flags_id = armucc.UC_ARM64_REG_NZCV

        # zero-filled buffers that are written into the padding areas on every input load
        self.underflow_pad_values = bytes(SandboxLayout.data_area_size(DataArea.UNDERFLOW_PAD))
        self.overflow_pad_values = bytes(SandboxLayout.data_area_size(DataArea.OVERFLOW_PAD))

        super().__init__(bases, target_desc, speculator_cls, tracer_cls, interpreter_cls,
                         enable_mismatch_check_mode)

    def _load_input(self, input_: InputData) -> None:
        """
        Load a test input into the emulator.

        For every actor, the padding areas are zeroed and the main, faulty, GPR and SIMD data
        areas are filled from the actor's input fragment. Afterwards, the registers are
        initialized from the (patched) GPR values of actor 0.

        :param input_: Input object containing the memory and register values for each actor.
        """
        # FIXME: dedup this code with x86

        emulator = self.emulator
        usable_regs = self._uc_target_desc.usable_registers

        def to_nzcv(raw_flags: np.uint64) -> np.uint64:
            # shift the flag bits up by 28 positions (print_registers shifts them back down)
            return (raw_flags << np.uint64(28)) % np.uint64(pow(2, 64) - 1)

        def fill(area: DataArea, owner: int, payload: bytes) -> None:
            emulator.mem_write(self.layout.get_data_addr(area, owner), payload)

        # Populate the memory of each actor
        main_actor_gpr: List[np.uint64]
        for actor_id in range(self.state.current_test_case().n_actors()):
            fragment = input_[actor_id].copy()

            # padding around the data areas is always zero-initialized
            fill(DataArea.OVERFLOW_PAD, actor_id, self.overflow_pad_values)
            fill(DataArea.UNDERFLOW_PAD, actor_id, self.underflow_pad_values)

            # sandbox data pages
            fill(DataArea.MAIN, actor_id, fragment['main'].tobytes())
            fill(DataArea.FAULTY, actor_id, fragment['faulty'].tobytes())

            # GPR area
            # Note: Executor uses the GPR area to initialize the flags, so slot 6 is patched
            #       before it is written to the emulator, to keep the two consistent.
            fragment['gpr'][6] = to_nzcv(fragment['gpr'][6])
            fill(DataArea.GPR, actor_id, fragment['gpr'].tobytes())

            # SIMD area
            fill(DataArea.SIMD, actor_id, fragment['simd'].tobytes())

            # registers are later initialized from the GPR area of the main actor
            if actor_id == 0:
                main_actor_gpr = fragment['gpr']

        # Initialize the general-purpose registers
        for idx, reg_value in enumerate(main_actor_gpr):
            emulator.reg_write(usable_regs[idx], int(reg_value))

        # Registers with dedicated roles get their values last, overriding the generic ones
        target = self._uc_target_desc
        emulator.reg_write(target.flags_register, int(main_actor_gpr[6]))
        emulator.reg_write(target.sp_register, self.layout.get_data_addr(DataArea.RSP_INIT, 0))
        emulator.reg_write(target.actor_base_register,
                           self.layout.get_data_addr(DataArea.MAIN, 0))

    def print_registers(self, oneline: bool = False) -> None:
        """
        Print the values of x0-x5 (and, in the compact form, the flags) to stdout.

        :param oneline: if True, print a compact multi-column listing (colored when CONF.color
                        is set); otherwise print one register per line
        """

        def fmt(reg_value: int) -> str:
            # addresses inside the sandbox data are shown as offsets to keep the output short
            if not self.layout.is_data_addr(reg_value):
                return f"0x{reg_value:016x}"
            return f"base+0x{self.layout.data_addr_to_offset(reg_value):<9x}"

        emulator = self.emulator
        x0, x1, x2, x3, x4, x5 = (
            fmt(emulator.reg_read(reg_id))  # type: ignore
            for reg_id in (
                armucc.UC_ARM64_REG_X0,
                armucc.UC_ARM64_REG_X1,
                armucc.UC_ARM64_REG_X2,
                armucc.UC_ARM64_REG_X3,
                armucc.UC_ARM64_REG_X4,
                armucc.UC_ARM64_REG_X5,
            ))
        nzcv = f"{emulator.reg_read(armucc.UC_ARM64_REG_NZCV) >> 28:04b}"  # type: ignore

        if not oneline:
            print("\n\nRegisters:")
            for reg_name, reg_text in (("x0", x0), ("x1", x1), ("x2", x2), ("x3", x3),
                                       ("x4", x4), ("x5", x5)):
                print(f"{reg_name}: {reg_text}")
            return

        if CONF.color:
            text = (f"  {BLUE}x0={COL_RESET}{x0} "
                    f"{BLUE}x1={COL_RESET}{x1} "
                    f"{BLUE}x2={COL_RESET}{x2}\n"
                    f"  {BLUE}x3={COL_RESET}{x3} "
                    f"{BLUE}x4={COL_RESET}{x4} "
                    f"{BLUE}x5={COL_RESET}{x5}\n"
                    f"  {BLUE}flags={COL_RESET}0b{nzcv}\n")
        else:
            text = (f"  x0={x0} x1={x1} x2={x2} x3={x3}\n"
                    f"  x4={x4} x5={x5} flags=0b{nzcv}\n")
        print(text)


================================================
FILE: rvzr/model_unicorn/speculator_abc.py
================================================
"""
File: Abstract interface to be implemented by all speculators.
      For an implementation of concrete speculators, see speculators_*.py files.

      A speculator is a component that modifies the execution process of a test case when it
      runs on the contract model (e.g., it can emulate misprediction of branches).
      As such, speculators implement execution clauses of different contracts.

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from __future__ import annotations

from abc import ABC
from typing import TYPE_CHECKING, List, Final, Tuple

from unicorn import UC_MEM_WRITE

from ..config import CONF

if TYPE_CHECKING:
    from unicorn import Uc
    from .model import UnicornModel
    from .taint_tracker import UnicornTaintTracker
    from ..target_desc import TargetDesc, UnicornTargetDesc

# Components of a speculation checkpoint, in the order in which
# UnicornSpeculator._checkpoint() packs them and UnicornSpeculator.rollback() unpacks them
_UnicornContext = object  # opaque value returned by Uc.context_save()
_InstrAddress = int  # address at which execution resumes after the rollback
_Flags = int  # value of the flags register at the time of the checkpoint
_SpecWindow = int  # value of the speculation window counter at the time of the checkpoint
_Checkpoint = Tuple[_UnicornContext, _InstrAddress, _Flags, _SpecWindow]

# Entry of a store log: the address of a store and the bytes to write back there on rollback
_MemoryAddress = int
_MemoryValue = bytes
_StoreLogEntry = Tuple[_MemoryAddress, _MemoryValue]


class UnicornSpeculator(ABC):
    """
    Interface definition that must be implemented by all speculators,
    as well as implementation of the functionality shared by all of them
    (checkpointing, rollback, and tracking of the speculation window).

    Subclasses customize the behavior by overriding the `_speculate_*` hooks.
    """

    is_sequential: bool = False
    """ Flag indicating if the speculator does *not* actually implement speculation. """

    # checkpointing
    _checkpoints: List[_Checkpoint]  # stack of checkpoints; one entry per nesting level
    _store_logs: List[List[_StoreLogEntry]]  # one log of overwritten memory per checkpoint

    # speculation control
    _max_nesting: int = 0
    _speculation_window: int = 0
    _max_spec_window: int = 0
    _in_speculation: bool = False

    # connections to other modules
    _emulator: Uc
    _model: Final[UnicornModel]
    _target_desc: Final[TargetDesc]
    _uc_target_desc: Final[UnicornTargetDesc]
    _taint_tracker: UnicornTaintTracker

    def __init__(self, target_desc: TargetDesc, model: UnicornModel,
                 taint_tracker: UnicornTaintTracker) -> None:
        super().__init__()
        self._model = model
        self._taint_tracker = taint_tracker
        self._target_desc = target_desc
        self._uc_target_desc = target_desc.uc_target_desc
        self.reset()

    # ----------------------------------------------------------------------------------------------
    # Public Interface
    def in_speculation(self) -> bool:
        """ Return whether the model is currently in speculation. """
        return self._in_speculation

    def set_max_nesting(self, max_nesting: int) -> None:
        """ Set the maximum nesting level of the model. """
        self._max_nesting = max_nesting

    def nesting(self) -> int:
        """ Return the current nesting level of the model. """
        return len(self._checkpoints)

    def reset(self) -> None:
        """ Reset the speculator to its initial state. """
        self._emulator = self._model.emulator  # refresh the emulator reference
        self._checkpoints = []
        self._store_logs = []
        self._in_speculation = False
        self._speculation_window = 0
        self._max_spec_window = CONF.model_max_spec_window

    def rollback(self) -> int:
        """
        Rollback the model and its service modules to the last checkpoint.
        :return: address of the instruction at which the execution should be resumed
        """
        # restore register values
        state, next_instr, flags, spec_window = self._checkpoints.pop()
        if not self._checkpoints:
            self._in_speculation = False

        # restore the speculation state
        self._emulator.context_restore(state)
        self._speculation_window = spec_window

        # rollback memory changes; the log is replayed newest-first so that overlapping
        # stores are undone in the reverse order of their execution
        mem_changes = self._store_logs.pop()
        while mem_changes:
            addr, val = mem_changes.pop()
            self._emulator.mem_write(addr, val)

        # restore the flags last, to avoid corruption by other operations
        self._emulator.reg_write(self._uc_target_desc.flags_register, flags)

        # restore the taint tracking
        self._taint_tracker.rollback()

        # restart without misprediction
        return next_instr

    def handle_instruction(self, address: int, size: int) -> None:
        """
        Hook function executed by the speculator on every instruction.
        Depending on the speculator (i.e., the subclass), it may implement different speculation
        mechanisms for some instructions (e.g., branch mispredictions).
        :param address: address of the current instruction
        :param size: size of the current instruction
        :return: None
        """

        if self._in_speculation:
            self._speculation_window += 1
            # rollback on a serializing instruction
            if self._model.state.current_instruction.name in self._uc_target_desc.barriers:
                self._emulator.emu_stop()

            # and on expired speculation window
            if self._speculation_window > self._max_spec_window:
                self._emulator.emu_stop()

        self._speculate_instruction(address, size)

    def handle_mem_access(self, access: int, address: int, size: int, value: int) -> None:
        """
        Hook function executed by the speculator on every memory access.
        Depending on the speculator (i.e., the subclass), it may implement different speculation
        mechanisms for some memory accesses (e.g., store-to-load forwarding).
        :param access: type of the memory access (UC_MEM_READ or UC_MEM_WRITE)
        :param address: address of the memory access
        :param size: size of the memory access
        :param value: value of the memory access
        :return: None
        """
        # when in speculation, log all changes to memory
        if access == UC_MEM_WRITE and self._store_logs:
            # Save exactly the bytes that the store is about to overwrite.
            # A fixed-size snapshot would restore wide stores only partially and could read
            # beyond the end of a mapped region for narrow stores next to its boundary.
            prev_value = bytes(self._emulator.mem_read(address, size))
            self._store_logs[-1].append((address, prev_value))

        self._speculate_mem_access(access, address, size, value)

    def handle_fault(self, errno: int) -> int:
        """
        Hook function executed by the speculator on every fault.
        Depending on the speculator (i.e., the subclass), it may implement different speculation
        mechanisms for some faults (e.g., Meltdown).
        :param errno: error number of the fault
        :return: address of the next speculative instruction; 0 if no speculation
        """
        return self._speculate_fault(errno)

    # ----------------------------------------------------------------------------------------------
    # Private Methods
    def _checkpoint(self, next_instruction_addr: int, include_current_inst: bool = True) -> None:
        """
        Store a checkpoint for the current state of the model and its service modules.
        :param next_instruction_addr: address of the next instruction to execute
        :param include_current_inst: if True, include the effects of the current instruction in the
                                     checkpoint (used for taint tracking)
        """
        flags: int = self._emulator.reg_read(self._uc_target_desc.flags_register)  # type: ignore
        context = self._emulator.context_save()
        spec_window = self._speculation_window
        self._checkpoints.append((context, next_instruction_addr, flags, spec_window))
        self._store_logs.append([])  # every checkpoint gets its own store log
        self._in_speculation = True
        self._taint_tracker.checkpoint(include_current_inst=include_current_inst)

    def _max_nesting_reached(self) -> bool:
        """ Check if the maximum nesting level has been reached. """
        return len(self._checkpoints) >= self._max_nesting

    def _speculate_instruction(self, address: int, size: int) -> None:
        """
        Implement speculation upon an instruction. The default implementation does not speculate.
        :param address: address of the current instruction
        :param size: size of the current instruction
        """

    def _speculate_mem_access(self, access: int, address: int, size: int, value: int) -> None:
        """
        Implement speculation upon a memory access. The default implementation does not speculate.
        :param access: type of the memory access (UC_MEM_READ or UC_MEM_WRITE)
        :param address: address of the memory access
        :param size: size of the memory access
        :param value: value of the memory access
        """

    def _speculate_fault(self, _: int) -> int:
        """
        Implement speculation upon a fault. The default implementation does not speculate.
        :param _: ID of the fault (unused by the default implementation)
        :return: the address of the first speculative instruction
                 OR zero if no speculation is triggered
        """
        return 0


================================================
FILE: rvzr/model_unicorn/speculators_basic.py
================================================
"""
File: Collection of simple instruction-based speculators for the Unicorn model.

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from __future__ import annotations
from typing import TYPE_CHECKING, Dict, Tuple, Callable, Final, Optional
from unicorn import UC_MEM_WRITE

import unicorn.x86_const as ucc  # type: ignore # no type hints for this library
import unicorn.arm64_const as aucc  # type: ignore # no type hints for this library

from .speculator_abc import UnicornSpeculator
from ..config import CONF

if TYPE_CHECKING:
    from .model import UnicornModel
    from .taint_tracker import UnicornTaintTracker
    from ..target_desc import TargetDesc

# Single-bit masks used by X86CondSpeculator to test the x86 flags value (bits 0-11)
FLAGS_CF = 0b000000000001
FLAGS_PF = 0b000000000100
FLAGS_AF = 0b000000010000
FLAGS_ZF = 0b000001000000
FLAGS_SF = 0b000010000000
FLAGS_TF = 0b000100000000
FLAGS_IF = 0b001000000000
FLAGS_DF = 0b010000000000
FLAGS_OF = 0b100000000000

# Single-bit masks used by ARM64CondSpeculator to test the arm64 flags value (bits 28-31)
FLAGS_N: Final[int] = 1 << 31
FLAGS_Z: Final[int] = 1 << 30
FLAGS_C: Final[int] = 1 << 29
FLAGS_V: Final[int] = 1 << 28


class SeqSpeculator(UnicornSpeculator):
    """
    Speculator for sequential execution: it overrides none of the speculation hooks,
    hence every instruction is executed without any speculation
    """

    # tell the users of the speculator that no speculation will ever be simulated
    is_sequential: bool = True


# Decoder of one x86 conditional branch opcode, as stored in the X86CondSpeculator tables:
#   (instruction bytes, flags value, RCX value) ->
#   (bytes of the branch displacement, whether the branch is taken, whether it is a LOOP* instr.)
_CondBranchFlipper = Callable[[bytearray, int, int], Tuple[bytearray, bool, bool]]


# ==================================================================================================
# Conditional branch prediction (Spectre v1)
# ==================================================================================================
class X86CondSpeculator(UnicornSpeculator):
    """
    Speculator for conditional branch mispredictions.
    Forces all cond. branches to speculatively go into a wrong target
    """

    # Decoders of the conditional branches with a one-byte opcode (8-bit displacement)
    jumps = {
        # c - the byte code of the instruction
        # f - the value of EFLAGS
        # r - the value of RCX
        0x70:
            lambda c, f, r: (c[1:], f & FLAGS_OF != 0, False),  # JO
        0x71:
            lambda c, f, r: (c[1:], f & FLAGS_OF == 0, False),  # JNO
        0x72:
            lambda c, f, r: (c[1:], f & FLAGS_CF != 0, False),  # JB
        0x73:
            lambda c, f, r: (c[1:], f & FLAGS_CF == 0, False),  # JAE
        0x74:
            lambda c, f, r: (c[1:], f & FLAGS_ZF != 0, False),  # JZ
        0x75:
            lambda c, f, r: (c[1:], f & FLAGS_ZF == 0, False),  # JNZ
        0x76:
            lambda c, f, r: (c[1:], f & FLAGS_CF != 0 or f & FLAGS_ZF != 0, False),  # JNA
        0x77:
            lambda c, f, r: (c[1:], f & FLAGS_CF == 0 and f & FLAGS_ZF == 0, False),  # JNBE
        0x78:
            lambda c, f, r: (c[1:], f & FLAGS_SF != 0, False),  # JS
        0x79:
            lambda c, f, r: (c[1:], f & FLAGS_SF == 0, False),  # JNS
        0x7A:
            lambda c, f, r: (c[1:], f & FLAGS_PF != 0, False),  # JP
        0x7B:
            lambda c, f, r: (c[1:], f & FLAGS_PF == 0, False),  # JPO
        0x7C:
            lambda c, f, r: (c[1:], (f & FLAGS_SF == 0) != (f & FLAGS_OF == 0), False),  # JNGE
        0x7D:
            lambda c, f, r: (c[1:], (f & FLAGS_SF == 0) == (f & FLAGS_OF == 0), False),  # JNL
        0x7E:  # JNG
            lambda c, f, r: (
                c[1:],
                f & FLAGS_ZF != 0 or (f & FLAGS_SF == 0) != (f & FLAGS_OF == 0),
                False,
            ),
        0x7F:  # JNLE
            lambda c, f, r: (
                c[1:],
                f & FLAGS_ZF == 0 and (f & FLAGS_SF == 0) == (f & FLAGS_OF == 0),
                False,
            ),
        0xE0:
            lambda c, f, r: (c[1:], r != 1 and (f & FLAGS_ZF == 0), True),  # LOOPNE
        0xE1:
            lambda c, f, r: (c[1:], r != 1 and (f & FLAGS_ZF != 0), True),  # LOOPE
        0xE2:
            lambda c, f, r: (c[1:], r != 1, True),  # LOOP
        0xE3:
            lambda c, f, r: (c[1:], r == 0, False),  # J*CXZ
        # two-byte opcodes: dispatch on the second byte; anything unknown is "not a branch"
        0x0F:
            lambda c, f, r: X86CondSpeculator.multibyte_jmp.get(
                c[1], lambda _, __, ___: (bytearray(1), False, False))(c, f, r),
    }

    # Decoders of the conditional branches with a two-byte opcode (0x0F prefix);
    # the displacement is everything that follows the two opcode bytes
    multibyte_jmp: Final[Dict[int, _CondBranchFlipper]] = {
        0x80:
            lambda c, f, r: (c[2:], f & FLAGS_OF != 0, False),  # JO
        0x81:
            lambda c, f, r: (c[2:], f & FLAGS_OF == 0, False),  # JNO
        0x82:
            lambda c, f, r: (c[2:], f & FLAGS_CF != 0, False),  # JB
        0x83:
            lambda c, f, r: (c[2:], f & FLAGS_CF == 0, False),  # JAE
        0x84:
            lambda c, f, r: (c[2:], f & FLAGS_ZF != 0, False),  # JE
        0x85:
            lambda c, f, r: (c[2:], f & FLAGS_ZF == 0, False),  # JNE
        0x86:
            lambda c, f, r: (c[2:], f & FLAGS_CF != 0 or f & FLAGS_ZF != 0, False),  # JBE
        0x87:
            lambda c, f, r: (c[2:], f & FLAGS_CF == 0 and f & FLAGS_ZF == 0, False),  # JA
        0x88:
            lambda c, f, r: (c[2:], f & FLAGS_SF != 0, False),  # JS
        0x89:
            lambda c, f, r: (c[2:], f & FLAGS_SF == 0, False),  # JNS
        0x8A:
            lambda c, f, r: (c[2:], f & FLAGS_PF != 0, False),  # JP
        0x8B:
            lambda c, f, r: (c[2:], f & FLAGS_PF == 0, False),  # JPO
        0x8C:
            lambda c, f, r: (c[2:], (f & FLAGS_SF == 0) != (f & FLAGS_OF == 0), False),  # JNGE
        0x8D:
            lambda c, f, r: (c[2:], (f & FLAGS_SF == 0) == (f & FLAGS_OF == 0), False),  # JNL
        0x8E:  # JNG
            lambda c, f, r: (
                c[2:],
                f & FLAGS_ZF != 0 or (f & FLAGS_SF == 0) != (f & FLAGS_OF == 0),
                False,
            ),
        0x8F:  # JNLE
            lambda c, f, r: (
                c[2:],
                f & FLAGS_ZF == 0 and (f & FLAGS_SF == 0) == (f & FLAGS_OF == 0),
                False,
            ),
    }

    def __init__(self, target_desc: TargetDesc, model: UnicornModel,
                 taint_tracker: UnicornTaintTracker) -> None:
        super().__init__(target_desc, model, taint_tracker)
        assert CONF.instruction_set == "x86-64"

    def _speculate_instruction(self, address: int, size: int) -> None:
        """
        If the current instruction is a conditional branch, take a checkpoint that resumes at
        the architecturally correct target and redirect the execution into the opposite one.
        :param address: address of the current instruction
        :param size: size of the current instruction
        """
        if self._max_nesting_reached():  # reached max nesting level? skip
            return

        # if the instruction is undefined, Unicorn will return a huge value as size
        # skip those
        if size > 15:  # 15 bytes is max instr size on Intel
            return

        # decode the instruction
        code: bytearray = self._emulator.mem_read(address, size)
        flags: int = self._emulator.reg_read(self._uc_target_desc.flags_register)  # type: ignore
        rcx: int = self._emulator.reg_read(ucc.UC_X86_REG_RCX)  # type: ignore
        target, will_jump, is_loop = self.decode(code, flags, rcx)

        # not a cond. jump? ignore
        # (a zero displacement is also the value reported for non-branch instructions)
        if not target:
            return

        # LOOP instructions must also decrement RCX
        if is_loop:
            self._emulator.reg_write(ucc.UC_X86_REG_RCX, rcx - 1)

        # Take a checkpoint
        next_instr = address + size + target if will_jump else address + size
        self._checkpoint(next_instr)

        # Simulate misprediction
        if will_jump:
            self._emulator.reg_write(ucc.UC_X86_REG_RIP, address + size)
        else:
            self._emulator.reg_write(ucc.UC_X86_REG_RIP, address + size + target)

    def decode(self, code: bytearray, flags: int, rcx: int) -> Tuple[int, bool, bool]:
        """
        Decodes the instruction encoded in `code` and, if it's a conditional jump,
        returns its expected target, whether it will jump to the target (based
        on the `flags` value), and whether it is a LOOP instruction

        :param code: bytes of the instruction
        :param flags: current value of the flags register
        :param rcx: current value of RCX (used by LOOP* and J*CXZ)
        :return: tuple of (signed displacement of the branch target relative to the end of the
                 instruction, whether the branch is taken, whether it is a LOOP* instruction);
                 (0, False, False) if the instruction is not a conditional branch
        """
        calculate_target = self.jumps.get(code[0])
        if calculate_target is None:
            return 0, False, False

        target, will_jump, is_loop = calculate_target(code, flags, rcx)  # type: ignore
        # Displacements of all sizes are signed; in particular, the 8-bit ones
        # must be sign-extended to get the correct target of backward branches
        return int.from_bytes(target, byteorder='little', signed=True), will_jump, is_loop


class ARM64CondSpeculator(UnicornSpeculator):
    """
    Speculator for conditional branch mispredictions on ARM64.
    Forces all cond. branches to speculatively go into a wrong target
    """

    # all A64 instructions are encoded in exactly four bytes
    _A64_INSTR_SIZE = 4

    def __init__(self, target_desc: TargetDesc, model: UnicornModel,
                 taint_tracker: UnicornTaintTracker) -> None:
        super().__init__(target_desc, model, taint_tracker)
        assert CONF.instruction_set == "arm64"

    def _speculate_instruction(self, address: int, size: int) -> None:
        """
        If the current instruction is a conditional branch, take a checkpoint that resumes at
        the architecturally correct target and redirect the execution into the opposite one.
        :param address: address of the current instruction
        :param size: size of the current instruction
        """
        if self._max_nesting_reached():  # reached max nesting level? skip
            return

        # anything that is not four bytes long cannot be a valid A64 instruction
        # (same guard as the size check that the x86 speculator applies to undefined instructions)
        if size != self._A64_INSTR_SIZE:
            return

        # decode the instruction
        code: bytearray = self._emulator.mem_read(address, size)
        flags: int = self._emulator.reg_read(self._uc_target_desc.flags_register)  # type: ignore
        target_offset, will_jump = self.decode(code, flags)

        # not a cond. jump? ignore
        # (a zero offset is also the value reported for non-branch instructions)
        if not target_offset:
            return

        # The encoded offset counts instructions and is relative to the address of the branch
        # itself, hence the branch target is `address + offset * 4`
        fallthrough_addr = address + size
        branch_addr = address + target_offset * self._A64_INSTR_SIZE

        # Take a checkpoint
        next_instr = branch_addr if will_jump else fallthrough_addr
        self._checkpoint(next_instr)

        # Simulate misprediction
        target_addr = fallthrough_addr if will_jump else branch_addr
        self._emulator.reg_write(self._uc_target_desc.pc_register, target_addr)

    def decode(self, code: bytearray, flags: int) -> Tuple[int, bool]:
        """
        Decodes the instruction encoded in `code` and, if it's a conditional jump,
        returns its expected target and whether it will jump to the target (based
        on the `flags` value).

        :param code: bytes of the instruction (little-endian)
        :param flags: current value of the flags register
        :return: tuple of (signed branch offset as encoded in the instruction, i.e., counted
                 in instructions; whether the branch is taken);
                 (0, False) if the instruction is not a conditional branch
        """
        instruction = int.from_bytes(code, byteorder='little')
        first_byte = instruction >> 24
        if first_byte == 0x54 and instruction & 0x10 == 0:
            # B.cond instruction
            return self._decode_b_cond(instruction, flags)

        if 0xb4 <= first_byte <= 0xb7 or 0x34 <= first_byte <= 0x37:
            # CBZ/CBNZ/TBZ/TBNZ
            return self._decode_cb_tb(instruction, first_byte)
        return (0, False)

    def _decode_b_cond(self, instruction: int, flags: int) -> Tuple[int, bool]:
        """
        Decode a B.cond instruction.
        :param instruction: the instruction word
        :param flags: current value of the flags register
        :return: tuple of (signed 19-bit offset, whether the condition holds)
        """
        target = self._twos_complement(instruction >> 5, 19)
        condition = instruction & 0xf
        n = (flags & FLAGS_N) != 0
        z = (flags & FLAGS_Z) != 0
        c = (flags & FLAGS_C) != 0
        v = (flags & FLAGS_V) != 0
        # table here is useful:
        # https://community.arm.com/arm-community-blogs/b/
        # architectures-and-processors-blog/posts/condition-codes-1-condition-flags-and-codes
        will_jump = [
            z,  # 0 = b.eq "equal"
            not z,  # 1 = b.ne "not equal"
            c,  # 2 = b.cs "carry set"
            not c,  # 3 = b.cc "carry clear"
            n,  # 4 = b.mi "minus"
            not n,  # 5 = b.pl "plus"
            v,  # 6 = b.vs "overflow set"
            not v,  # 7 = b.vc "overflow clear"
            c and not z,  # 8 = b.hi "higher than"
            not c or z,  # 9 = b.ls "lower or same"
            n == v,  # a = b.ge "greater than or equal"
            n != v,  # b = b.lt "less than"
            not z and n == v,  # c = b.gt "greater than"
            z or n != v,  # d = b.le "less than or equal"
            True,  # e = b.al "always"
            True,  # f = b.nv; despite the name, in A64 it behaves identically to b.al
        ][condition]
        return (target, will_jump)

    def _decode_cb_tb(self, instruction: int, first_byte: int) -> Tuple[int, bool]:
        """
        Decode a CBZ/CBNZ/TBZ/TBNZ instruction.
        :param instruction: the instruction word
        :param first_byte: the most significant byte of the instruction word
        :return: tuple of (signed offset - 19 bits for CB*, 14 bits for TB*;
                 whether the branch is taken given the current value of the tested register)
        """
        register_index = instruction & 0x1f  # always within 0..31
        is_32bit = first_byte >> 4 == 0x3

        register_value: int
        if register_index == 31:
            # xzr "zero register"
            register_value = 0
        else:
            # for some reason UC_ARM64_REG_X29 != UC_ARM64_REG_X0 + 29
            uc_reg_id = \
                (aucc.UC_ARM64_REG_X0 + register_index) if register_index <= 28 else \
                (aucc.UC_ARM64_REG_X29 + (register_index - 29))

            register_value = self._emulator.reg_read(uc_reg_id)  # type: ignore

        if is_32bit:
            register_value &= 0xffff_ffff
        if first_byte & 0xf <= 0x5:
            # CBZ/CBNZ
            target = self._twos_complement(instruction >> 5, 19)
            if first_byte & 0xf == 4:
                # CBZ
                will_jump = register_value == 0
            else:
                # CBNZ
                will_jump = register_value != 0
        else:
            # TBZ/TBNZ
            target = self._twos_complement(instruction >> 5, 14)
            # the index of the tested bit is split between bits 19-23 and bit 31 of the encoding;
            # bit 31 is exactly what distinguishes the `0x3?` encodings from the `0xb?` ones
            bit_number = (instruction >> 19) & 0x1f
            if not is_32bit:
                bit_number += 32
            bit = register_value & (1 << bit_number)
            if first_byte & 0xf == 6:
                # TBZ
                will_jump = bit == 0
            else:
                # TBNZ
                will_jump = bit != 0
        return (target, will_jump)

    @staticmethod
    def _twos_complement(n: int, n_bits: int) -> int:
        """ Interpret the lowest `n_bits` bits of `n` as a signed two's complement number """
        n &= (1 << n_bits) - 1
        sign_bit = 1 << (n_bits - 1)
        if n & sign_bit:
            return n - 2 * sign_bit
        return n


# ==================================================================================================
# Speculative Store Bypass (Spectre v4)
# ==================================================================================================
class StoreBpasSpeculator(UnicornSpeculator):
    """
    Speculator for speculative store bypasses.
    Speculatively skips memory store if it is followed by a load from the same address.
    """

    # The store executed by the previous instruction, if any:
    # (address, size, bytes that were in memory before the store, stored value)
    _previous_store: Optional[Tuple[int, int, bytearray, int]] = None

    def rollback(self) -> int:
        # if there are any pending speculative store bypasses, cancel them
        self._previous_store = None
        return super().rollback()

    def reset(self) -> None:
        self._previous_store = None
        super().reset()

    def _speculate_mem_access(self, access: int, address: int, size: int, value: int) -> None:
        """
        Record the store performed by the current instruction, so that it can be bypassed
        before the next instruction starts.
        :param access: type of the memory access (UC_MEM_READ or UC_MEM_WRITE)
        :param address: address of the memory access
        :param size: size of the memory access
        :param value: value of the memory access
        :raises NotImplementedError: if the instruction performs several different stores
        """
        # Since Unicorn does not have post-instruction hooks,
        # we have to implement it in a dirty way:
        # Save the information about the store here, but execute all the
        # contract logic in a hook before the next instruction (see _speculate_instruction)
        if access != UC_MEM_WRITE:
            return

        # check for duplicate calls
        if self._previous_store is not None:
            prev_addr, prev_size, _, prev_value = self._previous_store
            end_addr = address + size
            if address < prev_addr or end_addr > prev_addr + prev_size:
                raise NotImplementedError("Instructions with multiple stores are not supported")

            # The access is within the recorded store; it is a duplicate only if it writes
            # the same bytes. The whole overlapping range is compared (as unsigned values),
            # not just its first byte, so that multi-byte duplicates are recognized as well
            prev_bytes = prev_value.to_bytes(prev_size, byteorder='little', signed=prev_value < 0)
            overlap = prev_bytes[address - prev_addr:end_addr - prev_addr]
            new_unsigned = value & ((1 << (8 * size)) - 1)
            if int.from_bytes(overlap, byteorder='little') == new_unsigned:
                return
            raise NotImplementedError("Self-overwriting instructions are not supported")

        # it's not a duplicate - initiate speculation
        old_val: bytearray = self._emulator.mem_read(address, size)
        self._previous_store = (address, size, old_val, value)

    def _speculate_instruction(self, address: int, _: int) -> None:
        """
        If the previous instruction performed a store, take a checkpoint and undo the store,
        thus letting the following instructions speculatively observe the old memory value.
        :param address: address of the current instruction
        :param _: size of the current instruction (unused)
        """
        if self._max_nesting_reached():  # reached max nesting level? skip
            self._previous_store = None  # clear pending speculation requests
            return

        if self._previous_store is not None:
            store_addr, store_size, old_bytes, stored = self._previous_store
            old_value = bytes(old_bytes)
            new_value = stored.to_bytes(store_size, byteorder='little', signed=stored < 0)

            # store a checkpoint (do not include the effects of the current instruction as the
            # speculation was actually triggered by the previous instruction)
            self._checkpoint(address, include_current_inst=False)

            # cancel the previous store but preserve its value:
            # the rollback replays the store log and thus re-applies the store
            self._emulator.mem_write(store_addr, old_value)
            self._store_logs[-1].append((store_addr, new_value))
        self._previous_store = None


class X86CondBpasSpeculator(X86CondSpeculator, StoreBpasSpeculator):
    """
    Speculator that combines conditional branch mispredictions and speculative store bypass.
    """

    # Note: the parent implementations are invoked explicitly. `super(Parent, self)` would
    # start the method lookup *after* `Parent` in the MRO and would thus skip the very
    # implementation that is supposed to be executed.

    def _speculate_mem_access(self, access: int, address: int, size: int, value: int) -> None:
        # only the store bypass is interested in memory accesses
        StoreBpasSpeculator._speculate_mem_access(self, access, address, size, value)

    def _speculate_instruction(self, address: int, size: int) -> None:
        # A pending store bypass was triggered by the previous instruction, so it is handled
        # first; a misprediction of the current instruction (if any) is then nested inside it
        StoreBpasSpeculator._speculate_instruction(self, address, size)
        X86CondSpeculator._speculate_instruction(self, address, size)


================================================
FILE: rvzr/model_unicorn/speculators_fault.py
================================================
"""
File: Collection of fault-based (i.e., Meltdown type) speculators for the Unicorn backend.

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""

from __future__ import annotations

from abc import ABC, abstractmethod
from typing import TYPE_CHECKING, Set, Tuple, List
from copy import copy
import re

from unicorn import UC_MEM_WRITE
import unicorn.x86_const as ucc  # type: ignore # no type hints for this library

from .speculator_abc import UnicornSpeculator
from ..tc_components.instruction import Instruction, RegisterOp, FlagsOp, MemoryOp, ImmediateOp

if TYPE_CHECKING:
    from ..target_desc import TargetDesc
    from .model import UnicornModel
    from .taint_tracker import UnicornTaintTracker
    from ..tc_components.actor import ActorID


# ==================================================================================================
# Base class for all fault-based speculators
# ==================================================================================================
class FaultSpeculator(UnicornSpeculator, ABC):
    """
    Shared foundation for every fault-based speculator.
    It is responsible for:
    - deciding whether a given fault should open a speculation window
    - exposing the address that execution continues from when speculation is rolled back
    - remembering the address of the current instruction,
      which subclasses use to decide where speculation starts
    """

    _errno_that_trigger_speculation: Set[int]  # filled in by each subclass
    _curr_instruction_addr: int = 0

    def _fault_triggers_speculation(self, errno: int) -> bool:
        """Return True if `errno` is a speculation-triggering fault and nesting is not exhausted"""
        # only the subclass-selected subset of faults is relevant;
        # the nesting limit is consulted only for those faults
        is_relevant_fault = errno in self._errno_that_trigger_speculation
        return is_relevant_fault and not self._max_nesting_reached()

    def _get_rollback_address(self) -> int:
        """Return the address to continue from after rollback (the fault handler by default)"""
        state = self._model.state
        return state.fault_handler_addr

    def _speculate_instruction(self, address: int, size: int) -> None:
        """Remember `address` as the address of the current instruction"""
        self._curr_instruction_addr = address

    def _restore_faulty_page_permissions(self, actor_id: ActorID) -> None:
        """Re-apply the permissions recorded for `actor_id` in the model state"""
        recorded = self._model.state.page_permissions
        assert recorded is not None, "Page permissions were not initialized"
        actor_permissions = recorded[actor_id]
        self._model.set_faulty_area_rw(actor_id, actor_permissions[0], actor_permissions[1])


# ==================================================================================================
# Microcode assists
# ==================================================================================================
class SequentialAssistSpeculator(FaultSpeculator):
    """Speculator modelling memory-based microcode assists that are handled sequentially"""

    def __init__(
        self,
        target_desc: TargetDesc,
        model: UnicornModel,
        taint_tracker: UnicornTaintTracker,
    ) -> None:
        super().__init__(target_desc, model, taint_tracker)
        self._errno_that_trigger_speculation = {12, 13}

    def _speculate_fault(self, errno: int) -> int:
        """
        Handle a fault without opening a speculation window.
        Returns the address of the faulting instruction so it is executed again,
        or 0 if the fault is not handled by this speculator.
        """
        if self._fault_triggers_speculation(errno):
            # no checkpoint is taken - the access is simply permitted and the instruction retried
            actor_id = self._model.state.current_actor.get_id()
            self._model.set_faulty_area_rw(actor_id, True, True)
            return self._curr_instruction_addr
        return 0


# ==================================================================================================
# Simple Out-of-Order Exception Handling
# ==================================================================================================
class UnicornDEH(FaultSpeculator, ABC):
    """
    Common implementation of delayed exception handling (DEH) speculators.
    Models delayed handling in out-of-order CPUs, where instructions that are not
    data-dependent on a faulting instruction may be executed before the fault is handled.

    Example:
        mov rax, [faulty_addr]  ; load from faulty address (may fault)
        mov rbx, [non-faulty_addr] ; independent load (may be executed before the fault is handled)
        mov [some_addr], rax    ; store the loaded value (should be skipped if the load faults)
    """

    _dependencies: Set[str]
    _dependency_checkpoints: List[Set[str]]
    _next_instruction_addr: int = 0

    def __init__(self, target_desc: TargetDesc, model: UnicornModel,
                 taint_tracker: UnicornTaintTracker) -> None:
        super().__init__(target_desc, model, taint_tracker)
        self._dependencies = set()
        self._dependency_checkpoints = []
        self._errno_that_trigger_speculation = {6, 10, 12, 13, 21}

    def _checkpoint(self, next_instruction_addr: int, include_current_inst: bool = True) -> None:
        """Snapshot the dependency set alongside the regular checkpoint"""
        snapshot = set(self._dependencies)
        self._dependency_checkpoints.append(snapshot)
        return super()._checkpoint(next_instruction_addr, include_current_inst=include_current_inst)

    def rollback(self) -> int:
        """Restore the dependency set saved by the matching `_checkpoint` call, then roll back"""
        self._dependencies = self._dependency_checkpoints.pop()
        return super().rollback()

    def _speculate_fault(self, errno: int) -> int:
        """
        Start speculation past a faulting instruction.
        Returns the address of the next instruction, or 0 if no speculation takes place.
        """
        if not self._fault_triggers_speculation(errno):
            return 0

        # the rollback address is the end of the test case, because faults terminate execution
        self._checkpoint(self._get_rollback_address())

        # everything the faulting instruction would have written becomes a dependency
        normalize = self._target_desc.reg_normalized
        for dest_op in self._model.state.current_instruction.get_dest_operands(True):
            if isinstance(dest_op, RegisterOp):
                self._dependencies.add(normalize[dest_op.value])
            elif isinstance(dest_op, FlagsOp):
                self._dependencies.update(dest_op.get_flags_by_type("write"))

        # nothing to speculate on if the faulting instruction is the last one
        if self._model.state.is_exit_addr(self._next_instruction_addr):
            return 0

        # speculatively skip the faulting instruction
        self._arm64_emulate_fault_with_post_increment()
        return self._next_instruction_addr

    def _speculate_instruction(self, address: int, size: int) -> None:
        """
        Track instruction dependencies and skip the instructions that depend
        on a faulting instruction
        """
        # pylint: disable=too-many-branches
        # FIXME: refactor this method to reduce complexity;
        # for now, it's left as is, because this contract is not a priority
        super()._speculate_instruction(address, size)

        # the reported size may be wrong for invalid instructions -> trust the instruction object
        instruction = self._model.state.current_instruction
        decoded_size = instruction.size()
        if decoded_size not in (0, size):
            size = decoded_size
        self._next_instruction_addr = address + size

        # dependencies matter only inside a fault-triggered speculation window
        if not self._in_speculation or not self._dependencies:
            return

        # collect the registers/flags read, written, and used for addressing
        normalize = self._target_desc.reg_normalized
        sources: List[str] = []
        destinations: List[str] = []
        address_parts: List[str] = []
        for operand in instruction.get_all_operands():
            if isinstance(operand, RegisterOp):
                if operand.src:
                    sources.append(normalize[operand.value])
                if operand.dest:
                    destinations.append(normalize[operand.value])
            elif isinstance(operand, MemoryOp):
                for token in re.split(r"\+|-|\*| ", operand.value):
                    if token and token in normalize:
                        reg_name = normalize[token]
                        sources.append(reg_name)
                        address_parts.append(reg_name)
            elif isinstance(operand, FlagsOp):
                sources.extend(operand.get_flags_by_type("read"))
                destinations.extend(operand.get_flags_by_type("write"))

        # evaluated before the dependency set is modified below
        is_dependent = any(reg in self._dependencies for reg in sources)
        is_dependent_addr = any(reg in self._dependencies for reg in address_parts)

        # values that are overwritten without being read stop being dependencies
        old_dependencies = list(self._dependencies)  # snapshot taken before the removal
        for reg in destinations:
            if reg not in sources:
                self._dependencies.discard(reg)

        if not is_dependent:
            return

        # a dependent instruction propagates the dependency to all its destinations
        self._dependencies.update(destinations)

        # Corner cases
        self._handle_isa_specific_corner_cases(instruction, old_dependencies, destinations)

        # special case - many memory operations are implemented as two uops,
        # and one of them could be executed even if the other is data-dependent;
        # we approximate it by simply not skipping the dependent stores
        if instruction.has_mem_operand(True) and not is_dependent_addr:
            return

        # this instruction is dependent on a faulting instruction -> skip it
        # NOTE(review): the x86 RIP constant is used here although ARMUnicornDEH inherits
        # this method - confirm that this is correct for the ARM64 backend
        self._emulator.reg_write(ucc.UC_X86_REG_RIP, address + size)

    @abstractmethod
    def _handle_isa_specific_corner_cases(self, instruction: Instruction,
                                          old_dependencies: List[str],
                                          reg_dest_operands: List[str]) -> None:
        """Handle ISA-specific corner cases in dependency tracking"""

    def _arm64_emulate_fault_with_post_increment(self) -> None:
        """ Workaround for ARM64 post-incrementing loads/stores that trigger a page fault"""


class X86UnicornDEH(UnicornDEH):
    """
    Delayed exception handling (DEH) for x86-64.
    Adds the x86-specific corner cases on top of the base DEH dependency tracking:
    - cmpxchg does not always taint RAX
    - exchange instruction swaps dependencies
    - XADD overrides the src taint with the dest taint
    - zeroing and reset patterns (e.g., xor rax, rax)
    """

    def _handle_isa_specific_corner_cases(self, instruction: Instruction,
                                          old_dependencies: List[str],
                                          reg_dest_operands: List[str]) -> None:
        """
        Adjust the dependency set for instructions that do not follow the generic
        "dependent source taints every destination" rule.
        `old_dependencies` is the dependency set as it was before the current instruction.
        """
        # pylint: disable=too-many-branches
        normalize = self._target_desc.reg_normalized
        deps = self._dependencies
        name = instruction.name

        # special case 1 - cmpxchg does not always taint RAX
        # (checked first, because "xchg" is a substring of "cmpxchg")
        if "cmpxchg" in name:
            dest = instruction.operands[0]
            dest_untainted = (isinstance(dest, MemoryOp)
                              or normalize[dest.value] not in old_dependencies)
            if dest_untainted:
                deps.remove(normalize["rax"])
                flags = instruction.get_flags_operand()
                assert flags
                for written_flag in flags.get_flags_by_type("write"):
                    deps.remove(written_flag)
            return

        # special case 2 - exchange instruction swaps dependencies
        if "xchg" in name:
            assert len(instruction.operands) == 2
            first, second = instruction.operands
            if not isinstance(first, RegisterOp):
                # memory is never tainted -> override the src dependency
                second_reg = normalize[second.value]
                if second_reg in old_dependencies:
                    deps.remove(second_reg)
                return

            # register-register form: the taint moves together with the value
            first_reg = normalize[first.value]
            second_reg = normalize[second.value]
            first_was_dep = first_reg in old_dependencies
            second_was_dep = second_reg in old_dependencies
            if first_was_dep and not second_was_dep:
                deps.remove(first_reg)
            elif second_was_dep and not first_was_dep:
                deps.remove(second_reg)
            return

        # special case 3 - XADD overrides the src taint with the dest taint
        if "xadd" in name:
            assert len(instruction.operands) == 2
            first, second = instruction.operands
            dest_untainted = (isinstance(first, MemoryOp)
                              or normalize[first.value] not in old_dependencies)
            if dest_untainted:
                deps.remove(normalize[second.value])
            return

        # special case 4 - zeroing and reset patterns
        reset_candidates = ("sub", "lock sub", "sbb", "lock sbb", "xor", "lock xor", "cmp")
        if name in reset_candidates:
            assert len(instruction.operands) == 2
            first, second = instruction.operands
            if first.value == second.value:
                # identical operands -> the result no longer depends on the old value
                for reg in reg_dest_operands:
                    deps.remove(reg)
            return


class ARMUnicornDEH(UnicornDEH):
    """
    Delayed exception handling (DEH) for ARM64.
    No ARM64-specific dependency-tracking corner cases are known at the moment.
    """

    def _handle_isa_specific_corner_cases(self, instruction: Instruction,
                                          old_dependencies: List[str],
                                          reg_dest_operands: List[str]) -> None:
        """No known corner cases for ARM yet -> intentionally does nothing"""

    def _arm64_emulate_fault_with_post_increment(self) -> None:
        """
        Workaround for ARM64 handling of faults:
        when a post-incrementing load/store triggers a page fault,
        the address register is still incremented by the immediate value.

        E.g., if the instruction is `ldr x0, [x1], #8` and it faults,
        x1 is still speculatively incremented by 8, even though the load did not complete.
        """
        instr = self._model.state.current_instruction
        mnemonic = instr.name
        if not ("ldr" in mnemonic or "str" in mnemonic):
            return  # instruction cannot have post-increment

        # a post-incrementing access ends with an immediate operand
        operands = instr.get_all_operands()
        increment_op = operands[-1]
        if not isinstance(increment_op, ImmediateOp):
            return

        # the operand right before the immediate holds the address register
        mem_addr_op = operands[-2]
        assert isinstance(mem_addr_op, MemoryOp)
        addr_reg = mem_addr_op.get_base_register()
        if addr_reg is None:
            return

        # parse the immediate, tolerating an optional leading '#'
        increment_text = increment_op.value
        if increment_text.startswith("#"):
            increment_text = increment_text[1:]
        increment = int(increment_text)

        # apply the increment to the address register
        uc_reg = self._target_desc.uc_target_desc.reg_str_to_constant[addr_reg.value]
        curr_value = int(self._emulator.reg_read(uc_reg))  # type: ignore
        self._emulator.reg_write(uc_reg, curr_value + increment)


# ==================================================================================================
# Value-injection Speculation
# ==================================================================================================
class X86UnicornNull(FaultSpeculator):
    """
    Contract describing zero injection on faults.

    Algorithm:
    - On a faulting load:
        * store the checkpoint
        * log the bytes at the load address and overwrite them with zeros
        * change the permissions on the faulting page to RW
        * re-execute the instruction
    - On the instruction following the re-executed one:
        * restore the original permissions on the faulting page
    - On rollback:
        * make the faulting page RW (so that a subclass that rolls back to the faulting
          instruction can execute it without a fault)
        * rollback the memory and register values
        * jump to the rollback address
    """

    # (address, size) of the load performed by the current instruction; (0, 0) means "no load"
    _curr_load: Tuple[int, int] = (0, 0)
    # set by _speculate_fault; consumed by the next _speculate_instruction call
    _pending_re_execution: bool = False
    # set when the faulting instruction is re-executed; consumed one instruction later
    _pending_restore_permissions: bool = False

    def __init__(self, target_desc: TargetDesc, model: UnicornModel,
                 taint_tracker: UnicornTaintTracker) -> None:
        super().__init__(target_desc, model, taint_tracker)
        self._errno_that_trigger_speculation = {12, 13}

    def reset(self) -> None:
        """
        Reset the speculator and reject test cases that contain REP instructions.

        Raises:
            ValueError: if any instruction of the current test case has "rep" in its name
        """
        if not getattr(self._model, "state", None):
            super().reset()
            return

        # This contract handles REP instructions incorrectly (it's a known bug)
        # Explicitly fail if a REP instruction is detected
        for bb in self._model.state.current_test_case().iter_basic_blocks():
            for instr in bb:
                if "rep" in instr.name:
                    raise ValueError(
                        "REP instructions are not supported by this contract\n"
                        "Exclude all REP instructions from the instruction set, or change contract")
        super().reset()

    def rollback(self) -> int:
        """Make the faulty area RW for the current actor, then perform the regular rollback"""
        actor_id = self._model.state.current_actor.get_id()
        self._model.set_faulty_area_rw(actor_id, True, True)
        return super().rollback()

    def _speculate_mem_access(self, access: int, address: int, size: int, value: int) -> None:
        """Remember the address and size of a load in case the instruction faults"""
        # (this method is called before _speculate_fault)

        if access == UC_MEM_WRITE:
            return
        # save load address in case this instruction may fault
        self._curr_load = (address, size)

    def _speculate_fault(self, errno: int) -> int:
        """
        Inject zeros into the faulting load and schedule re-execution of the instruction.
        Returns the address of the faulting instruction, or 0 if no speculation takes place.
        """
        # (this method is called after _speculate_mem_access)

        # check if the fault should trigger speculation
        if not self._fault_triggers_speculation(errno):
            return 0

        # store a checkpoint
        self._checkpoint(self._get_rollback_address())

        # inject zero in the load
        address, size = self._curr_load
        if address != 0:
            # log exactly the bytes that are about to be overwritten, so that the rollback
            # restores the whole access (a fixed 8-byte read would lose the upper part
            # of wider loads and would touch unrelated bytes for narrower ones)
            prev_value = bytes(self._emulator.mem_read(address, size))
            self._store_logs[-1].append((address, prev_value))

            # inject zeros
            self._emulator.mem_write(address, bytes(size))

        # enable access to the faulting page and repeat the instruction
        self._pending_re_execution = True
        actor_id = self._model.state.current_actor.get_id()
        self._model.set_faulty_area_rw(actor_id, True, True)
        return self._curr_instruction_addr

    def _speculate_instruction(self, address: int, size: int) -> None:
        """Drive the re-execution / permission-restore state machine; clear the recorded load"""
        super()._speculate_instruction(address, size)

        # Case 1: this method is called after a fault (i.e., after _speculate_fault)
        #  -> the faulting instruction is being re-executed
        if self._pending_re_execution:
            self._pending_re_execution = False
            self._pending_restore_permissions = True
            self._curr_load = (0, 0)
            return

        # Case 2: this method is called after the first instruction in speculation
        # (i.e., after one call of _speculate_instruction)
        #  -> restore the permissions of the faulting page
        if self._pending_restore_permissions:
            self._pending_restore_permissions = False
            self._restore_faulty_page_permissions(self._model.state.current_actor.get_id())
            self._curr_load = (0, 0)
            return

        # Case 3: any other case
        #  -> Do nothing
        self._curr_load = (0, 0)


class X86UnicornNullAssist(X86UnicornNull):
    """
    Variant of X86UnicornNull that does *not* terminate execution after a fault.
    Instead, it rolls back to the faulting instruction after speculation and executes
    it without a fault.
    """

    def _get_rollback_address(self) -> int:
        # roll back to the faulting instruction itself instead of the fault handler
        return self._curr_instruction_addr


class X86Meltdown(FaultSpeculator):
    """
    Contract in which loads from the faulty region speculatively return the in-memory value
    """

    def __init__(self, target_desc: TargetDesc, model: UnicornModel,
                 taint_tracker: UnicornTaintTracker) -> None:
        super().__init__(target_desc, model, taint_tracker)
        self._errno_that_trigger_speculation = {12, 13}

    def _speculate_fault(self, errno: int) -> int:
        """
        Open a speculation window in which the faulting access is allowed to complete.
        Returns the address of the faulting instruction, or 0 if no speculation takes place.
        """
        if self._fault_triggers_speculation(errno):
            # checkpoint first, so that rollback continues at the rollback address
            self._checkpoint(self._get_rollback_address())

            # lift the protection and let the faulting instruction run again
            actor_id = self._model.state.current_actor.get_id()
            self._model.set_faulty_area_rw(actor_id, True, True)
            return self._curr_instruction_addr
        return 0


class X86NonCanonicalAddress(FaultSpeculator):
    """
    Load from non-canonical address.

    Algorithm:
    - On a fault: store a checkpoint and re-execute the faulting instruction
    - On re-execution of the faulting instruction: if a memory operand consists of a single
      register that holds a non-canonical address, remember the register and its value,
      and replace the value with its canonical form (bits 63..48 copied from bit 47)
    - On the following instruction: write the remembered value back into the register
    """

    # boundaries of the two canonical halves of the 48-bit virtual address space
    _LOW_HALF_MAX: int = 0x00007FFFFFFFFFFF
    _HIGH_HALF_MIN: int = 0xFFFF800000000000

    faulty_instruction_addr: int = -1  # address of the instruction that faulted; -1 if none
    address_register: int = -1  # register constant whose value was patched; -1 if none
    register_value: int = -1  # original (non-canonical) value of the patched register

    def __init__(self, target_desc: TargetDesc, model: UnicornModel,
                 taint_tracker: UnicornTaintTracker) -> None:
        super().__init__(target_desc, model, taint_tracker)
        self._errno_that_trigger_speculation = {6, 7}

    def _speculate_fault(self, errno: int) -> int:
        """
        Start speculation on a fault and request re-execution of the faulting instruction.
        Returns the address of the faulting instruction, or 0 if no speculation takes place.
        """
        if not self._fault_triggers_speculation(errno):
            return 0

        self._checkpoint(self._model.state.fault_handler_addr)
        self.faulty_instruction_addr = self._curr_instruction_addr
        return self._curr_instruction_addr

    def _speculate_instruction(self, address: int, size: int) -> None:
        """Patch the address register of the faulting instruction; undo the patch afterwards"""
        super()._speculate_instruction(address, size)

        if not self._in_speculation:
            return

        model = self._model

        # a register was patched for the previous instruction -> restore its original value
        if self.address_register != -1:
            model.emulator.reg_write(self.address_register, self.register_value)
            self.address_register = -1
            return

        # only the instruction that faulted gets its address fixed
        if self.faulty_instruction_addr != address:
            return

        # Fix non-canonical address
        for mem_op in model.state.current_instruction.get_mem_operands(True):
            # only operands that consist of a single register are handled
            registers = re.split(r"\+|-|\*| ", mem_op.value)
            if len(registers) > 1:
                continue

            uc_reg = self._target_desc.uc_target_desc.reg_str_to_constant[registers[0]]
            load_address: int = model.emulator.reg_read(uc_reg)  # type: ignore

            # both boundary addresses belong to the canonical ranges (inclusive comparison)
            is_canonical: bool = (load_address >= self._HIGH_HALF_MIN
                                  or load_address <= self._LOW_HALF_MAX)
            if is_canonical:
                continue

            # remember the original value; it is written back on the next instruction
            self.address_register = uc_reg
            self.register_value = load_address

            if load_address & (1 << 47):  # bit 47 is 1 => high half, set bits 63..47
                load_address = load_address | self._HIGH_HALF_MIN
            else:  # bit 47 is 0 => low half, clear bits 63..47 and keep all of bits 46..0
                load_address = load_address & self._LOW_HALF_MAX
            model.emulator.reg_write(uc_reg, load_address)
            return
        return

    def reset(self) -> None:
        """Forget the faulting instruction and any pending register patch"""
        self.faulty_instruction_addr = -1
        self.address_register = -1
        self.register_value = -1
        return super().reset()


================================================
FILE: rvzr/model_unicorn/speculators_vs.py
================================================
"""
File: Collection of unknown value speculation speculators for the Unicorn backend.

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
# FIXME: pylint is disabled for this file because it is currently not maintained
# pylint: disable=too-many-instance-attributes, too-many-locals
# pylint: disable=too-many-branches, too-many-statements

from __future__ import annotations

from abc import ABC
from typing import TYPE_CHECKING, Set, Tuple, List, NamedTuple, Dict, Final

import re
from copy import copy

from unicorn import UC_MEM_WRITE

from .speculators_basic import FLAGS_CF, FLAGS_PF, FLAGS_AF, FLAGS_ZF, FLAGS_SF, FLAGS_TF, \
    FLAGS_IF, FLAGS_DF, FLAGS_OF
from .speculators_fault import FaultSpeculator, X86NonCanonicalAddress
from ..tc_components.instruction import RegisterOp, FlagsOp, MemoryOp, AgenOp

if TYPE_CHECKING:
    from ..tc_components.test_case_data import InputData
    from ..target_desc import TargetDesc
    from .model import UnicornModel
    from .taint_tracker import UnicornTaintTracker


class _TaintedValue(NamedTuple):
    """
    A single taint element: a concrete value together with where it was observed.
    The special element with `po == 0` and `label == 0` carries the hash of the whole input.
    """
    po: int  # code offset of the instruction at which the value was read
    label: int  # what the value was read from: a register constant or a memory address
    value: int  # the concrete value that was read


# A taint is an unordered collection of tainted values
Taint = Set[_TaintedValue]

# Maps a flag name to its FLAGS_* bitmask;
# used to project the value of the flags register onto a single flag
_FLAG_NAME_TO_BITMASK: Final[Dict[str, int]] = {
    "CF": FLAGS_CF,
    "PF": FLAGS_PF,
    "AF": FLAGS_AF,
    "ZF": FLAGS_ZF,
    "SF": FLAGS_SF,
    "TF": FLAGS_TF,
    "IF": FLAGS_IF,
    "DF": FLAGS_DF,
    "OF": FLAGS_OF
}


class _VspecBaseSpeculator(FaultSpeculator, ABC):
    """
    Base class for unknown value speculation, implementing VSOps algorithm.

    The algorithm is described in Section 6 of the paper "Speculation at Fault: Modeling and Testing
    Microarchitectural Leakage of CPU Exceptions" by Hofmann et al.
    """
    _input_hash: int = 0
    _full_input_taint: _TaintedValue
    _reg_taints: Dict[str, Taint]
    """ reg_taints: taints of registers """
    _reg_taints_checkpoints: List[Dict[str, Taint]]
    _mem_taints: Dict[int, Taint]
    """ mem_taints: taints of memory locations """
    _mem_taints_checkpoints: List[Dict[int, Taint]]
    _whole_memory_tainted: bool = False
    """ whole_memory_tainted: overapproximation recording whole memory as being corrupted/tainted"""
    _whole_memory_tainted_checkpoints: List[bool]
    _curr_observation: Taint = set()
    """ _curr_observation: taints+values that need to be leaked if current instruction is
        a memory access """
    _curr_mem_load: Tuple[int, int] = (-1, -1)
    """ _curr_mem_load: address and size of last memory load (needed in case of exception) """
    _curr_mem_store: Tuple[int, int] = (-1, -1)
    """ _curr_mem_store: address and size of last memory store (needed in case of exception) """
    _curr_dest_regs: List[str] = []
    """ _curr_dest_regs: current destination registers """
    _curr_dest_regs_sizes: Dict[str, int]
    """ curr_dest_regs_sizes: width of current destination registers, i.e., whether only part of
        register gets overwritten """
    _curr_taint: Taint
    """ curr_taint: current taint+values that are propagated from _speculate_instruction()
        to trace_mem_access() """
    _curr_src_tainted: bool = False
    """ remembers if any source operand was tainted in _speculate_instruction """
    _next_instruction_addr: int = 0

    def __init__(self, target_desc: TargetDesc, model: UnicornModel,
                 taint_tracker: UnicornTaintTracker) -> None:
        """
        Initialize the taint-tracking state of the speculator.

        Raises:
            NotImplementedError: always; this class and its subclasses are not maintained
        """
        super().__init__(target_desc, model, taint_tracker)
        self._errno_that_trigger_speculation = {6, 7, 12, 13}

        self._reg_taints = {}
        self._reg_taints_checkpoints = []
        self._mem_taints = {}
        self._mem_taints_checkpoints = []
        self._whole_memory_tainted_checkpoints = []
        self._curr_dest_regs_sizes = {}
        self._curr_taint = set()
        # give every instance its own containers; the class-level defaults are mutable objects
        # that would otherwise be shared (and mutated in place) by all instances
        self._curr_observation = set()
        self._curr_dest_regs = []
        self._full_input_taint = _TaintedValue(0, 0, self._input_hash)

        raise NotImplementedError("This class and its subclasses are no longer maintained. "
                                  "If you need this functionality, please contact the maintainers")
        # NOTE: search for FIXME comments for a list of known issues in this class

    def _load_input(self, input_: InputData) -> None:
        """Bind the speculator to a new input and clear all per-instruction state"""
        # FIXME:
        # _load_input interface no longer exists; this functionality should be moved
        #    another method (reset() is a good candidate)

        # the whole input is represented by a single taint element built from its hash
        self._input_hash = hash(input_)
        self._full_input_taint = _TaintedValue(0, 0, self._input_hash)

        # per-instruction scratch state starts from scratch
        self._curr_observation = set()
        self._curr_taint = set()
        self._curr_dest_regs = []
        self._curr_dest_regs_sizes = {}
        self._curr_mem_load = (-1, -1)
        self._curr_mem_store = (-1, -1)
        self._curr_src_tainted = False

        # taints and their checkpoints must not leak from the previous input
        leftovers = (
            self._reg_taints,
            self._reg_taints_checkpoints,
            self._mem_taints,
            self._mem_taints_checkpoints,
            self._whole_memory_tainted_checkpoints,
        )
        for container in leftovers:
            assert len(container) == 0
        assert not self._whole_memory_tainted
        # super()._load_input(input_)

    def _assemble_reg_values(self, regs: Set[str]) -> Tuple[Taint, bool]:
        """
        Aggregate the values of all registers in `regs`.
        If a register is tainted, its taint is used instead of its current value.

        Returns a pair of:
        - the set of register values (usable as taints)
        - a Boolean flag indicating whether at least one of the registers was tainted
        """
        reg_values: Taint = set()
        reg_values_tainted = False

        for reg in regs:
            if reg in self._reg_taints:
                reg_values.update(self._reg_taints[reg])
                # remember that one of registers was tainted
                reg_values_tainted = True
                continue

            # untainted register -> record its current value
            reg_id = self._uc_target_desc.reg_norm_to_constant[reg]
            reg_value: int = self._emulator.reg_read(reg_id)  # type: ignore
            # if register is a flag, project the flags register onto that flag (0 or 1)
            if reg in _FLAG_NAME_TO_BITMASK:
                reg_value = int((reg_value & _FLAG_NAME_TO_BITMASK[reg]) != 0)
            pc = self._model.layout.code_addr_to_offset(self._curr_instruction_addr)
            reg_values.add(_TaintedValue(pc, reg_id, reg_value))

        return reg_values, reg_values_tainted

    def _set_taint(self, reg: str, taint: Taint) -> None:
        """Assign `taint` to `reg`; a taint containing the input hash collapses to that hash"""
        depends_on_whole_input = self._full_input_taint in taint
        self._reg_taints[reg] = {self._full_input_taint} if depends_on_whole_input else taint

    def _update_reg_taints(self) -> None:
        """
        Propagate the current taint to the current destination registers.
        Special cases:
          1) only the lower bits of a register are written, so its old taint (or, if it
             had none, its current value) is kept alongside the new taint
          2) the source is not tainted but the destination is, so a full overwrite
             removes the destination's taint
        """
        for reg in self._curr_dest_regs:
            already_tainted = reg in self._reg_taints

            # untainted destination and untainted source -> nothing to propagate
            if not already_tainted and not self._curr_src_tainted:
                continue

            # flags have no recorded size; registers narrower than 64 bits are partial writes
            partial_write = self._curr_dest_regs_sizes.get(reg, 64) < 64

            if already_tainted:
                if partial_write:
                    # the untouched upper bits keep the old taint
                    self._set_taint(reg, self._reg_taints[reg] | self._curr_taint)
                elif self._curr_src_tainted:
                    # full overwrite with tainted data replaces the old taint
                    self._set_taint(reg, self._curr_taint)
                else:
                    # full overwrite with untainted data clears the taint
                    self._reg_taints.pop(reg, None)
                continue

            # from here on: destination not tainted yet, source tainted
            if not partial_write:
                self._set_taint(reg, self._curr_taint)
                continue

            # partial write -> the value currently in the register becomes part of the taint
            reg_id = self._uc_target_desc.reg_norm_to_constant[reg]
            reg_value: int = self._emulator.reg_read(reg_id)  # type: ignore
            pc = self._model.layout.code_addr_to_offset(self._curr_instruction_addr)
            self._set_taint(reg, {_TaintedValue(pc, reg_id, reg_value)} | self._curr_taint)

    def _get_curr_load_taint(self) -> _TaintedValue:
        """Build the taint element for the bytes at the most recent load address"""
        address, size = self._curr_mem_load
        raw_bytes = self._emulator.mem_read(address, size)
        loaded_value = int.from_bytes(raw_bytes, 'little')
        pc = self._model.layout.code_addr_to_offset(self._curr_instruction_addr)
        return _TaintedValue(pc, address, loaded_value)

    def _speculate_fault(self, errno: int) -> int:
        """
        Start speculation past a faulting instruction and taint everything it would write.
        Returns the address of the next instruction, or 0 if no speculation takes place.
        """
        if not self._fault_triggers_speculation(errno):
            return 0

        # start speculation
        # set the rollback address
        self._checkpoint(self._get_rollback_address())

        # new taints are collected only if none of the src operands of the faulting
        # instruction are tainted; if they are, the taints have already been propagated
        # correctly, so the fault is simply ignored
        if self._curr_src_tainted:
            return self._get_next_instruction()

        instruction = self._model.state.current_instruction
        normalize = self._target_desc.reg_normalized

        # collect the registers and flags read by the instruction,
        # and record the ones it writes as the current destinations
        src_regs = set()
        for operand in instruction.get_all_operands():
            if isinstance(operand, RegisterOp):
                if operand.src:
                    src_regs.add(normalize[operand.value])
                if operand.dest:
                    dest_name = normalize[operand.value]
                    self._curr_dest_regs.append(dest_name)
                    self._curr_dest_regs_sizes[dest_name] = operand.width
            elif isinstance(operand, FlagsOp):
                src_regs.update(operand.get_flags_by_type('read'))
                self._curr_dest_regs.extend(operand.get_flags_by_type('write'))

        # the taint consists of all the values the faulting instruction depends on:
        # the values of the src registers, plus the loaded value if there is a load
        self._curr_taint, _ = self._assemble_reg_values(src_regs)
        if instruction.has_read():
            self._curr_taint.add(self._get_curr_load_taint())

        # a faulting store taints every byte it would have written
        if instruction.has_write():
            store_address = self._curr_mem_store[0]
            store_size = self._curr_mem_store[1]
            for offset in range(store_size):
                self._mem_taints[store_address + offset] = self._curr_taint

        # need to set _curr_src_tainted to make update_reg_taints call work
        self._curr_src_tainted = True
        self._update_reg_taints()

        return self._get_next_instruction()

    def _get_next_instruction(self) -> int:
        # speculatively skip the faulting instruction
        if self._model.state.is_exit_addr(self._next_instruction_addr):
            return 0  # no need for speculation if we're at the end
        return self._next_instruction_addr

    def _speculate_instruction(self, address: int, size: int) -> None:
        """
        Track how taints move through system and produce correct observations.

        The per-instruction tracking state is always reset. Taints are propagated only while
        in speculation and while at least one register or memory taint exists.

        :param address: address of the current instruction
        :param size: instruction size passed by the caller; replaced by the size recorded for
                     the current instruction when that size is non-zero and differs
        """
        # check that the instruction size is correct (may be wrong for invalid instructions)
        if self._model.state.current_instruction.size() not in [0, size]:
            size = self._model.state.current_instruction.size()
        self._next_instruction_addr = address + size

        # print('current taints:', self.reg_taints, self.mem_taints)
        # print('current instruction:', self._model.state.current_instruction)

        # reset observation set, current taint and src/dest register bookkeeping
        # this must happen before we check if we can skip, otherwise trace_mem_access might
        # use old values
        self._curr_observation = set()
        self._curr_taint = set()
        self._curr_dest_regs = []
        self._curr_dest_regs_sizes = {}
        self._curr_src_tainted = False
        # might be needed when contract is refined recording which part of register is tainted
        # src_regs_sizes = dict()

        # track taints only after faults with non-empty taints
        if not self._in_speculation or (not self._reg_taints and not self._mem_taints):
            return

        src_regs = set()  # registers/flags read directly by the instruction
        mem_src_regs = set()  # registers used to form the address of a load
        mem_dest_regs = set()  # registers used to form the address of a store

        # assemble source and destination registers of instruction
        # distinguish between normal registers and registers used in memory access
        # some code duplication, with method _speculate_fault()
        for op in self._model.state.current_instruction.get_all_operands():
            if isinstance(op, RegisterOp):
                if op.src:
                    op_normalized = self._target_desc.reg_normalized[op.value]
                    src_regs.add(op_normalized)
                    # src_regs_sizes[op_normalized] = op.width
                if op.dest:
                    op_normalized = self._target_desc.reg_normalized[op.value]
                    self._curr_dest_regs.append(op_normalized)
                    self._curr_dest_regs_sizes[op_normalized] = op.width
            elif isinstance(op, MemoryOp):
                # split the address expression into tokens and keep those that are registers
                for sub_op in re.split(r'\+|-|\*| ', op.value):
                    if sub_op and sub_op in self._target_desc.reg_normalized:
                        normalized = self._target_desc.reg_normalized[sub_op]
                        if op.src:
                            mem_src_regs.add(normalized)
                        if op.dest:
                            mem_dest_regs.add(normalized)
            elif isinstance(op, FlagsOp):
                # print('read flags:', op.get_flags_by_type('read'))
                # print('write flags:', op.get_flags_by_type('write'))
                src_regs.update(op.get_flags_by_type('read'))
                self._curr_dest_regs.extend(op.get_flags_by_type('write'))
            elif isinstance(op, AgenOp):
                # address-generation operands are expected only for lea; their registers are
                # plain sources because no memory is accessed
                assert self._model.state.current_instruction.name == "lea"
                assert op.src
                for sub_op in re.split(r'\[|\]|\+|-|\*| ', op.value):
                    if sub_op and sub_op in self._target_desc.reg_normalized:
                        normalized = self._target_desc.reg_normalized[sub_op]
                        src_regs.add(normalized)

        # assemble values of memory dest registers. if tainted, use taint instead
        mem_dest_reg_values, _ = self._assemble_reg_values(mem_dest_regs)

        # check if instruction attempted store using tainted register
        #     => location of store unknown
        tainted_mem_dest_regs = mem_dest_regs & self._reg_taints.keys()
        if tainted_mem_dest_regs:
            assert self._model.state.current_instruction.has_write()
            # record observation of store
            # leaks taint if tainted register is used
            self._curr_observation = self._curr_observation | mem_dest_reg_values
            # as destination is not known, whole memory is tainted (implicitly with input hash)
            self._whole_memory_tainted = True
            # TODO: can we write to registers and memory within one instruction? if not, return
            # if yes, other destination registers might get tainted, so continue

        # assemble values of memory src registers. if tainted, use taint instead
        mem_src_reg_values, _ = self._assemble_reg_values(mem_src_regs)

        # check if instruction attempted load using tainted register
        #     => location of load unknown
        tainted_mem_src_regs = mem_src_regs & self._reg_taints.keys()

        if tainted_mem_src_regs and not self._model.state.current_instruction.name == "lea":
            assert self._model.state.current_instruction.has_read()
            # record observation of load
            # leaks taint if tainted register is used
            self._curr_observation = self._curr_observation | mem_src_reg_values
            # load from tainted value returns content of unknown address
            #     => taint dest registers with input hash (represents full architectural state)
            # remember current taint in case store address needs to be tainted in trace_mem_access()
            self._curr_taint = {self._full_input_taint}
            # all destination registers refer to the same taint set object
            for reg in self._curr_dest_regs:
                self._reg_taints[reg] = self._curr_taint
            # remember that instruction depended on tainted operand
            self._curr_src_tainted = True
            # all dest regs are tainted with maximal taint, we can return
            return

        # assemble value of all src regs, use taint if tainted
        self._curr_taint, self._curr_src_tainted = self._assemble_reg_values(src_regs)
        self._update_reg_taints()

    def _speculate_mem_access(self, access: int, address: int, size: int, value: int) -> None:
        """
        Record a memory access and, while in speculation, propagate taints through it.

        :param access: access type; UC_MEM_WRITE is handled as a store, anything else as a load
        :param address: start address of the access
        :param size: number of accessed bytes
        :param value: not used by this method
        """
        # remember last address and size in case of exception
        if access != UC_MEM_WRITE:
            self._curr_mem_load = (address, size)
        else:
            self._curr_mem_store = (address, size)

        if not self._in_speculation:
            # FIXME: this branch should enable/disable tracing via self._model.tracer.enable_tracing
            return

        # read before branching; only the untainted-load path below uses the result
        mem_value = self._model.emulator.mem_read(address, size)

        if access != UC_MEM_WRITE:
            # for loads, check if address is tainted
            # Test if any address in the range of address+size is tainted
            is_tainted: bool = False
            taints = set()
            for i in range(size):
                if address + i in self._mem_taints:
                    is_tainted = True
                    taints.update(self._mem_taints[address + i])

            # add address taint to current taint
            if is_tainted:
                self._curr_taint.update(taints)
            elif self._whole_memory_tainted:
                self._curr_taint.add(self._full_input_taint)

            if is_tainted or self._whole_memory_tainted:
                # remember that instruction used tainted src value and update taint of dest
                # registers with address taint
                self._curr_src_tainted = True
                self._update_reg_taints()
            else:
                # if the accessed bytes are not tainted, add the value stored at the address
                # to the current taint and update the taints of the dest registers
                mem_value_int = int.from_bytes(mem_value, 'little')
                pc = self._model.layout.code_addr_to_offset(self._curr_instruction_addr)
                self._curr_taint.add(_TaintedValue(pc, address, mem_value_int))
                self._update_reg_taints()

        if access == UC_MEM_WRITE:
            # check if any src operand was tainted (memory location or register)
            if not self._curr_src_tainted:
                # if there is no current taint, remove possible taint from current address range
                for i in range(size):
                    self._mem_taints.pop(address + i, None)
            # if src was tainted, add current taint to current address range
            #     check if whole memory is already tainted, then nothing has to be done
            elif not self._whole_memory_tainted:
                for i in range(size):
                    self._mem_taints[address + i] = self._curr_taint

        # check if the memory access creates a tainted observation
        if self._curr_observation:
            # if current observation contains full architectural state info, then only leak the hash
            if self._full_input_taint in self._curr_observation:
                self._curr_observation = {self._full_input_taint}
            # NOTE: the sorted list is currently not consumed; the tracer call that would
            # record it is commented out below
            observation_list = list(self._curr_observation)
            observation_list.sort()
            # print('leaking observation', observation_list)
            # observation_hash = hash(tuple(observation_list))
            # just append hash to trace, don't do normal memory access
            # FIXME: this should be replaced with a public call to the tracer
            # self._model.tracer._add_dependencies_to_trace(observation_hash)
        # if not, do normal memory access
        else:
            pass
            # FaultSpeculator.trace_mem_access(emulator, access, address, size, value, model)

    def _checkpoint(self, next_instruction_addr: int, include_current_inst: bool = True) -> None:
        """
        Snapshot the taint-tracking state, then let the parent class store its checkpoint.

        :param next_instruction_addr: forwarded unchanged to the parent implementation
        :param include_current_inst: forwarded unchanged to the parent implementation
        """
        # take the snapshots of register taints, memory taints and the whole-memory flag
        reg_snapshot = copy(self._reg_taints)
        mem_snapshot = copy(self._mem_taints)
        whole_mem_snapshot = copy(self._whole_memory_tainted)

        # push them onto their stacks; rollback() pops them in the same order
        self._reg_taints_checkpoints.append(reg_snapshot)
        self._mem_taints_checkpoints.append(mem_snapshot)
        self._whole_memory_tainted_checkpoints.append(whole_mem_snapshot)

        return super()._checkpoint(next_instruction_addr, include_current_inst=include_current_inst)

    def rollback(self) -> int:
        """
        Restore the most recently checkpointed taint state, then roll back the parent state.

        :return: the value returned by the parent rollback()
        """
        restored_regs = self._reg_taints_checkpoints.pop()
        restored_mem = self._mem_taints_checkpoints.pop()
        restored_whole_mem = self._whole_memory_tainted_checkpoints.pop()

        self._reg_taints = restored_regs
        self._mem_taints = restored_mem
        self._whole_memory_tainted = restored_whole_mem

        return super().rollback()

    def _get_rollback_address(self) -> int:
        # faults end program execution
        return self._model.state.fault_handler_addr


class VspecDIVSpeculator(_VspecBaseSpeculator):
    """ Operand value speculation that is triggered by division errors only """

    def __init__(self, target_desc: TargetDesc, model: UnicornModel,
                 taint_tracker: UnicornTaintTracker) -> None:
        super().__init__(target_desc, model, taint_tracker)
        # DIV exceptions only; 21 is UC_ERR_EXCEPTION in Unicorn's uc_err enum
        uc_err_exception = 21
        self._errno_that_trigger_speculation = {uc_err_exception}


class VspecMemoryFaultsSpeculator(_VspecBaseSpeculator):
    """ Operand value speculation on page faults and other memory errors """

    # flags of the (currently disabled) re-execution protocol; see the FIXME notes below
    pending_restore_protection: bool = False
    pending_re_execution: bool = False

    def __init__(self, target_desc: TargetDesc, model: UnicornModel,
                 taint_tracker: UnicornTaintTracker) -> None:
        super().__init__(target_desc, model, taint_tracker)
        # Page faults and other memory errors; values as in Unicorn's uc_err enum:
        # UC_ERR_READ_UNMAPPED, UC_ERR_WRITE_UNMAPPED, UC_ERR_WRITE_PROT, UC_ERR_READ_PROT
        read_unmapped, write_unmapped = 6, 7
        write_prot, read_prot = 12, 13
        self._errno_that_trigger_speculation = {
            read_unmapped, write_unmapped, write_prot, read_prot
        }

    def _get_curr_load_taint(self) -> _TaintedValue:
        """
        Build the taint label for a faulting load.

        The loaded value is undefined for faulting loads, so the label carries 0 instead of
        the memory content and the value is thereby excluded from the dependencies.
        """
        faulting_addr = self._curr_mem_load[0]
        code_offset = self._model.layout.code_addr_to_offset(self._curr_instruction_addr)
        return _TaintedValue(code_offset, faulting_addr, 0)

    def _speculate_instruction(self, address: int, size: int) -> None:
        """
        Advance the pending-protection flags, then run the inherited taint propagation.

        :param address: forwarded to the parent implementation
        :param size: forwarded to the parent implementation
        """
        if self.pending_restore_protection:
            self.pending_restore_protection = False
            # FIXME: this is outdated;
            # see speculator_faults.py:X86UnicornNull for a maintained implementation
            # of a similar algorithm
            # aid = self._model.state.current_actor.get_id()
            # if self.rw_forbidden[aid]:
            #     self._model.set_faulty_area_rw(self._model.state.current_actor.get_id(), False,
            #                                    False)
            # elif self.w_forbidden[aid]:
            #     self._model.set_faulty_area_rw(self._model.state.current_actor.get_id(), True,
            #                                    False)
        elif self.pending_re_execution:
            # the re-executed instruction is running now; restore protection on the next one
            self.pending_re_execution, self.pending_restore_protection = False, True
        super()._speculate_instruction(address, size)

    def _get_next_instruction(self) -> int:
        """
        Return the address at which speculation continues after the fault.

        :return: 0 at an exit address (no need for speculation at the end), otherwise the
                 address of the next instruction
        """
        next_addr = self._next_instruction_addr
        # FIXME: uses outdated interfaces
        # aid = self.current_actor.get_id()
        # if self.pending_fault == UC_ERR_WRITE_PROT and self.w_forbidden[aid]:
        #     # remove protection
        #     self._model.set_faulty_area_rw(self.current_actor.get_id(), True, True)
        #     self.pending_re_execution = True
        #     return self._curr_instruction_addr
        return 0 if self._model.state.is_exit_addr(next_addr) else next_addr


class VspecMemoryAssistsSpeculator(VspecMemoryFaultsSpeculator):
    """ Operand value speculation on page faults with memory assists """

    def __init__(self, target_desc: TargetDesc, model: UnicornModel,
                 taint_tracker: UnicornTaintTracker) -> None:
        super().__init__(target_desc, model, taint_tracker)
        # protection faults only: UC_ERR_WRITE_PROT and UC_ERR_READ_PROT in Unicorn's uc_err enum
        write_prot, read_prot = 12, 13
        self._errno_that_trigger_speculation = {write_prot, read_prot}

    def rollback(self) -> int:
        """
        Roll back one checkpoint; once speculation is over, make the faulty area accessible.

        :return: the value returned by the parent rollback()
        """
        resume_addr = super().rollback()
        if self._in_speculation:
            return resume_addr

        # remove protection after the assist has completed
        actor_id = self._model.state.current_actor.get_id()
        self._model.set_faulty_area_rw(actor_id, True, True)
        return resume_addr

    def _get_rollback_address(self) -> int:
        """
        Select the rollback target for a new checkpoint.

        :return: the current instruction address when speculation is not yet active;
                 the fault handler address when the fault occurs inside speculation
        """
        if not self._in_speculation:
            return self._curr_instruction_addr
        return self._model.state.fault_handler_addr


class VspecGPSpeculator(_VspecBaseSpeculator, X86NonCanonicalAddress):
    """
    Operand value speculation on General Protection Faults.

    Addresses recorded for the faulting access are mapped to their canonical form before
    they are used to read memory or to taint stored bytes.
    """

    address_register: int
    register_value: int

    def __init__(self, target_desc: TargetDesc, model: UnicornModel,
                 taint_tracker: UnicornTaintTracker) -> None:
        super().__init__(target_desc, model, taint_tracker)
        # extend (not replace) the inherited trigger set with errno 6 and 7, which are
        # UC_ERR_READ_UNMAPPED and UC_ERR_WRITE_UNMAPPED in Unicorn's uc_err enum
        self._errno_that_trigger_speculation.update([6, 7])

    # def _speculate_fault(self, errno: int) -> int:
    #     if not self._fault_triggers_speculation(errno):
    #         return 0

    #     self._checkpoint(self._model.state.fault_handler_addr)
    #     self.faulty_instruction_addr = self._curr_instruction_addr
    #     return self._curr_instruction_addr

    def _speculate_fault(self, errno: int) -> int:
        """
        Taint the outputs of the faulting instruction with the values it depends on.

        Unlike the base implementation, no checkpoint is stored here.

        :param errno: error code of the fault
        :return: 0 if the fault does not trigger speculation; otherwise the address of the
                 current (faulting) instruction
        """
        if not self._fault_triggers_speculation(errno):
            return 0

        # only collect new taints if none of the src operands in the faulting instruction are
        # tainted; if they are, the taints have been propagated correctly already,
        # so just ignore the fault
        if not self._curr_src_tainted:

            # collect registers and flags occurring in src and destination operands
            # src_regs = registers/flags read by the instruction
            # self._curr_dest_regs = registers/flags written by the instruction
            # (registers that only appear inside memory operands are not collected here)
            src_regs = set()
            for op in self._model.state.current_instruction.get_all_operands():
                if isinstance(op, RegisterOp):
                    if op.src:
                        op_normalized = self._target_desc.reg_normalized[op.value]
                        src_regs.add(op_normalized)
                        # src_regs_sizes[op_normalized] = op.width
                    if op.dest:
                        op_normalized = self._target_desc.reg_normalized[op.value]
                        self._curr_dest_regs.append(op_normalized)
                        self._curr_dest_regs_sizes[op_normalized] = op.width
                elif isinstance(op, FlagsOp):
                    src_regs.update(op.get_flags_by_type('read'))
                    self._curr_dest_regs.extend(op.get_flags_by_type('write'))

            # source values = values of src regs (+ the loaded value, added below)
            # these are all the values the faulting instruction depends on
            self._curr_taint, _ = self._assemble_reg_values(src_regs)

            if self._model.state.current_instruction.has_read():
                # the value is read from the canonical form of the recorded load address
                address = self._curr_mem_load[0]
                address = self._noncanonical_to_canonical(address)
                size = self._curr_mem_load[1]
                mem_value = self._emulator.mem_read(address, size)
                mem_value_int = int.from_bytes(mem_value, 'little')
                pc = self._model.layout.code_addr_to_offset(self._curr_instruction_addr)
                self._curr_taint.add(_TaintedValue(pc, address, mem_value_int))

            if self._model.state.current_instruction.has_write():
                # the bytes at the canonical form of the recorded store address are tainted
                address = self._curr_mem_store[0]
                address = self._noncanonical_to_canonical(address)
                size = self._curr_mem_store[1]
                for i in range(size):
                    self._mem_taints[address + i] = self._curr_taint

            # need to set _curr_src_tainted to make update_reg_taints call work
            self._curr_src_tainted = True
            self._update_reg_taints()

        # resume at the faulting instruction itself (it is not skipped here)
        return self._curr_instruction_addr

    def _speculate_mem_access(self, access: int, address: int, size: int, value: int) -> None:
        """
        Handle a memory access; accesses of the faulty instruction first go through
        _speculate_fault().

        :param access: access type; UC_MEM_WRITE is handled as a store, anything else as a load
        :param address: start address of the access
        :param size: number of accessed bytes
        :param value: forwarded unchanged to the parent implementation
        """
        if self._curr_instruction_addr == self.faulty_instruction_addr:
            # record the access first, because _speculate_fault() reads these fields
            if access != UC_MEM_WRITE:
                self._curr_mem_load = (address, size)
            else:
                self._curr_mem_store = (address, size)
            self._speculate_fault(6)
        super()._speculate_mem_access(access, address, size, value)

    def _speculate_instruction(self, address: int, size: int) -> None:
        """
        Dispatch the per-instruction hook to the parent implementations.

        :param address: address of the current instruction
        :param size: size of the current instruction
        """
        # NOTE(review): super(X, self) starts the MRO lookup *after* X, so the first call
        # resolves to the implementation following X86NonCanonicalAddress and the second
        # one to the implementation following _VspecBaseSpeculator - not to the
        # implementations of those two classes themselves. Confirm that this is intended.
        super(X86NonCanonicalAddress, self)._speculate_instruction(address, size)
        if address != self.faulty_instruction_addr:
            super(_VspecBaseSpeculator, self)._speculate_instruction(address, size)

    def _noncanonical_to_canonical(self, address: int) -> int:
        """
        Map an address to its canonical form by extending bit 47 into bits 48..63.

        :param address: address whose upper bits may not match bit 47
        :return: the address with bits 48..63 set if bit 47 is set; otherwise the address
                 reduced to its bits 0..46
        """
        if address & (1 << 47):  # bit 47 (the 48th bit) is 1 => high address
            address = address | 0xFFFF800000000000
        else:  # bit 47 is 0 => low address
            # keep all 47 low bits; the previous literal mask was one hex digit short and
            # also cleared bits 43..46
            address = address & ((1 << 47) - 1)
        return address

    def _get_rollback_address(self) -> int:
        """
        Return the rollback target.

        :return: address of the fault handler
        """
        return self._model.state.fault_handler_addr

    def reset(self) -> None:
        """ Clear the fault bookkeeping (-1 is used as the 'unset' value) and reset the parent """
        self.faulty_instruction_addr = -1
        self.address_register = -1
        self.register_value = -1
        return super().reset()


class VspecAllSpeculator(_VspecBaseSpeculator):
    """
    Most permissive contract.

    Behaves like the vspec-unknown contract, except that after an exception the
    destination operands depend on the full architectural state (= on the full input)
    rather than on the values of the src operands.
    """

    def _speculate_fault(self, errno: int) -> int:
        """
        Start speculation after a fault and taint all outputs with the full-input taint.

        :param errno: error code of the fault
        :return: 0 if the fault does not trigger speculation; otherwise the result of
                 _get_next_instruction()
        """
        if not self._fault_triggers_speculation(errno):
            return 0

        # start speculation: store a checkpoint
        self._checkpoint(self._get_rollback_address())

        # if a src operand of the faulting instruction is tainted, the taints have been
        # propagated correctly already, so the fault needs no extra handling
        if self._curr_src_tainted:
            return self._get_next_instruction()

        instruction = self._model.state.current_instruction

        # collect the registers and flags written by the instruction
        for operand in instruction.get_all_operands():
            if isinstance(operand, RegisterOp):
                if operand.dest:
                    self._curr_dest_regs.append(self._target_desc.reg_normalized[operand.value])
            elif isinstance(operand, FlagsOp):
                self._curr_dest_regs.extend(operand.get_flags_by_type('write'))

        # stored bytes depend on the full input
        if instruction.has_write():
            store_addr, store_size = self._curr_mem_store[0], self._curr_mem_store[1]
            for offset in range(store_size):
                self._mem_taints[store_addr + offset] = {self._full_input_taint}

        # taint destination registers with hash of full input (represents architectural state)
        for dest_reg in self._curr_dest_regs:
            self._reg_taints[dest_reg] = {self._full_input_taint}

        return self._get_next_instruction()


class VspecAllDIVSpeculator(VspecAllSpeculator):
    """ Any-value speculation that is triggered by division errors only """

    def __init__(self, target_desc: TargetDesc, model: UnicornModel,
                 taint_tracker: UnicornTaintTracker) -> None:
        super().__init__(target_desc, model, taint_tracker)
        # DIV exceptions only; 21 is UC_ERR_EXCEPTION in Unicorn's uc_err enum
        uc_err_exception = 21
        self._errno_that_trigger_speculation = {uc_err_exception}


class VspecAllMemoryFaultsSpeculator(VspecAllSpeculator):
    """ Any-value speculation on page faults and other memory errors """

    # flags of the (currently disabled) re-execution protocol; see the FIXME notes below
    pending_restore_protection: bool = False
    pending_re_execution: bool = False

    def __init__(self, target_desc: TargetDesc, model: UnicornModel,
                 taint_tracker: UnicornTaintTracker) -> None:
        super().__init__(target_desc, model, taint_tracker)
        # Page faults and other memory errors; values as in Unicorn's uc_err enum:
        # UC_ERR_READ_UNMAPPED, UC_ERR_WRITE_UNMAPPED, UC_ERR_WRITE_PROT, UC_ERR_READ_PROT
        read_unmapped, write_unmapped = 6, 7
        write_prot, read_prot = 12, 13
        self._errno_that_trigger_speculation = {
            read_unmapped, write_unmapped, write_prot, read_prot
        }

    def _speculate_instruction(self, address: int, size: int) -> None:
        """
        Advance the pending-protection flags and, unless the instruction is a re-execution,
        run the inherited taint propagation.

        :param address: forwarded to the parent implementation
        :param size: forwarded to the parent implementation
        """
        if self.pending_restore_protection:
            self.pending_restore_protection = False
            # FIXME: this is outdated;
            # see speculator_faults.py:X86UnicornNull for a maintained implementation
            # of a similar algorithm
            # aid = self._model.state.current_actor.get_id()
            # if self.rw_forbidden[aid]:
            #     self._model.set_faulty_area_rw(self._model.state.current_actor.get_id(), False,
            #                                    False)
            # elif self.w_forbidden[aid]:
            #     self._model.set_faulty_area_rw(self._model.state.current_actor.get_id(), True,
            #                                    False)
        elif self.pending_re_execution:
            # the re-executed instruction is not tracked; restore protection on the next one
            self.pending_re_execution, self.pending_restore_protection = False, True
            return
        super()._speculate_instruction(address, size)

    def _get_next_instruction(self) -> int:
        """
        Return the address at which speculation continues after the fault.

        :return: 0 at an exit address (no need for speculation at the end), otherwise the
                 address of the next instruction
        """
        next_addr = self._next_instruction_addr
        # FIXME: uses outdated interfaces
        # aid = self.current_actor.get_id()
        # if self.pending_fault == UC_ERR_WRITE_PROT and self.w_forbidden[aid]:
        #     # remove protection
        #     self._model.set_faulty_area_rw(self.current_actor.get_id(), True, True)
        #     self.pending_re_execution = True
        #     return self._curr_instruction_addr
        return 0 if self._model.state.is_exit_addr(next_addr) else next_addr


class VspecAllMemoryAssistsSpeculator(VspecAllSpeculator):
    """ Any-value speculation on A/D-bit microcode assists (MDS style) """

    def __init__(self, target_desc: TargetDesc, model: UnicornModel,
                 taint_tracker: UnicornTaintTracker) -> None:
        super().__init__(target_desc, model, taint_tracker)
        # protection faults only: UC_ERR_WRITE_PROT and UC_ERR_READ_PROT in Unicorn's uc_err enum
        write_prot, read_prot = 12, 13
        self._errno_that_trigger_speculation = {write_prot, read_prot}

    def rollback(self) -> int:
        """
        Roll back one checkpoint; once speculation is over, make the faulty area accessible.

        :return: the value returned by the parent rollback()
        """
        resume_addr = super().rollback()
        if self._in_speculation:
            return resume_addr

        # remove protection after the assist has completed
        actor_id = self._model.state.current_actor.get_id()
        self._model.set_faulty_area_rw(actor_id, True, True)
        return resume_addr

    def _get_rollback_address(self) -> int:
        """
        Select the rollback target for a new checkpoint.

        :return: the current instruction address when speculation is not yet active;
                 the fault handler address when the fault occurs inside speculation
        """
        if not self._in_speculation:
            return self._curr_instruction_addr
        return self._model.state.fault_handler_addr


================================================
FILE: rvzr/model_unicorn/taint_tracker.py
================================================
"""
File: Taint tracking implementation for the Unicorn model

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from __future__ import annotations

import copy
import re
from typing import List, Optional, Set, Dict, TYPE_CHECKING, Literal, Final
from typing_extensions import assert_never

from ..tc_components.instruction import Instruction, RegisterOp, FlagsOp, \
    MemoryOp, AgenOp, ImmediateOp, LabelOp, CondOp
from ..tc_components.test_case_data import InputTaint
from ..target_desc import TargetDesc
from ..sandbox import SandboxLayout, DataArea
from ..config import CONF

if TYPE_CHECKING:
    from ..target_desc import UnicornTargetDesc
    from ..sandbox import BaseAddrTuple, DataAddr

# Closed set of string tags for tainted values
# NOTE(review): the users of this alias are outside this excerpt - presumably it tags
# program-counter, memory-address and loaded-value observations; confirm against callers
TAINTED_VALUE_TYPE = Literal["pc", "mem", "ld_val"]
# Labels that UnicornTaintTracker.__init__ installs as initial observations on x86-64 when
# CONF.contract_observation_clause is 'ctr' or 'arch'
_ARCH_INITIAL_OBSERVATIONS_X86_64 = [
    "A", "B", "C", "D", "SI", "DI", "RSP", "CF", "PF", "AF", "ZF", "SF", "TF", "IF", "DF", "OF",
    "AC"
]
# Same as above for arm64
_ARCH_INITIAL_OBSERVATIONS_ARM64 = ["R0", "R1", "R2", "R3", "R4", "R5", "N", "Z", "C", "V"]


# ==================================================================================================
# Public Interface: Taint Tracker
# ==================================================================================================
class UnicornTaintTracker:
    """
    Tracking of the input data that impacts contract traces.

    Dependencies and taints are expressed in terms of string labels: normalized register
    names, flag names, or hex-formatted memory offsets (relative to the data start,
    aligned to 8 bytes).

    The algorithm is as follows:
    - track_instruction: get the static source and destination operands of the instruction
    - track_memory_access: get dynamic source and destination memory addresses
    - taint: collect the labels (register names or mem. addresses) that are
      exposed by this instruction in the contract trace
    - _finalize_instruction (called implicitly when the next instruction starts, on
      checkpoint/rollback, and in get_taint):
      1. propagate the dependencies of the source operands to the destination operands
      2. update the list of tainted labels with the dependencies of the labels
         collected by taint
    - get_taint: produce an InputTaint object based on the all tainted labels
    """
    _enable_tracking: bool = True
    _tracking_in_progress: bool = False

    _initial_observations: List[str]
    _data_start: Final[DataAddr]
    _uc_target_desc: Final[UnicornTargetDesc]
    _target_desc: Final[TargetDesc]

    _checkpoints: List[_Dependencies]
    _tainted_labels: Set[str]
    _pending_taint: Set[str]

    _instruction: Optional[_TrackedInstruction] = None
    _dependencies: _Dependencies

    def __init__(self, bases: BaseAddrTuple, target_desc: TargetDesc):
        """
        :param bases: tuple of base addresses; its first element is used as the start of
                      the data area, against which memory accesses are normalized
        :param target_desc: target description; provides the register normalization map,
                            register sizes, and the Unicorn-specific target description
        :raises AssertionError: if CONF.instruction_set is neither x86-64 nor arm64
        """
        assert CONF.instruction_set in ["x86-64", "arm64"], \
               "Taint tracking is only supported for x86_64 and arm64"

        self._data_start = bases[0]
        self._target_desc = target_desc
        self._uc_target_desc = target_desc.uc_target_desc

        # Certain types of contracts have predefined observations
        if CONF.contract_observation_clause in ('ctr', 'arch'):
            if CONF.instruction_set == "x86-64":
                self._initial_observations = _ARCH_INITIAL_OBSERVATIONS_X86_64
            elif CONF.instruction_set == "arm64":
                self._initial_observations = _ARCH_INITIAL_OBSERVATIONS_ARM64
        else:
            self._initial_observations = []

        self.reset()
        # reset() marks the tracking as started; a freshly constructed tracker has not
        # started yet, so that set_enable_tracking() can still be called
        self._tracking_in_progress = False

    # ----------------------------------------------------------------------------------------------
    # State management methods
    def set_enable_tracking(self, enable: bool) -> None:
        """
        Enable or disable the taint tracking
        :param enable: True to enable tracking, False to turn all tracking methods into no-ops
        :raises AssertionError: if called between reset() and get_taint()
        """
        assert self._tracking_in_progress is False, \
            "Cannot change tracking mode before get_taint() is called"
        self._enable_tracking = enable

    def reset(self) -> None:
        """
        Reset the taint tracker to its initial state: no checkpoints, no tracked instruction,
        empty dependencies, and only the predefined observations tainted.
        Also marks the tracking as in progress (until get_taint is called).
        """
        self._checkpoints = []
        self._tainted_labels = set(self._initial_observations)
        self._pending_taint = set()
        self._instruction = None
        self._dependencies = _Dependencies()
        self._tracking_in_progress = True

    def checkpoint(self, include_current_inst: bool) -> None:
        """
        Save the current state of the taint tracker
        :param include_current_inst: if True, include the current instruction in the checkpoint
        """
        if not self._enable_tracking:
            return

        if include_current_inst and self._instruction is not None:
            self._finalize_instruction()
        # store a private copy, so that later propagation does not modify the checkpoint
        self._checkpoints.append(copy.deepcopy(self._dependencies))

    def rollback(self) -> None:
        """
        Restore the state of the taint tracker from the top-most checkpoint.
        Only the dependencies are restored; the labels that were already tainted stay tainted.
        :raises AssertionError: if there are no more checkpoints
        """
        if not self._enable_tracking:
            return

        assert self._checkpoints, "There are no more checkpoints"
        if self._instruction is not None:
            self._finalize_instruction()
        # The popped checkpoint is a private deep copy created by checkpoint() and it is no
        # longer referenced by the stack, so it can be adopted without copying it again
        self._dependencies = self._checkpoints.pop()

    # ----------------------------------------------------------------------------------------------
    # Dependency propagation methods
    def track_instruction(self, instruction: Instruction) -> None:
        """
        Parse instruction and record its static source and destination operands.
        Static means the operands that we can identify without executing the instruction.
        The remaining dynamic operands are collected by track_* methods.
        :param instruction: the instruction to be parsed
        """
        if not self._enable_tracking:
            return

        # make sure that the previous instruction is finalized
        if self._instruction:
            self._finalize_instruction()

        # restart the tracking
        self._instruction = _TrackedInstruction(instruction)
        self._instruction.parse_static_operands(self._target_desc.reg_normalized)
        self._pending_taint = set()

        # overwrite stale flag dependencies
        # FIXME: this feels like it should be in _finalize_instruction?
        flag_op = self._instruction.inst.get_flags_operand()
        if flag_op:
            for flag_label in flag_op.get_flags_by_type('overwrite'):
                self._dependencies.flag[flag_label] = {flag_label}

    def track_memory_access(self, address: int, size: int, is_write: bool) -> None:
        """
        Add the address of the memory access to the list of current instruction dependencies
        :param address: the address of the memory access
        :param size: the size of the memory access
        :param is_write: True if the memory access is a write (store), False if it's a read (load)
        :raises AssertionError: if called before track_instruction
        """
        if not self._enable_tracking:
            return

        assert self._instruction, "track_memory_access called before track_instruction"

        # mask the address - we taint at the granularity of 8 bytes
        address -= self._data_start
        masked_start_addr = address & 0xffff_ffff_ffff_fff8
        end_addr = address + (size - 1)
        masked_end_addr = end_addr & 0xffff_ffff_ffff_fff8

        # add all addresses to tracking
        # (an access that crosses an 8-byte boundary contributes several labels)
        for i in range(masked_start_addr, masked_end_addr + 1, 8):
            if is_write:
                self._instruction.dest_mems.add(hex(i))
            else:
                self._instruction.src_mems.add(hex(i))

    def _finalize_instruction(self) -> None:
        """
        Propagate dependencies and record the taints of the tracked instruction
        :raises AssertionError: if called before track_instruction
        """
        assert self._instruction, "_finalize_instruction called before track_instruction"
        inst = self._instruction.inst
        inst_name = inst.name.lower()

        # Extract dependencies of the tracked instruction
        self._dependencies.add_dependencies(self._instruction)

        # Workaround for REP instructions with implicit RCX dependency
        if self._pending_taint and "rep" in inst_name and "C" in self._instruction.src_regs:
            self._pending_taint.add('C')

        # Update taints: a pending label taints everything it depends on;
        # a label without recorded dependencies taints only itself
        for label in self._pending_taint:
            if label.startswith("0x"):
                tainted_values = self._dependencies.mem.get(label, {label})
            else:
                tainted_values = self._dependencies.reg.get(label, {label})
            self._tainted_labels.update(tainted_values)

        # Clear the dependencies of the overwritten registers
        # NOTE: this must be done *after* the taint update, or the taints will be lost
        self._dependencies.remove_overwritten_dependencies(self._instruction, self._target_desc)

        # Reset the instruction
        self._instruction = None

    # ----------------------------------------------------------------------------------------------
    # Tainting callback
    def taint(self, value_type: TAINTED_VALUE_TYPE) -> None:
        """
        Taint the operands of a given type for the tracked instruction
        (tracked instruction is the last instruction on which track_instruction was called).
        The taint is only recorded as pending here; it is applied when the instruction
        is finalized. The call is ignored if no instruction is being tracked.

        :param value_type: the type of the value to be tainted
        """
        if not self._enable_tracking:
            return

        if not self._instruction:
            return

        # Taint the program counter
        if value_type == "pc":
            if self._instruction.inst.is_control_flow:
                self._pending_taint.add("RIP")
            return

        # Taint the memory addresses accessed by the instruction
        if value_type == "mem":
            for reg in self._instruction.mem_address_regs:
                self._pending_taint.add(reg)
            return

        # Taint the loaded value
        if value_type == "ld_val":
            for addr in self._instruction.src_mems:
                self._pending_taint.add(addr)
            return
        assert_never(value_type)

    def taint_actors(self, actor_ids: List[int]) -> None:
        """
        Taint all the memory addresses of the actors in the list
        (applied immediately, regardless of whether the tracking is enabled)
        :param actor_ids: the list of actor IDs
        """
        data_size_per_actor = SandboxLayout.data_size_per_actor()
        for actor_id in actor_ids:
            actor_offset = actor_id * data_size_per_actor
            for i in range(actor_offset, actor_offset + data_size_per_actor, 8):
                self._tainted_labels.add(hex(i))

    # ----------------------------------------------------------------------------------------------
    # Taint output
    def get_taint(self, n_actors: int) -> InputTaint:
        """
        Produce an InputTaint object based on the taints collected during
        the model execution. Also marks the tracking as no longer in progress.
        :param n_actors: the number of actors in the test case
        :return: an InputTaint object; it is left untouched (as constructed) if the
                 tracking is disabled
        """
        # pylint: disable=too-many-locals
        # NOTE: justified, because we have many variable that define area boundaries

        if not self._enable_tracking:
            self._tracking_in_progress = False
            return InputTaint(n_actors)

        if self._instruction:
            self._finalize_instruction()

        taint = InputTaint(n_actors)
        tainted_sandbox_addresses: List[int] = []
        register_start = SandboxLayout.data_area_offset(DataArea.GPR)
        simd_start = SandboxLayout.data_area_offset(DataArea.SIMD)

        # Translate every tainted label into the sandbox address(es) of the 8-byte
        # blocks that hold its initial value
        for label in self._tainted_labels:
            # Memory address
            if label.startswith('0x'):
                sandbox_address = int(label, 16)
                tainted_sandbox_addresses.append(sandbox_address)
                continue

            # Register
            reg = self._uc_target_desc.reg_norm_to_constant[label]
            registers = self._uc_target_desc.usable_registers
            if reg in registers:
                sandbox_address = register_start + registers.index(reg) * 8
                tainted_sandbox_addresses.append(sandbox_address)
                continue

            # SIMD register: 16 bytes wide, i.e., it spans two 8-byte blocks
            simd_registers = self._uc_target_desc.usable_simd128_registers
            if reg in simd_registers:
                sandbox_address = simd_start + simd_registers.index(reg) * 16
                tainted_sandbox_addresses.append(sandbox_address)
                # the upper half starts 8 bytes after the lower half
                # (an offset of 1 would fall into the same 8-byte block as the lower half)
                tainted_sandbox_addresses.append(sandbox_address + 8)
            # labels that map to neither a usable GPR nor a usable SIMD register are ignored

        tainted_sandbox_addresses.sort()
        taint_offsets = [
            InputTaint.taint_offset_from_sandbox_address(pos) for pos in tainted_sandbox_addresses
        ]

        # Split the offsets by actor and make them relative to the start of the actor's area
        for actor_id in range(0, n_actors):
            actor_area_start = actor_id * InputTaint.per_actor_taint_size
            actor_area_end = (actor_id + 1) * InputTaint.per_actor_taint_size
            actor_taints = [
                pos - actor_area_start
                for pos in taint_offsets
                if actor_area_start <= pos < actor_area_end
            ]
            taint.taint_actor_offsets(actor_id, actor_taints)

        self._tracking_in_progress = False
        return taint


# ==================================================================================================
# Private: Service Classes
# ==================================================================================================
class _TrackedInstruction:
    """
    Private container for the operands of the instruction that is currently tracked:
    source/destination registers, flags and memory labels, as well as the registers
    that are used to compute memory addresses.
    """

    def __init__(self, instruction: Instruction) -> None:
        self.inst = instruction

        # registers (normalized names)
        self.src_regs: Set[str] = set()
        self.dest_regs: Set[str] = set()

        # flags
        self.src_flags: Set[str] = set()
        self.dest_flags: Set[str] = set()

        # memory labels; not filled in by parse_static_operands
        self.src_mems: Set[str] = set()
        self.dest_mems: Set[str] = set()

        # registers that appear in the address expressions of memory operands
        self.mem_address_regs: Set[str] = set()

    @staticmethod
    def _address_registers(expression: str, reg_normalizer: Dict[str, str]) -> Set[str]:
        """
        Extract the normalized names of the registers used in an address expression.
        :param expression: textual value of a memory or address-generation operand
        :param reg_normalizer: a dictionary that maps register names to their normalized names
        :return: normalized names of all tokens of the expression that are known registers
        """
        tokens = re.split(r'\+|-|\*| ', expression)
        return {reg_normalizer[token] for token in tokens if token and token in reg_normalizer}

    def parse_static_operands(self, reg_normalizer: Dict[str, str]) -> None:
        """
        Populate the source and destination operand sets from the operands of the instruction.
        :param reg_normalizer: a dictionary that maps register names to their normalized names
        :return: None
        """
        for operand in self.inst.get_all_operands():
            if isinstance(operand, RegisterOp):
                # Registers: record the normalized name as a source and/or a destination
                normalized = reg_normalizer[operand.value]
                if operand.src:
                    self.src_regs.add(normalized)
                if operand.dest:
                    self.dest_regs.add(normalized)
            elif isinstance(operand, FlagsOp):
                # Flags: read and undefined flags are sources; written flags are destinations
                self.src_flags = set(operand.get_flags_by_type('read')) \
                    | set(operand.get_flags_by_type('undef'))
                self.dest_flags = set(operand.get_flags_by_type('write'))
            elif isinstance(operand, MemoryOp):
                # Memory: record the registers that form the address
                self.mem_address_regs.update(
                    self._address_registers(operand.value, reg_normalizer))
            elif isinstance(operand, AgenOp):
                # LEA operand: the address registers are plain sources,
                # because no memory access takes place
                self.src_regs.update(self._address_registers(operand.value, reg_normalizer))
            elif isinstance(operand, (ImmediateOp, LabelOp, CondOp)):
                # Immediate, Label, and Condition: nothing to record
                pass
            else:
                assert_never(operand)


class _Dependencies:
    """
    A private data class that tracks all dependencies collected by UnicornTaintTracker.

    Each of the three tables (reg, flag, mem) maps a label to the set of labels
    that it depends on.
    """
    # Source dependencies computed by the latest add_dependencies call;
    # consumed (and reset to None) by remove_overwritten_dependencies
    _cached_src_dependencies: Optional[Set[str]]

    def __init__(self) -> None:
        self.reg: Dict[str, Set[str]] = {}
        self.flag: Dict[str, Set[str]] = {}
        self.mem: Dict[str, Set[str]] = {}
        # must be initialized here; otherwise, calling remove_overwritten_dependencies
        # first would fail with an AttributeError instead of the intended assertion
        self._cached_src_dependencies = None

    def add_dependencies(self, tracked_inst: _TrackedInstruction) -> None:
        """
        Update the dependencies with the source and destination operands of the tracked instruction
        :param tracked_inst: the instruction whose operands have been collected
        """

        # Get dependencies of the source operands
        # (a source without recorded dependencies depends only on itself)
        src_dependencies: Set[str] = set()
        for reg in tracked_inst.src_regs:
            src_dependencies.update(self.reg.get(reg, {reg}))
        for flag in tracked_inst.src_flags:
            src_dependencies.update(self.flag.get(flag, {flag}))
        for addr in tracked_inst.src_mems:
            src_dependencies.update(self.mem.get(addr, {addr}))
        self._cached_src_dependencies = src_dependencies

        # Propagate source dependencies to destination operands
        self._propagate(self.reg, tracked_inst.dest_regs, src_dependencies)
        self._propagate(self.flag, tracked_inst.dest_flags, src_dependencies)
        self._propagate(self.mem, tracked_inst.dest_mems, src_dependencies)

    @staticmethod
    def _propagate(table: Dict[str, Set[str]], dest_labels: Set[str],
                   src_dependencies: Set[str]) -> None:
        """
        Add the source dependencies to every destination label in the given table.
        A label that is not in the table yet starts with a dependency on itself.
        """
        for label in dest_labels:
            if label in table:
                table[label].update(src_dependencies)
            else:
                # build a fresh set, so that the entries never alias the cached source set
                table[label] = {*src_dependencies, label}

    def remove_overwritten_dependencies(self, tracked_inst: _TrackedInstruction,
                                        target_desc: TargetDesc) -> None:
        """
        Remove the dependencies of the destination operands of the tracked instruction
        :param tracked_inst: the instruction that was last passed to add_dependencies
        :param target_desc: target description; used to look up the register sizes
        :raises AssertionError: if not preceded by a call to add_dependencies
        """
        assert self._cached_src_dependencies is not None, \
            "remove_overwritten_dependencies must be called after add_dependencies"
        src_dependencies = self._cached_src_dependencies
        self._cached_src_dependencies = None

        # Identify if the instruction overrides previous dependencies
        # (so far we consider only two such case: MOV and LEA)
        # FIXME: this is an x86-specific implementation and it should be moved to the x86 model
        inst_name = tracked_inst.inst.name.lower()
        if not (inst_name.startswith("mov") or inst_name == "lea"):
            return
        if len(tracked_inst.dest_regs) != 1:
            return
        # only destinations that are registered as 64-bit wide count as a complete overwrite
        dest_operand_name = tracked_inst.inst.get_reg_operands(True)[0].value
        if target_desc.register_sizes.get(dest_operand_name, 0) != 64:
            return

        # The instruction overrides previous dependencies: keep only those that
        # come from the sources of this instruction.
        # The set is read without pop(), so that the caller's object is not modified.
        (reg,) = tracked_inst.dest_regs
        self.reg[reg].intersection_update(src_dependencies)


================================================
FILE: rvzr/model_unicorn/tracer.py
================================================
"""
File: Collection of tracers for the Unicorn backend to the contract model.

      A tracer is a component that records certain events during the execution of a
      test case on the contract model. As such, the tracers implement
      observation clauses of different contracts.

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from __future__ import annotations
from abc import ABC

from typing import List, TYPE_CHECKING, Optional
from unicorn import UC_MEM_READ
import xxhash

from ..traces import CTrace, CTraceEntry
from ..config import CONF

if TYPE_CHECKING:
    from .model import UnicornModel
    from .taint_tracker import UnicornTaintTracker
    from ..target_desc import TargetDesc, UnicornTargetDesc
    from ..tc_components.test_case_data import InputData
    from ..tc_components.test_case_code import TestCaseProgram


# ==================================================================================================
# Abstract Tracer Interface
# ==================================================================================================
class UnicornTracer(ABC):
    """
    Base class of all tracers: defines the interface that the concrete tracers
    implement and provides the functionality shared by them.
    """
    trace: List[CTraceEntry]
    enable_tracing: bool = False
    _model: UnicornModel
    _taint_tracker: UnicornTaintTracker
    _uc_target_desc: UnicornTargetDesc
    _test_case: Optional[TestCaseProgram] = None
    _input: Optional[InputData] = None

    def __init__(self, target_desc: TargetDesc, model: UnicornModel,
                 taint_tracker: UnicornTaintTracker) -> None:
        super().__init__()
        self._uc_target_desc = target_desc.uc_target_desc
        self._taint_tracker = taint_tracker
        self._model = model
        self.trace = []

    # ==============================================================================================
    # Public Interface
    def load_test_case(self, test_case: TestCaseProgram) -> None:
        """ Remember the test case that is going to be traced """
        self._test_case = test_case

    def reset(self, input_: InputData) -> None:
        """
        Prepare the tracer for tracing the loaded test case with the given input:
        the collected trace is dropped and the tracing is switched off
        :param input_: the input that the test case will be executed with
        """
        self._input = input_
        self.enable_tracing = False
        self.trace = []

    def get_trace(self) -> CTrace:
        """
        Build a CTrace object from the collected entries.
        To make the trace reproducible, "pc" and "mem" values are converted into offsets
        via the model layout; entries of other types are copied unchanged.
        """
        layout = self._model.layout
        normalizers = {
            "pc": layout.code_addr_to_offset,
            "mem": layout.data_addr_to_offset,
        }

        normalized_trace: List[CTraceEntry] = []
        for raw_entry in self.trace:
            normalize = normalizers.get(raw_entry.type_)
            value = raw_entry.value if normalize is None else normalize(raw_entry.value)
            normalized_trace.append(CTraceEntry(raw_entry.type_, value))
        return CTrace(normalized_trace)

    def observe_mem_access(self, access: int, address: int, size: int, value: int) -> None:
        """
        Hook for a memory access; the base implementation records nothing.
        Whether (and what) is recorded on the trace is decided by the tracer implementation.
        :param access: type of access (UC_MEM_READ, UC_MEM_WRITE)
        :param address: address of the memory access
        :param size: size of the memory access
        :param value: value read or written
        """

    def observe_instruction(self, pc: int, size: int) -> None:
        """
        Hook for an instruction; the base implementation records nothing.
        Whether (and what) is recorded on the trace is decided by the tracer implementation.
        :param pc: program counter of the instruction
        :param size: size of the instruction
        """

    # ==============================================================================================
    # Private Methods

    def _add_mem_address_to_trace(self, address: int) -> None:
        """ If tracing is enabled, append a "mem" entry and taint the memory address """
        if not self.enable_tracing:
            return
        self.trace.append(CTraceEntry("mem", address))
        self._taint_tracker.taint("mem")

    def _add_pc_to_trace(self, address: int) -> None:
        """ If tracing is enabled, append a "pc" entry and taint the program counter """
        if not self.enable_tracing:
            return
        self.trace.append(CTraceEntry("pc", address))
        self._taint_tracker.taint("pc")

    def _add_dependencies_to_trace(self, dependency_hash: int) -> None:
        """ If tracing is enabled, append the hash as a "val" entry and taint "mem" """
        if not self.enable_tracing:
            return
        self.trace.append(CTraceEntry("val", dependency_hash))
        self._taint_tracker.taint("mem")

    def _add_value_to_trace(self, val: int) -> None:
        """ If tracing is enabled, append an untyped ("val") entry; nothing is tainted """
        if not self.enable_tracing:
            return
        self.trace.append(CTraceEntry("val", val))


# ==================================================================================================
# Concrete Tracers
# ==================================================================================================
class NoneTracer(UnicornTracer):
    """
    A tracer that records nothing and always produces an empty trace.
    Serves as a placeholder when a test case has to run on the model without tracing.
    """

    def observe_mem_access(self, access: int, address: int, size: int, value: int) -> None:
        # memory accesses are deliberately ignored
        return None

    def observe_instruction(self, pc: int, size: int) -> None:
        # instructions are deliberately ignored
        return None

    def get_trace(self) -> CTrace:
        return CTrace.empty_trace()


class PCTracer(UnicornTracer):
    """
    Tracer that exposes the program counter of every instruction observed on the model.

    E.g., if the following program is executed:
        0x0: mov eax, 0x1
        0x4: mov ebx, 0x2
        0x8: mov ecx, 0x3

    The output trace will be [0x0, 0x4, 0x8]
    """

    def observe_instruction(self, pc: int, size: int) -> None:
        # record first, then let the parent class observe the same instruction
        self._add_pc_to_trace(address=pc)
        super().observe_instruction(pc, size)


class MemoryTracer(UnicornTracer):
    """
    Tracer that exposes the address of every memory access observed on the model.

    E.g., if the following program is executed:
        0x0: mov eax, [0x100]
        0x4: mov ebx, [0x200]
        0x8: mov ecx, [0x300]

    The output trace will be [0x100, 0x200, 0x300]
    """

    def observe_mem_access(self, access: int, address: int, size: int, value: int) -> None:
        # record first, then let the parent class observe the same access
        self._add_mem_address_to_trace(address=address)
        super().observe_mem_access(access, address, size, value)


class L1DTracer(MemoryTracer):
    """
    A MemoryTracer whose traces are marked as L1D traces, so that they are
    printed as L1D maps.
    """

    def get_trace(self) -> CTrace:
        l1d_trace = super().get_trace()
        # only the printing mode is changed; the entries are those of MemoryTracer
        l1d_trace.set_printed_as_l1d(True)
        return l1d_trace


class CTTracer(PCTracer):
    """
    Exposes the addresses of memory accesses in addition to
    the program counter (which is inherited from PCTracer).
    """

    def observe_mem_access(self, access: int, address: int, size: int, value: int) -> None:
        # record first, then let the parent class observe the same access
        self._add_mem_address_to_trace(address=address)
        super().observe_mem_access(access, address, size, value)


class TruncatedCTTracer(UnicornTracer):
    """
    Exposes the memory access addresses and the program counter with the lowest six bits
    cleared, i.e., at the granularity of 64 bytes (cache line granularity).
    """

    def observe_mem_access(self, access: int, address: int, size: int, value: int) -> None:
        line_address = address & ~0x3f  # clear the offset within the 64-byte line
        self._add_mem_address_to_trace(line_address)
        super().observe_mem_access(access, address, size, value)

    def observe_instruction(self, pc: int, size: int) -> None:
        line_address = pc & ~0x3f  # clear the offset within the 64-byte line
        self._add_pc_to_trace(line_address)
        super().observe_instruction(pc, size)


class TruncatedCTWithOverflowsTracer(UnicornTracer):
    """
    Observe address of the memory access and of the program counter at cache line granularity
    (64 bytes) + observe cache line overflows.

    An overflow is reported as an additional trace entry with the address of the cache line
    that contains `address + size` (or `pc + size`), if it differs from the first line.
    """

    def observe_mem_access(self, access: int, address: int, size: int, value: int) -> None:
        first_line = (address >> 6) << 6
        self._add_mem_address_to_trace(first_line)

        # Add overflows to the trace.
        # The cache line *indexes* are compared, the same way as in observe_instruction;
        # comparing the offsets within the line (% 64) would report an overflow for nearly
        # every access and would miss the overflows of accesses whose size is a multiple of 64
        # NOTE(review): `address + size` is one past the last accessed byte, hence an access
        # that ends exactly at the line boundary is reported as an overflow - confirm the intent
        end_line = ((address + size) >> 6) << 6
        if end_line != first_line:
            self._add_mem_address_to_trace(end_line)
        return super().observe_mem_access(access, address, size, value)

    def observe_instruction(self, pc: int, size: int) -> None:
        first_line = (pc >> 6) << 6
        self._add_pc_to_trace(first_line)

        # add overflows to the trace
        end_line = ((pc + size) >> 6) << 6
        if end_line != first_line:
            self._add_pc_to_trace(end_line)
        return super().observe_instruction(pc, size)


class CTNonSpecStoreTracer(PCTracer):
    """
    Exposes the program counter (inherited from PCTracer) and the addresses of
    memory accesses, except for the non-read accesses made during speculation.
    """

    def observe_mem_access(self, access: int, address: int, size: int, value: int) -> None:
        # everything is traced but the speculative accesses that are not loads
        hidden = self._model.speculator.in_speculation() and access != UC_MEM_READ
        if not hidden:
            self._add_mem_address_to_trace(address)
        super().observe_mem_access(access, address, size, value)


class ArchTracer(CTTracer):
    """
    Similar to CTTracer, with additional exposure of:
     - Register state at the first instruction observed after a reset
     - The values loaded from memory

    The main use case of this tracer is to model the guarantees provided by secure speculation
    mechanisms, such as Speculative Taint Tracking (STT).
    """
    # set once the register values have been exposed; cleared by reset()
    _started: bool = False

    def reset(self, input_: InputData) -> None:
        super().reset(input_)
        self._started = False

    def observe_instruction(self, pc: int, size: int) -> None:
        first_instruction = not self._started
        if first_instruction:
            # Expose all register values, except for the last usable register
            # (the stack pointer). The entries are appended to the trace directly,
            # i.e., independently of the enable_tracing flag
            self._started = True
            exposed_registers = self._uc_target_desc.usable_registers[:-1]
            for reg in exposed_registers:
                val = self._model.emulator.reg_read(reg)
                assert isinstance(val, int), f"Expected int, got {type(val)}"
                self.trace.append(CTraceEntry("val", val))

        return super().observe_instruction(pc, size)

    def observe_mem_access(self, access: int, address: int, size: int, value: int) -> None:
        if access == UC_MEM_READ:
            # expose the loaded value: it is read from the emulator memory and
            # recorded before the parent class records the address
            loaded_bytes = self._model.emulator.mem_read(address, size)
            self._add_value_to_trace(int.from_bytes(loaded_bytes, byteorder='little'))
            self._taint_tracker.taint("ld_val")
        super().observe_mem_access(access, address, size, value)


# ==================================================================================================
# Actor-based Tracers
# ==================================================================================================
class ActorNITracer(CTTracer):
    """
    Tracer that exposes all data that belongs to the actors with `observer` flag set
    + the CTTracer trace of the execution.
    """
    # IDs of the observer actors of the loaded test case; assigned in reset()
    _observer_actor_ids: List[int]

    def __init__(self, target_desc: TargetDesc, model: UnicornModel,
                 taint_tracker: UnicornTaintTracker) -> None:
        """
        :raises ValueError: if the configuration has no non-observer actor or no observer actor
        """
        super().__init__(target_desc, model, taint_tracker)
        actors_conf = CONF.get_actors_conf()
        n_observers = sum(1 for desc in actors_conf.values() if desc['observer'])
        if n_observers == len(actors_conf):
            raise ValueError("ActorNITracer requires at least 1 non-observer actor")
        if n_observers == 0:
            raise ValueError("ActorNITracer requires at least 1 observer actor")

    def reset(self, input_: InputData) -> None:
        super().reset(input_)
        assert self._test_case is not None, "Test case not loaded"
        observers = (actor for actor in self._test_case.get_actors() if actor.observer)
        self._observer_actor_ids = [actor.get_id() for actor in observers]

    def get_trace(self) -> CTrace:
        # the base trace, extended with the hashes of the observers' input fragments
        extended_trace = self._add_observer_traces(super().get_trace())
        # the complete data of the observer actors is exposed, thus all of it is tainted
        self._taint_tracker.taint_actors(self._observer_actor_ids)
        return extended_trace

    def _add_observer_traces(self, ctrace: CTrace) -> CTrace:
        """
        Create a new trace: the entries of the given trace followed by one "val" entry per
        observer actor, holding the xxh64 hash (seed 0) of the actor's input fragment.
        """
        assert self._input is not None, "Input not loaded"
        input_data = self._input
        fragment_hashes: List[CTraceEntry] = [
            CTraceEntry("val", xxhash.xxh64(input_data[actor_id].tobytes(), seed=0).intdigest())
            for actor_id in self._observer_actor_ids
        ]
        return CTrace(ctrace.get_typed() + fragment_hashes)


================================================
FILE: rvzr/postprocessing/__init__.py
================================================


================================================
FILE: rvzr/postprocessing/analysis_passes.py
================================================
""" File: Collection of minimization passes that analyse the test case without modifying it.

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from __future__ import annotations

from typing import TYPE_CHECKING, List
from typing_extensions import assert_never

from ..model_unicorn import model as uc_model, speculators_basic as uc_speculator, \
    tracer as uc_tracer, interpreter as uc_interpreter
from ..sandbox import CodeArea
from ..arch.x86.target_desc import X86TargetDesc
from ..arch.arm64.target_desc import ARM64TargetDesc
from ..config import CONF

from .instruction_passes import BaseInstructionMinimizationPass

if TYPE_CHECKING:
    from ..traces import Violation, CTraceEntry
    from ..tc_components.test_case_data import InputData
    from ..tc_components.test_case_code import TestCaseProgram
    from ..target_desc import TargetDesc


def _get_seq_model(data_start: int, code_start: int) -> uc_model.UnicornModel:
    """
    Create a Unicorn model for the configured instruction set that uses
    the sequential speculator (SeqSpeculator) and the CT tracer (CTTracer).

    This partially duplicates the code in factory.py,
    which cannot be imported here because of circular imports.

    :param data_start: Base address passed to the model as the first element of its bases
    :param code_start: Base address passed to the model as the second element of its bases
    :return: The constructed model
    """
    model_cls: type[uc_model.UnicornModel]
    target_desc: TargetDesc
    interpreter: type[uc_interpreter.ExtraInterpreter]

    # Pick the ISA-specific components
    isa = CONF.instruction_set
    if isa == "arm64":
        model_cls = uc_model.ARM64UnicornModel
        target_desc = ARM64TargetDesc()
        interpreter = uc_interpreter.ARMExtraInterpreter
    elif isa == "x86-64":
        model_cls = uc_model.X86UnicornModel
        target_desc = X86TargetDesc()
        interpreter = uc_interpreter.X86ExtraInterpreter
    else:
        assert_never(isa)

    return model_cls((data_start, code_start), target_desc, uc_speculator.SeqSpeculator,
                     uc_tracer.CTTracer, interpreter)


class AddViolationCommentsPass(BaseInstructionMinimizationPass):
    """
    An instrumentation pass that iterates over the test case and adds comments
    with the memory addresses of the loads and stores that caused the violation.

    The pass rewrites the assembly file of the test case in place; the returned
    test case object is the one that was passed in.
    """
    name = "Violation Comment Insertion"
    violation: Violation

    def set_violation(self, violation: Violation) -> None:
        """ Store the violation whose first two measurements are annotated by `run` """
        self.violation = violation

    def run(self, test_case: TestCaseProgram, inputs: List[InputData]) -> TestCaseProgram:
        """
        Trace the first two violating inputs on a sequential model and append, after every
        assembly line that accessed memory in both traces, a comment with the accessed addresses.

        :param test_case: The test case whose assembly file is annotated in place
        :param inputs: Unused; the inputs are taken from the stored violation instead
        :return: The unchanged `test_case` object
        """
        # pylint: disable=too-many-locals

        # only the first two measurements of the violation are annotated
        measurements = self.violation.measurements[:2]
        v_inputs = [m.input_ for m in measurements]
        v_input_ids = [m.input_id for m in measurements]

        # create a model that will collect PC and memory traces
        data_start, code_start = 0x2000000, 0x1000000
        model = _get_seq_model(data_start, code_start)

        # collect traces
        model.tracer.enable_tracing = True  # start tracing from the very beginning
        model.load_test_case(test_case)
        ctraces = model.trace_test_case(v_inputs, 30)

        # select loads and stores from the traces (one PC -> addresses map per input)
        ctrace_maps = [self._map_pcs_to_accesses(t.get_typed()) for t in ctraces]

        # get the contents of the asm file
        with open(test_case.asm_path(), "r") as f:
            lines = f.readlines()

        line_num_to_pc = self._map_lines_to_pcs(test_case, model, code_start)

        # add a comment with the load/store addresses to the assembly
        # NOTE(review): file lines are indexed from 0 here; confirm that this matches
        # the numbering convention of `inst.line_num()`
        with open(test_case.asm_path(), 'w') as f:
            for line_num, line in enumerate(lines):
                f.write(line)
                if line_num not in line_num_to_pc:
                    continue
                pc = line_num_to_pc[line_num]
                if pc not in ctrace_maps[0] or pc not in ctrace_maps[1]:
                    continue

                accesses = [ctrace_maps[k][pc] for k in range(2)]
                f.write(self._format_access_comment(v_input_ids, accesses))

                # NOTE(review): 0xff8 presumably marks an access caused by an exception;
                # the meaning of this constant is not visible in this module
                if any(st == 0xff8 for _, st in accesses):
                    f.write(f"{self._comment_symbol} exception?\n")

        return test_case

    @staticmethod
    def _map_pcs_to_accesses(ctrace: List[CTraceEntry]) -> dict[int, tuple[int, int]]:
        """
        Map every 'pc' entry that is directly followed by a 'mem' entry to a pair
        (first address, second address); the second address is 0 if the entry after
        the first 'mem' entry is missing or is not a 'mem' entry.
        If a PC occurs several times, the last occurrence wins.
        """
        accesses: dict[int, tuple[int, int]] = {}
        n_entries = len(ctrace)
        for idx in range(n_entries - 1):
            pc_entry, first_mem = ctrace[idx], ctrace[idx + 1]
            if pc_entry.type_ != 'pc' or first_mem.type_ != 'mem':
                continue
            # the look-ahead entry is optional, so a (pc, mem) pair
            # at the very end of the trace is still recorded
            second = ctrace[idx + 2] if idx + 2 < n_entries else None
            st_addr = second.value if second is not None and second.type_ == 'mem' else 0
            accesses[pc_entry.value] = (first_mem.value, st_addr)
        return accesses

    @staticmethod
    def _map_lines_to_pcs(test_case: TestCaseProgram, model: uc_model.UnicornModel,
                          code_start: int) -> dict[int, int]:
        """
        Build a dictionary mapping assembly line numbers to PCs (relative to `code_start`).
        Instructions whose line number is 0 are left out.
        """
        line_num_to_pc: dict[int, int] = {}
        for func in test_case.iter_functions():
            actor_id = func.get_owner().get_id()
            actor_start_pc = model.layout.get_code_addr(CodeArea.MAIN, actor_id)
            for bb in func:
                for inst in list(bb) + bb.terminators:
                    line_num = inst.line_num()
                    if line_num != 0:
                        line_num_to_pc[line_num] = \
                            actor_start_pc + inst.section_offset() - code_start
        return line_num_to_pc

    def _format_access_comment(self, input_ids: List[int],
                               accesses: List[tuple[int, int]]) -> str:
        """
        Format the comment line for one instruction.
        For each input, the comment lists the input ID, the first accessed address
        (plus the second one if any of the inputs has a non-zero second address),
        and the position of the first address within a 0x1000-byte window,
        split into a 64-byte-granular index ("CL") and the offset inside it.
        """
        with_second = any(st != 0 for _, st in accesses)
        parts = []
        for input_id, (ld, st) in zip(input_ids, accesses):
            cl = (ld % 0x1000) // 64
            of = (ld % 0x1000) % 64
            addr = f"{hex(ld)}-{hex(st)}" if with_second else hex(ld)
            parts.append(f"[{input_id}] {addr} CL {cl}:{of}")
        return f"{self._comment_symbol} mem access: " + " | ".join(parts) + "\n"

    def modify_instruction(self, _: List[str], __: int) -> List[str]:
        return []  # unused

    def verify_modification(self, _: TestCaseProgram, __: List[InputData]) -> bool:
        return True  # unused


================================================
FILE: rvzr/postprocessing/input_passes.py
================================================
"""
File: Collection of minimization passes that operate on the test case input data.

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from __future__ import annotations

import abc
from copy import deepcopy
from math import log2

from typing import TYPE_CHECKING, List, Final, Optional, Tuple

from .pass_abc import BaseMinimizationPass
from ..config import CONF

if TYPE_CHECKING:
    from ..traces import Violation
    from ..tc_components.test_case_code import TestCaseProgram
    from ..tc_components.test_case_data import InputData

_PER_ACTOR_INPUT_SIZE: Final[int] = 0x4000  # 16 KB per actor
_PRINT_BLOCK_SIZE: Final[int] = 8  # print progress indicator in 8-byte blocks
_PRINT_LINE_SIZE: Final[int] = 64  # print progress indicator in (64 * 8)-byte lines
_MAX_BLOCK_SIZE: Final[int] = 64  # try to zero out up to 64 bytes at once


class BaseInputMinimizationPass(BaseMinimizationPass):
    """
    Base class for a minimization pass that operates on inputs.

    Subclasses implement `run`, which receives the test case, the inputs, and
    the original violation, and returns the minimized list of inputs.
    """

    @abc.abstractmethod
    def run(self, test_case: TestCaseProgram, org_inputs: List[InputData],
            org_violation: Violation) -> List[InputData]:
        """ Main function that runs the minimization pass
        :param test_case: The test case object to work on
        :param org_inputs: List of inputs to minimize
        :param org_violation: The original violation
        :return: List of minimized inputs
        """


class InputSequenceMinimizationPass(BaseInputMinimizationPass):
    """
    A minimization pass that iteratively removes inputs from the violating input sequence
    and checks if the violation is still triggered.
    """
    name = "Input Sequence Minimization"

    def run(self, test_case: TestCaseProgram, org_inputs: List[InputData],
            org_violation: Violation) -> List[InputData]:
        """
        Shrink the input sequence in two stages:
          1. repeatedly keep only the first half of the inputs while the violation reproduces
             (stops once 5 or fewer inputs remain);
          2. with boosting disabled, try to drop inputs one at a time, from the last one to
             the first one, for up to 10 sweeps or until a sweep removes nothing.

        :param test_case: The test case object to work on
        :param org_inputs: List of inputs to minimize
        :param org_violation: The original violation
        :return: The input sequence of the last reproduced violation
        """
        self._progress.pass_msg("Reducing the number of inputs by halving")
        org_len = len(org_inputs)

        violation = org_violation
        nonboosted_inputs = org_inputs
        while len(nonboosted_inputs) > 5:
            new_inputs = nonboosted_inputs[:len(nonboosted_inputs) // 2]
            new_violation = self._fuzzer.fuzzing_round(test_case, new_inputs, [])
            if not new_violation:
                break
            nonboosted_inputs = new_inputs
            violation = new_violation

        if len(nonboosted_inputs) < org_len:
            self._progress.pass_msg(f"Result: Reduced to {len(nonboosted_inputs)} inputs")
        else:
            self._progress.pass_msg("Result: Could not reduce the number of inputs")

        # Get boosted inputs and disable boosting from now on
        inputs = violation.input_sequence
        org_ipc = CONF.inputs_per_class
        CONF.inputs_per_class = 1  # disable boosting from now on

        # The global configuration must be restored even if a fuzzing round raises
        try:
            n_iterations = 10
            self._progress.pass_msg("Reducing the input sequence iteratively")
            for iteration in range(n_iterations):
                self._progress.pass_msg(f"Iteration {iteration + 1}")
                org_len = len(inputs)

                # Walk over valid indices only, from the last input down to the first one.
                # The index stays valid after a removal because only elements at or
                # above the current index are ever dropped.
                for input_id in range(org_len - 1, -1, -1):
                    new_inputs = inputs[:input_id] + inputs[input_id + 1:]
                    if not new_inputs:
                        # an empty sequence cannot reproduce anything; keep the last input
                        self._progress.next(False)
                        continue
                    new_violation = self._fuzzer.fuzzing_round(test_case, new_inputs, [])
                    if not new_violation:
                        self._progress.next(False)
                        continue
                    self._progress.next(True)
                    inputs = new_inputs
                    violation = new_violation
                self._progress.pass_finish()

                # stop early if the whole sweep could not remove a single input
                if len(inputs) == org_len:
                    break
            self._progress.pass_msg(f"Result: Reduced to {len(inputs)} inputs")
        finally:
            CONF.inputs_per_class = org_ipc
        return violation.input_sequence


class DifferentialInputMinimizerPass(BaseInputMinimizationPass):
    """
    A minimization pass that iteratively minimizes the difference between two violating inputs.
    It tries to zero out blocks of decreasing size and checks if the violation is still triggered.
    If this is not possible, it tries to copy the value between the two inputs.

    The inputs of the violation are modified in place while the pass is running.
    Progress is printed to stdout as a map with one character per input element:
      `.` zeroed out, `=` already equal in both inputs, `+` copied between the inputs,
      `^` could not be changed without losing the violation (reported as leaked).
    """
    name = "Differential Input Minimizer"

    # Per-run context; populated by _set_pass_context and cleared by _reset_pass_context.
    # The list-typed attributes are always re-assigned (never mutated) before use,
    # so the class-level defaults are not shared between instances in practice.
    _test_case: Optional[TestCaseProgram] = None
    _inputs: Optional[List[InputData]] = None
    _violating_ids: Optional[Tuple[int, int]] = None
    _local_ignore_list: List[int] = []
    _leaked_addresses: List[int] = []

    def run(self, test_case: TestCaseProgram, _: List[InputData],
            org_violation: Violation) -> List[InputData]:
        """
        Run the pass on the first two violating inputs of `org_violation`.

        :param test_case: The test case object to work on
        :param _: Unused; the inputs are taken from `org_violation.input_sequence`
        :param org_violation: The original violation
        :return: A new list holding the (in-place minimized) inputs of the violation
        """

        # Set the context for this pass
        self._set_pass_context(test_case, org_violation)
        assert self._violating_ids is not None
        self._progress.pass_msg("Minimizing the difference between inputs"
                                f" {self._violating_ids[0]} and {self._violating_ids[1]}")

        # Disable boosting for this pass as we already operate on the boosted inputs
        org_ipc = CONF.inputs_per_class
        CONF.inputs_per_class = 1

        try:
            # Print header for progress output
            print(f'\n{"Address":<11}', end="", flush=True)
            for i in range(0, 64, 8):
                print(f"+0x{i * 8:<6x}", end="", flush=True)

            # Start the pass
            for actor_id in range(len(CONF.get_actors_conf())):
                self._process_actor(actor_id)
            print("")

            # Print summary
            self._progress.pass_msg(f"Result: Leaked {len(self._leaked_addresses)} bytes")
            self._progress.pass_msg(
                f"Addresses: {[hex(addr) for addr in self._leaked_addresses]}")

            # The result list is built before the context is cleared in `finally`
            assert self._inputs is not None
            return list(self._inputs)
        finally:
            # Restore the original configuration and drop the per-run context,
            # even if one of the checks raised
            CONF.inputs_per_class = org_ipc
            self._reset_pass_context()

    def _set_pass_context(self, test_case: TestCaseProgram, org_violation: Violation) -> None:
        """
        Set the context for the minimization pass.
        :param test_case: The test case object to work on
        :param org_violation: The original violation
        :return: None
        """
        # Store the test case and inputs
        self._test_case = test_case
        self._inputs = org_violation.input_sequence

        # For convenience, also store the two inputs to minimize
        # (only the first two measurements of the violation are considered)
        violating_input_ids = [i.input_id for i in org_violation.measurements]
        if len(violating_input_ids) > 2:
            violating_input_ids = violating_input_ids[:2]
        self._violating_ids = (violating_input_ids[0], violating_input_ids[1])

        # Store a list of all other input IDs, which we will ignore during checks
        self._local_ignore_list = [
            i for i in range(len(self._inputs)) if i not in violating_input_ids
        ]

        # Finally, make a list to store all leaked addresses
        self._leaked_addresses = []

    def _reset_pass_context(self) -> None:
        """ Reset the context for the minimization pass. """
        self._test_case = None
        self._inputs = None
        self._violating_ids = None
        self._local_ignore_list = []
        self._leaked_addresses = []

    def _process_actor(self, actor_id: int) -> None:
        """
        Process the input regions of a single actor.
        :param actor_id: The actor ID
        """
        assert self._inputs is not None and self._violating_ids is not None

        # Process all input regions of the actor
        region_offset = 0
        for region_name in ['main', 'faulty', 'gpr', 'simd']:
            # number of elements in the region; addresses below are scaled by 8 per element
            region_size = len(self._inputs[self._violating_ids[0]][actor_id][region_name])

            # Within each region, process all elements
            i = 0
            while i < region_size:
                absolute_address = actor_id * _PER_ACTOR_INPUT_SIZE + region_offset + i * 8

                # Periodically break lines and print spaces for better readability
                if i % _PRINT_LINE_SIZE == 0:
                    print(f"\n0x{absolute_address:08x} ", end="", flush=True)
                elif i % _PRINT_BLOCK_SIZE == 0:
                    print(" ", end="", flush=True)

                # Process the block starting at the current index
                processed_block_size = self._process_block(actor_id, region_name, i, region_size,
                                                           absolute_address)
                i += processed_block_size

            region_offset += region_size * 8

    def _process_block(self, actor_id: int, region_name: str, block_start: int, region_size: int,
                       absolute_address: int) -> int:
        """
        Try to minimize the difference between the two inputs at the given index.

        :param actor_id: The actor whose input fragment is modified
        :param region_name: Name of the region within the actor's input fragment
        :param block_start: Index (within the region) of the first element to process
        :param region_size: Number of elements in the region
        :param absolute_address: Address recorded in the leak list if the element
            at `block_start` cannot be changed
        :return: The number of elements that were processed (size of the zeroed block, or 1)
        """
        assert self._test_case is not None and self._inputs is not None \
               and self._violating_ids is not None
        input_a = self._inputs[self._violating_ids[0]]
        input_b = self._inputs[self._violating_ids[1]]
        # Snapshots used to undo modifications that made the violation disappear
        org_input_a = deepcopy(input_a)
        org_input_b = deepcopy(input_b)

        def _restore_addr(addr: int) -> None:
            input_a[actor_id][region_name][addr] = org_input_a[actor_id][region_name][addr]
            input_b[actor_id][region_name][addr] = org_input_b[actor_id][region_name][addr]

        def _zero_out_block(addr: int) -> int:
            """
            Try to zero out a block of memory and check if the violation is still triggered.
            Start with the largest possible block size and iteratively decrease the block size
            until violation is triggered or the block size is 1.
            :return: The size of the block that was successfully zeroed out, or 1
            """
            assert input_a is not None and input_b is not None and \
                self._test_case is not None and self._inputs is not None

            # Find a suitable starting block size, fulfilling the following criteria:
            #    * the block does not cross the next multiple of _MAX_BLOCK_SIZE elements
            #      (i.e., it covers at most 64 * 8 = 512 bytes)
            block_size: int = _MAX_BLOCK_SIZE - (addr % _MAX_BLOCK_SIZE)
            #    * the block does not overlap with the next region
            block_size = min(block_size, region_size - addr)
            #    * the block size is a power of 2
            block_size = 2**int(log2(block_size))
            #    * addr mod block_size == 0
            while block_size > 1 and addr % block_size != 0:
                block_size //= 2

            # Starting from the determined block size, try to find the largest block
            # such that zeroing out the block still triggers the violation
            while block_size > 1:
                # Try zeroing out the block
                for i in range(block_size):
                    input_a[actor_id][region_name][addr + i] = 0
                    input_b[actor_id][region_name][addr + i] = 0

                # Check if the violation is still triggered
                if self._check_for_violation(self._test_case, self._inputs,
                                             self._local_ignore_list):
                    # If reproduced, we managed to zero out the block; return
                    return block_size

                # If not reproduced, restore the original values and try a smaller block
                for i in range(block_size):
                    _restore_addr(addr + i)
                block_size //= 2

            # If we reach here, we could not zero out a block larger than 1 element
            return 1

        # First, try setting a large block to zero
        block_size = _zero_out_block(block_start)
        if block_size > 1:
            # If reproduced, print one dot per zeroed element, in space-separated groups of 8
            n_full_groups = block_size // 8
            n_leftover = block_size % 8
            if n_leftover > 0:
                print("." * n_leftover, end="", flush=True)
                if n_full_groups > 0:
                    print(" ", end="", flush=True)
            if n_full_groups > 0:
                print(("." * 8 + " ") * (n_full_groups - 1), end="", flush=True)
                print("." * 8, end="", flush=True)
            return block_size

        # try zeroing out a single element
        input_a[actor_id][region_name][block_start] = 0
        input_b[actor_id][region_name][block_start] = 0
        if self._check_for_violation(self._test_case, self._inputs, self._local_ignore_list):
            print(".", end="", flush=True)
            return 1
        _restore_addr(block_start)

        # check if the values are already equal; if so, nothing more to do here
        if input_a[actor_id][region_name][block_start] == \
           input_b[actor_id][region_name][block_start]:
            print("=", end="", flush=True)
            return 1

        # try copying the value from the first input into the second one
        input_a[actor_id][region_name][block_start] = \
            org_input_a[actor_id][region_name][block_start]
        input_b[actor_id][region_name][block_start] = \
            input_a[actor_id][region_name][block_start]
        if self._check_for_violation(self._test_case, self._inputs, self._local_ignore_list):
            print("+", end="", flush=True)
            return 1
        _restore_addr(block_start)

        # if failing, we found a leaked address
        print("^", end="", flush=True)
        self._leaked_addresses.append(absolute_address)
        return 1


================================================
FILE: rvzr/postprocessing/instruction_passes.py
================================================
""" File: Collection of minimization passes that operate on instructions
    (i.e., simplify test case code).

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from __future__ import annotations

import abc
import os
import re
from subprocess import run
from typing import TYPE_CHECKING, List, Dict, Callable
from typing_extensions import assert_never

from .pass_abc import BaseMinimizationPass
from ..logs import warning
from ..config import CONF

if TYPE_CHECKING:
    from ..traces import Violation
    from ..tc_components.test_case_code import TestCaseProgram
    from ..tc_components.test_case_data import InputData
    from ..fuzzer import Fuzzer
    from ..isa_spec import InstructionSet
    from ..postprocessing.progress_printer import ProgressPrinter


class BaseInstructionMinimizationPass(BaseMinimizationPass):
    """
    Base class for a minimization pass that operates on instructions.

    Subclasses define how a single line is modified (`modify_instruction`) and how
    the modified test case is validated (`verify_modification`); `minimization_loop`
    drives these two hooks over the lines of the assembly file.
    """
    name: str = ""

    # ------------------------------------------------
    # Abstract interface
    @abc.abstractmethod
    def run(self, test_case: TestCaseProgram, inputs: List[InputData]) -> TestCaseProgram:
        """ Main function that runs the minimization pass """

    @abc.abstractmethod
    def modify_instruction(self, instructions: List[str], cursor: int) -> List[str]:
        """
        Modify the instruction at the given cursor according to
        the algorithm defined by subclass

        :param instructions: All lines of the assembly file
        :param cursor: Index of the line to modify
        :return: The modified list of lines, or an empty list if the line cannot be modified
        """

    @abc.abstractmethod
    def verify_modification(self, test_case: TestCaseProgram, inputs: List[InputData]) -> bool:
        """
        Verify if the modification made to the test case is valid according to
        the algorithm defined by subclass
        """

    def minimization_loop(self,
                          test_case: TestCaseProgram,
                          inputs: List[InputData],
                          skip_instrumentation_lines: bool = True) -> List[int]:
        """
        Standard minimization loop that iteratively applies the modification
        algorithm (modify_instruction) to each line of the test case and checks if the resulting
        test case still passes the verification function (verify_modification).

        The lines are visited from the last one down to the second one;
        the first line of the file is never modified.

        :param test_case: The test case object to minimize
        :param inputs: List of inputs to use for verification
        :param skip_instrumentation_lines: If True, skip lines with the `instrumentation` comment
        :return List of instruction IDs that passed the verification
        """

        def line_is_skipped(line: str) -> bool:
            """ Check if the (stripped, lower-cased) line must be left untouched """
            if not line:  # empty line
                return True
            return (
                line.startswith(self._comment_symbol)  # comment (symbol may be multi-character)
                or "lfence" in line  # fences
                or line.startswith('.')  # labels
                or 'noremove' in line  # explicitly marked as non-removable
                or (skip_instrumentation_lines and 'instrumentation' in line)
                or (self._base_register in line and '[' not in line)  # sandbox updates
            )

        # get all lines of the test case
        with open(test_case.asm_path(), "r") as f:
            instructions = f.readlines()

        # Iterate over all instructions, backwards, and collect a list of instructions that
        # can be modified while still passing the verification.
        # The range is empty for files with fewer than two lines, so an empty file is safe.
        modifiable_ids = []
        for cursor in range(len(instructions) - 1, 0, -1):
            line = instructions[cursor].strip().lower()

            # Leave certain lines untouched
            if line_is_skipped(line):
                continue

            # Create a modified test case
            modified_instructions = self.modify_instruction(instructions, cursor)
            if not modified_instructions:  # skip line if the modification failed
                self._progress.next(False)
                continue

            # Create a test case object from the modified instructions
            tmp_test_case = self._get_test_case_from_instructions(modified_instructions)

            # Verify modification and update the list of modifiable instructions
            check_passed = self.verify_modification(tmp_test_case, inputs)
            self._progress.next(check_passed)
            if check_passed:
                # continue from the modified program; indices below the cursor are unaffected
                instructions = modified_instructions
                modifiable_ids.append(cursor)

        return modifiable_ids

    def set_violation(self, violation: Violation) -> None:
        """ Set the violation that is being minimized """


class InstructionRemovalPass(BaseInstructionMinimizationPass):
    """
    A minimization pass that iteratively removes instructions from the test case
    (one at a time, starting from the end) and checks if the violation is still triggered.
    """
    name = "Instruction Removal Pass"

    def run(self, test_case: TestCaseProgram, inputs: List[InputData]) -> TestCaseProgram:
        """
        Find all removable lines with the standard minimization loop and build
        a new test case without them.

        :param test_case: The test case to minimize
        :param inputs: Inputs used to check that the violation is still triggered
        :return: A test case built from the lines that could not be removed
        """
        # a set gives constant-time membership checks while scanning the file
        removable_ids = set(self.minimization_loop(test_case, inputs))
        self._progress.pass_finish()

        instructions: List[str] = []
        with open(test_case.asm_path(), "r") as f:
            for i, line in enumerate(f):
                if i not in removable_ids:
                    # This instruction is essential for the violation; keep it
                    instructions.append(line)
                    continue

                # This instruction could be removed.
                # Additionally, clear the instrumentation tag from the previous kept line
                # (if there is one)
                if instructions and "instrumentation" in instructions[-1].lower():
                    instructions[-1] = instructions[-1].replace("instrumentation", "")

        return self._get_test_case_from_instructions(instructions)

    def modify_instruction(self, instructions: List[str], cursor: int) -> List[str]:
        """ Return a copy of `instructions` without the line at `cursor` """
        return instructions[:cursor] + instructions[cursor + 1:]

    def verify_modification(self, test_case: TestCaseProgram, inputs: List[InputData]) -> bool:
        """ The removal is valid if the modified test case still triggers the violation """
        return self._check_for_violation(test_case, inputs, self._ignore_list)


class InstructionSimplificationPass(BaseInstructionMinimizationPass):
    """
    A minimization pass that iteratively replaces instructions with simpler ones
    (e.g., `cmov` with `mov`, `add` with `mov`, etc.) and checks
    if the violation is still triggered.
    """
    name = "Instruction Simplification Pass"

    # Maps the first word of a line to a function that receives the whole
    # (stripped, lower-cased) line and returns the replacement for that first word.
    # An empty replacement drops the word (used for prefixes).
    _instruction_replacements: Dict[str, Callable[[str], str]] = {
        "cmova": lambda _: "mov",
        "cmovae": lambda _: "mov",
        "cmovb": lambda _: "mov",
        "cmovbe": lambda _: "mov",
        "cmovc": lambda _: "mov",
        "cmove": lambda _: "mov",
        "cmovg": lambda _: "mov",
        "cmovge": lambda _: "mov",
        "cmovl": lambda _: "mov",
        "cmovle": lambda _: "mov",
        "cmovna": lambda _: "mov",
        "cmovnae": lambda _: "mov",
        "cmovnb": lambda _: "mov",
        "cmovnbe": lambda _: "mov",
        "cmovnc": lambda _: "mov",
        "cmovne": lambda _: "mov",
        "cmovng": lambda _: "mov",
        "cmovnge": lambda _: "mov",
        "cmovnl": lambda _: "mov",
        "cmovnle": lambda _: "mov",
        "cmovno": lambda _: "mov",
        "cmovnp": lambda _: "mov",
        "cmovns": lambda _: "mov",
        "cmovnz": lambda _: "mov",
        "cmovo": lambda _: "mov",
        "cmovp": lambda _: "mov",
        "cmovs": lambda _: "mov",
        "cmovz": lambda _: "mov",
        "xchg": lambda _: "mov",
        "cmpxchg": lambda _: "xchg",
        "rep": lambda _: "",
        "lock": lambda _: "",
        "add": lambda _: "mov",
        "sub": lambda _: "add",
        "or": lambda _: "add",
        "xor": lambda _: "add",
        "and": lambda _: "add",
        "cmp": lambda _: "add",
        "bsr": lambda _: "add",
        "bsf": lambda _: "add",
        "bt": lambda _: "add",
        "bts": lambda _: "add",
        "btr": lambda _: "add",
        "btc": lambda _: "add",
        "bzhi": lambda _: "add",
        "bextr": lambda _: "add",
        "blsi": lambda _: "add",
        "blsmsk": lambda _: "add",
        "xadd": lambda _: "add",
        "test": lambda _: "add",
        "adc": lambda _: "add",
        "sbb": lambda _: "sub",
        "mul": lambda _: "inc",
        "div": lambda _: "inc",
        "setb": lambda _: "inc",
        "not": lambda _: "inc",
        "idiv": lambda _: "div",
        # only a line with exactly one comma is rewritten; other forms keep `imul`
        "imul": lambda line: "add" if len(line.split(",")) == 2 else "imul",
    }

    def run(self, test_case: TestCaseProgram, inputs: List[InputData]) -> TestCaseProgram:
        """
        Find all lines that can be simplified without losing the violation and
        build a new test case with the simplifications applied.
        On ARM64, the pass only prints a warning and returns the test case unchanged.

        :param test_case: The test case to simplify
        :param inputs: Inputs used to check that the violation is still triggered
        :return: The simplified test case
        """
        if CONF.instruction_set == "arm64":
            warning("postprocessor", "--enable-simplification-pass has no effect on ARM64")
            return test_case

        inst_ids = self.minimization_loop(test_case, inputs)
        self._progress.pass_finish()

        with open(test_case.asm_path(), "r") as f:
            instructions = f.readlines()
        for i in inst_ids:
            modified = self.modify_instruction(instructions, i)
            if modified:  # never replace the program with the "not modifiable" marker
                instructions = modified
        return self._get_test_case_from_instructions(instructions)

    def modify_instruction(self, instructions: List[str], cursor: int) -> List[str]:
        """
        Replace the first word of the line at `cursor` according to the replacement table.

        :param instructions: All lines of the assembly file
        :param cursor: Index of the line to simplify
        :return: A modified copy of `instructions`, or an empty list if the line has
            no entry in the table or the replacement would leave the line unchanged
        """
        tmp = list(instructions)  # make a copy
        clean_line = tmp[cursor].strip().lower()
        words = clean_line.split(" ")
        key = words[0]
        replacement_func = self._instruction_replacements.get(key, None)
        if not replacement_func:
            return []

        replacement = replacement_func(clean_line)
        if replacement == key:
            # nothing would change; do not spend a verification round on a no-op
            return []
        tmp[cursor] = " ".join([replacement] + words[1:]) + "\n"

        return tmp

    def verify_modification(self, test_case: TestCaseProgram, inputs: List[InputData]) -> bool:
        """ The simplification is valid if the modified test case still triggers the violation """
        return self._check_for_violation(test_case, inputs, self._ignore_list)


class ConstantSimplificationPass(BaseInstructionMinimizationPass):
    """
    A minimization pass that walks over the test case, swaps one constant operand per line
    for a fixed ISA-specific replacement value ("0" on x86-64, "#1" on ARM64),
    and keeps the change only if the violation is still triggered.
    """
    name = "Constant Simplification Pass"

    def __init__(self, fuzzer: Fuzzer, instruction_set_spec: InstructionSet,
                 progress: ProgressPrinter):
        super().__init__(fuzzer, instruction_set_spec, progress)

        # Select the ISA-specific patterns for decimal, hexadecimal and binary constants
        isa = CONF.instruction_set
        if isa == "arm64":
            self._match_dec = re.compile(r"^#-?[0-9]+$")
            self._match_hex = re.compile(r"^#-?0x[0-9a-f]+$")
            self._match_bin = re.compile(r"^#-?0b[01]+$")
            self._replacement = "#1"  # this value is safe as both an immediate and a bitmask
        elif isa == "x86-64":
            self._match_dec = re.compile(r"^-?[0-9]+$")
            self._match_hex = re.compile(r"^-?0x[0-9a-f]+$")
            self._match_bin = re.compile(r"^-?0b[01]+$")
            self._replacement = "0"
        else:
            assert_never(isa)

    def run(self, test_case: TestCaseProgram, inputs: List[InputData]) -> TestCaseProgram:
        """
        Collect the lines whose constant can be replaced and re-apply
        the replacement to each of them on a fresh copy of the assembly file.

        :param test_case: The test case to simplify
        :param inputs: Inputs used to check that the violation is still triggered
        :return: The test case built from the simplified lines
        """
        simplifiable_ids = self.minimization_loop(test_case, inputs)
        self._progress.pass_finish()

        with open(test_case.asm_path(), "r") as f:
            lines = f.readlines()
        for line_id in simplifiable_ids:
            lines = self.modify_instruction(lines, line_id)
        return self._get_test_case_from_instructions(lines)

    def modify_instruction(self, instructions: List[str], cursor: int) -> List[str]:
        """
        Replace the first comma-separated operand of the line at `cursor` that is a constant.

        :param instructions: All lines of the assembly file
        :param cursor: Index of the line to modify
        :return: A modified copy of `instructions`; an empty list if no operand is a constant
            or if the replacement value is encountered before any constant
        """
        result = list(instructions)  # never modify the caller's list
        operands = result[cursor].strip().lower().split(",")
        matchers = (self._match_dec, self._match_hex, self._match_bin)

        for position, raw_operand in enumerate(operands):
            operand = raw_operand.strip()
            if operand == self._replacement:  # already replaced
                return []
            if not any(matcher.match(operand) for matcher in matchers):
                continue

            # Found a constant: swap it and rebuild the line
            operands[position] = self._replacement
            result[cursor] = ", ".join(operands) + "\n"
            return result
        return []

    def verify_modification(self, test_case: TestCaseProgram, inputs: List[InputData]) -> bool:
        """ The replacement is valid if the modified test case still triggers the violation """
        return self._check_for_violation(test_case, inputs, self._ignore_list)


class MaskSimplificationPass(BaseInstructionMinimizationPass):
    """
    A minimization pass that iteratively replaces masks of the instrumentation
    instructions with smaller masks and checks if the violation is still triggered.
    E.g., `and rax, 0b1111111111111` -> `and rax, 0b1111111111110`
    """
    name = "Mask Simplification Pass"

    # Each 13-bit mask maps to the same mask with its lowest set bit cleared.
    # The all-zero mask has no entry, so it cannot be simplified any further.
    _mask_replacements = {
        "0b1111111111111": "0b1111111111110",
        "0b1111111111110": "0b1111111111100",
        "0b1111111111100": "0b1111111111000",
        "0b1111111111000": "0b1111111110000",
        "0b1111111110000": "0b1111111100000",
        "0b1111111100000": "0b1111111000000",
        "0b1111111000000": "0b1111110000000",
        "0b1111110000000": "0b1111100000000",
        "0b1111100000000": "0b1111000000000",
        "0b1111000000000": "0b1110000000000",
        "0b1110000000000": "0b1100000000000",
        "0b1100000000000": "0b1000000000000",
        "0b1000000000000": "0b0000000000000",
    }

    def run(self, test_case: TestCaseProgram, inputs: List[InputData]) -> TestCaseProgram:
        """
        Run the pass: collect the line indices reported by the minimization loop
        (instrumentation lines included) and replay the mask replacement for each
        of them on the assembly file.
        :param test_case: The test case to minimize
        :param inputs: List of inputs passed to the minimization loop
        :return: A new test case parsed from the modified assembly
        """
        inst_ids = self.minimization_loop(test_case, inputs, skip_instrumentation_lines=False)
        self._progress.pass_finish()

        with open(test_case.asm_path(), "r") as f:
            instructions = f.readlines()
        for i in inst_ids:
            modified = self.modify_instruction(instructions, i)
            if not modified:
                # an empty list means "no mask found"; keep the program unchanged
                # instead of replacing it with nothing
                warning("postprocessor", f"Inconsistent mask output: {instructions[i]}")
                continue
            instructions = modified
        return self._get_test_case_from_instructions(instructions)

    def modify_instruction(self, instructions: List[str], cursor: int) -> List[str]:
        """
        Replace the first known mask in the instruction at `cursor` with the next
        smaller mask. A trailing comment on the line is preserved.
        :param instructions: Lines of the assembly file; the list itself is not modified
        :param cursor: Index of the line to modify
        :return: A modified copy of `instructions`, or an empty list if the line
                 contains no replaceable mask
        """
        tmp = list(instructions)  # make a copy

        # separate the code from the (optional) trailing comment
        code, symbol, comment = tmp[cursor].partition(self._comment_symbol)
        words = [w.strip() for w in code.strip().lower().split(",")]

        for word_id, word in enumerate(words):
            replacement = self._mask_replacements.get(word)
            if not replacement:
                continue

            words[word_id] = replacement
            new_line = ", ".join(words)
            if symbol:
                # re-attach the comment only if the original line had one
                new_line += " " + symbol + comment
            if not new_line.endswith("\n"):
                # the newline is lost when the line had no comment (it was stripped
                # together with the code); without it the next line would be glued
                # to this one when the file is written back
                new_line += "\n"
            tmp[cursor] = new_line
            return tmp

        return []

    def verify_modification(self, test_case: TestCaseProgram, inputs: List[InputData]) -> bool:
        """
        Check whether the modified test case still triggers a violation.
        :param test_case: The modified test case
        :param inputs: List of inputs to use for verification
        :return: The result of the violation check
        """
        return self._check_for_violation(test_case, inputs, self._ignore_list)


class NopReplacementPass(BaseInstructionMinimizationPass):
    """
    A minimization pass that iteratively replaces instructions with NOPs
    of the same size and checks if the violation is still triggered.
    """
    name = "NOP Replacement Pass"

    # instruction size in bytes -> NOP encoding of the same size
    _replacements_x86 = {
        1: "nop  # 1 B",
        2: ".byte 0x66, 0x90  # 2 B",
        3: "nop dword ptr [rax]  # 3 B",
        4: "nop qword ptr [rax]  # 4 B",
        5: "nop qword ptr [rax + 1]  # 5 B",
        6: "nop qword ptr [rax + rax + 1]  # 6 B",
        7: "nop dword ptr [rax + 0xff]  # 7 B",
        8: "nop qword ptr [rax + 0xff]  # 8 B",
        9: "nop qword ptr [rax + rax + 0xff]  # 9 B",
    }
    _replacements_arm64 = {
        4: "nop",  # all instructions are 4 bytes
    }

    def __init__(self, fuzzer: Fuzzer, instruction_set_spec: InstructionSet,
                 progress: ProgressPrinter):
        super().__init__(fuzzer, instruction_set_spec, progress)
        if CONF.instruction_set == "x86-64":
            self._replacements = self._replacements_x86
        elif CONF.instruction_set == "arm64":
            self._replacements = self._replacements_arm64
        else:
            assert_never(CONF.instruction_set)

        # patterns of control-flow instructions, which are never replaced
        self._match_jump = re.compile(r"^j[a-z]* .*") if CONF.instruction_set == "x86-64" else \
            re.compile(r"^b\.[a-z]* .*|^bl[a-z]* .*")
        self._match_loop = re.compile(r"^loop[a-z]* .*") if CONF.instruction_set == "x86-64" else \
            re.compile(r"^cbz .*|^cbnz .*|^tbnz .*|^tbz .*")

    def run(self, test_case: TestCaseProgram, inputs: List[InputData]) -> TestCaseProgram:
        """
        Run the pass: collect the line indices reported by the minimization loop and
        rebuild the assembly file with those lines replaced by same-size NOPs.
        :param test_case: The test case to minimize
        :param inputs: List of inputs passed to the minimization loop
        :return: A new test case parsed from the modified assembly
        """
        modified_ids = set(
            self.minimization_loop(test_case, inputs, skip_instrumentation_lines=True))
        self._progress.pass_finish()

        with open(test_case.asm_path(), "r") as f:
            lines = f.readlines()

        instructions: List[str] = []
        for i, line in enumerate(lines):
            # skip non-modifiable lines
            if i not in modified_ids:
                instructions.append(line)
                continue

            # get the NOP replacement
            replacement = self.modify_instruction([line], 0)
            if not replacement:
                warning("postprocessor", f"Inconsistent NOP output: {line}")
                instructions.append(line)
                continue

            # This instruction could be replaced with a NOP
            instructions.append(replacement[0])

            # And the instrumentation tag from the previous line can be cleared
            # (there is no previous line if the replaced instruction is the first one)
            if len(instructions) >= 2 and "instrumentation" in instructions[-2].lower():
                instructions[-2] = instructions[-2].replace("instrumentation", "")

        return self._get_test_case_from_instructions(instructions)

    def modify_instruction(self, instructions: List[str], cursor: int) -> List[str]:
        """
        Replace the instruction at `cursor` with a NOP of the same encoded size.
        The size is determined by assembling the line on its own with `as` and
        extracting the `.text` section with `objcopy`.
        :param instructions: Lines of the assembly file; the list itself is not modified
        :param cursor: Index of the line to replace
        :return: A modified copy of `instructions`, or an empty list if the line already
                 contains "nop", is a jump/loop, or has no NOP of a matching size
        :raises subprocess.CalledProcessError: if `as` or `objcopy` fails
        """
        # local import: only this method needs the module
        import tempfile  # pylint: disable=import-outside-toplevel

        tmp = list(instructions)  # make a copy

        line = tmp[cursor].strip().lower()
        if "nop" in line:
            return []

        # skip jumps as replacing them with nops will confuse our assembly parser
        if self._match_jump.match(line) or self._match_loop.match(line):
            return []

        # determine the instruction size; a private scratch directory keeps the
        # intermediate files out of the working directory and guarantees that they
        # are removed even if the assembler fails
        with tempfile.TemporaryDirectory() as scratch:
            asm_path = os.path.join(scratch, "tmp.asm")
            obj_path = os.path.join(scratch, "tmp.o")
            with open(asm_path, "w") as f:
                if CONF.instruction_set == "x86-64":
                    f.write(".intel_syntax noprefix\n")
                f.write(line)
                f.write("\n")
            run(["as", asm_path, "-o", obj_path], check=True)
            # the object file is rewritten in place to contain only the raw .text bytes
            run(["objcopy", "-O", "binary", "--only-section=.text", obj_path, obj_path],
                check=True)
            size = os.path.getsize(obj_path)

        if size not in self._replacements:
            return []

        tmp[cursor] = self._replacements[size] + "\n"
        return tmp

    def verify_modification(self, test_case: TestCaseProgram, inputs: List[InputData]) -> bool:
        """
        Check whether the modified test case still triggers a violation.
        :param test_case: The modified test case
        :param inputs: List of inputs to use for verification
        :return: The result of the violation check
        """
        return self._check_for_violation(test_case, inputs, self._ignore_list)


class LabelRemovalPass(BaseInstructionMinimizationPass):
    """
    A minimization pass that iteratively removes unused labels from the test case.
    Note that no verification is performed in this pass as labels are not executed.
    """
    name = "Label Removal Pass"
    # lines containing any of these substrings are never removed
    _reserved = [
        ".intel_syntax noprefix", ".test_case_exit:", ".section", ".function", ".macro", "syntax"
    ]

    def run(self, test_case: TestCaseProgram, inputs: List[InputData]) -> TestCaseProgram:
        """
        Remove every label line that is not referenced by any other line.

        Only lines of the form `.name:` (optionally followed by a comment) are treated
        as labels. Other lines starting with a dot, such as the `.byte` directive, are
        left untouched.
        :param test_case: The test case to minimize
        :param inputs: Unused; present for interface compatibility
        :return: A new test case parsed from the assembly without the unused labels
        """
        with open(test_case.asm_path(), "r") as f:
            instructions = f.readlines()

        for i, raw_line in enumerate(instructions):
            # the comment is not part of the label and must not take part in the lookup
            code = raw_line.split(self._comment_symbol)[0].strip()

            # skip non-labels
            if not code.startswith("."):
                self._progress.next(False)
                continue

            # skip reserved labels
            lowered = raw_line.strip().lower()
            if any(reserved in lowered for reserved in self._reserved):
                continue

            # skip directives and lines where the label is followed by an instruction
            if not code.endswith(":"):
                self._progress.next(False)
                continue

            # check if the label is used by other instructions
            label = code[:-1].strip()
            used = any(label in inst for j, inst in enumerate(instructions) if j != i)

            # remove unused labels
            if not used:
                self._progress.next(True)
                instructions[i] = ""
            else:
                self._progress.next(False)

        self._progress.pass_finish()
        return self._get_test_case_from_instructions(instructions)

    def modify_instruction(self, instructions: List[str], cursor: int) -> List[str]:
        """ Not used by this pass; always returns an empty list """
        return []  # unused

    def verify_modification(self, test_case: TestCaseProgram, inputs: List[InputData]) -> bool:
        """ Not used by this pass; always returns True """
        return True  # unused


class FenceInsertionPass(BaseInstructionMinimizationPass):
    """
    A minimization pass that iteratively inserts fences before each instruction
    and checks if the violation is still triggered.
    The fence is `lfence` on x86-64 and `dsb sy` followed by `isb` otherwise.
    """
    name = "Fence Insertion Pass"

    def __init__(self, fuzzer: Fuzzer, instruction_set_spec: InstructionSet,
                 progress: ProgressPrinter):
        super().__init__(fuzzer, instruction_set_spec, progress)
        # patterns of control-flow instructions, which never get a fence in front of them
        self._match_jump = re.compile(r"^j[a-z]* .*") if CONF.instruction_set == "x86-64" else \
            re.compile(r"^b\.[a-z]* .*|^bl[a-z]* .*")
        self._match_loop = re.compile(r"^loop[a-z]* .*") if CONF.instruction_set == "x86-64" else \
            re.compile(r"^cbz .*|^cbnz .*|^tbnz .*|^tbz .*")
        self._fence = "lfence" if CONF.instruction_set == "x86-64" else "dsb sy\n isb"

    def run(self, test_case: TestCaseProgram, inputs: List[InputData]) -> TestCaseProgram:
        """
        Run the pass: collect the line indices reported by the minimization loop and
        insert a fence before each of them in the assembly file.
        :param test_case: The test case to analyze
        :param inputs: List of inputs passed to the minimization loop
        :return: A new test case parsed from the assembly with the fences inserted
        """
        inst_ids = self.minimization_loop(test_case, inputs)
        self._progress.pass_finish()

        with open(test_case.asm_path(), "r") as f:
            instructions = f.readlines()
        for i in inst_ids:
            # NOTE(review): every insertion shifts the following lines by one, so the
            # result depends on the order of the IDs returned by minimization_loop - confirm
            instructions = instructions[:i] + [self._fence + "\n"] + instructions[i:]
        return self._get_test_case_from_instructions(instructions)

    def modify_instruction(self, instructions: List[str], cursor: int) -> List[str]:
        """
        Insert a fence before the instruction at `cursor`.
        :param instructions: Lines of the assembly file; the list itself is not modified
        :param cursor: Index of the line to put the fence in front of
        :return: A copy of `instructions` with the fence inserted, or an empty list
                 if the line is a jump or a loop instruction
        """
        # strip before matching: the patterns are anchored at the start of the line,
        # so an indented control-flow instruction would otherwise not be recognized
        curr_instr = instructions[cursor].strip().lower()
        if self._match_jump.match(curr_instr) or self._match_loop.match(curr_instr):
            return []  # skip control-flow instructions - their target is already fenced
        return instructions[:cursor] + [self._fence + "\n"] + instructions[cursor:]

    def verify_modification(self, test_case: TestCaseProgram, inputs: List[InputData]) -> bool:
        """
        Check whether the test case with the fence inserted still triggers a violation.
        :param test_case: The modified test case
        :param inputs: List of inputs to use for verification
        :return: The result of the violation check
        """
        return self._check_for_violation(test_case, inputs, self._ignore_list)


================================================
FILE: rvzr/postprocessing/minimizer.py
================================================
""" File: Entry point for the postprocessing module.
    It selects the appropriate minimization passes based on the command-line arguments,
    and then runs them.

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from __future__ import annotations
import shutil
import os

from copy import deepcopy
from typing import List, NamedTuple, Dict, TYPE_CHECKING, Any, Type, Optional
from ..traces import Violation
from ..tc_components.test_case_code import TestCaseProgram
from ..tc_components.test_case_data import InputData
from ..config import CONF
from ..logs import warning, error, update_logging_after_config_change
from ..fuzzer import Fuzzer

from .instruction_passes import BaseInstructionMinimizationPass, InstructionRemovalPass, \
    InstructionSimplificationPass, NopReplacementPass, ConstantSimplificationPass, \
    MaskSimplificationPass, LabelRemovalPass, FenceInsertionPass
from .input_passes import BaseInputMinimizationPass, InputSequenceMinimizationPass, \
    DifferentialInputMinimizerPass
from .analysis_passes import AddViolationCommentsPass
from .progress_printer import ProgressPrinter

if TYPE_CHECKING:
    from ..isa_spec import InstructionSet

# Scratch directory of the minimizer: created in Minimizer.__init__
# and removed again in Minimizer.__del__
TMP_DIR = "/tmp/rvzr_minimize"


class PassDesc(NamedTuple):
    """ A named tuple to store the minimization pass description """
    # class implementing the pass; instantiated by the Minimizer when the pass is enabled
    cls_: Type[BaseInstructionMinimizationPass | BaseInputMinimizationPass]
    # True if the pass belongs to the analysis stage, which the Minimizer runs
    # after the instruction minimization passes
    is_analysis_pass: bool


class Minimizer:
    """
    Main class for the postprocessing module. It selects the appropriate minimization passes
    based on the command-line arguments, and then runs them.
    """

    ignore_list: List[int]
    """ List of input IDs that will be ignored during minimization """

    pass_map: Dict[str, PassDesc]
    """ Mapping of pass names to their classes """

    _instruction_passes: List[Type[BaseInstructionMinimizationPass]]
    _input_passes: List[Type[BaseInputMinimizationPass]]
    _analysis_passes: List[Type[BaseInstructionMinimizationPass]]

    def __init__(self, fuzzer: Fuzzer, instruction_set_spec: InstructionSet):
        self._fuzzer = fuzzer
        self._progress = ProgressPrinter()
        self.instruction_set_spec = instruction_set_spec
        self.ignore_list = []

        # manage tmp directory; exist_ok avoids a race between the check and the creation
        os.makedirs(TMP_DIR, exist_ok=True)

        # initialize the pass map; the keys match the `enable_<key>` arguments of `run`
        self.pass_map = {
            "instruction_pass": PassDesc(InstructionRemovalPass, False),
            "simplification_pass": PassDesc(InstructionSimplificationPass, False),
            "nop_pass": PassDesc(NopReplacementPass, False),
            "constant_pass": PassDesc(ConstantSimplificationPass, False),
            "mask_pass": PassDesc(MaskSimplificationPass, False),
            "label_pass": PassDesc(LabelRemovalPass, False),
            "fence_pass": PassDesc(FenceInsertionPass, True),
            "input_seq_pass": PassDesc(InputSequenceMinimizationPass, False),
            "input_diff_pass": PassDesc(DifferentialInputMinimizerPass, False),
            "comment_pass": PassDesc(AddViolationCommentsPass, True),
        }

    def __del__(self) -> None:
        # remove tmp directory; a directory that is already gone is not an error
        shutil.rmtree(TMP_DIR, ignore_errors=True)

    def run(self, test_case_asm: str, n_inputs: int, test_case_outfile: str, input_outdir: str,
            n_attempts: int, **enabled_passes: Any) -> None:
        """
        Run the minimization passes based on the command-line arguments, passed as arguments
        to this function. It first reproduces the violation, then runs the input passes,
        then the instruction passes, and finally the analysis passes. The resulting minimized
        program is stored into `test_case_outfile` and the resulting minimized input sequence
        is stored into `input_outdir`.

        :param test_case_asm: Path to the test case assembly file
        :param n_inputs: Number of inputs to use during the minimization
        :param test_case_outfile: Path to store the minimized test case
        :param input_outdir: Path to store the minimized inputs
        :param n_attempts: Number of attempts to run the instruction minimization passes
        :param enabled_passes: Dictionary of arguments to enable/disable the passes.
               Supported keys:
               - enable_instruction_pass
               - enable_simplification_pass
               - enable_nop_pass
               - enable_constant_pass
               - enable_mask_pass
               - enable_label_pass
               - enable_fence_pass
               - enable_input_seq_pass
               - enable_input_diff_pass
               - enable_comment_pass
        :return: None
        """
        self._reset(enabled_passes)

        # Parse the test case and inputs
        test_case = self._fuzzer.asm_parser.parse_file(test_case_asm, self._fuzzer.code_gen,
                                                       self._fuzzer.elf_parser)
        inputs = self._fuzzer.data_gen.generate(n_inputs, n_actors=test_case.n_actors())

        # Check if the violation can be reproduced
        violation = self._reproduce_org_violation(test_case, inputs)
        if not violation:
            return

        # Run the input minimization passes
        if self._input_passes:
            new_inputs = self._run_input_passes(test_case, inputs, violation, input_outdir)

            # Check if the violation can be reproduced with the new inputs
            # (the minimized sequence is what has to be verified, not the original one)
            new_violation = self._fuzzer.fuzzing_round(test_case, new_inputs, [])
            if new_violation:
                # Use new inputs in future passes
                inputs = new_inputs
                violation = new_violation

                # Disable boosting from now on:
                # The minimized input sequence is now guaranteed to be boosted
                CONF.inputs_per_class = 1
            else:
                warning("postprocessor", "Non-reproducible input sequence minimization. Reverting")

        # Set the non-violating inputs as the ignore list
        violating_ids = [m.input_id for m in violation.measurements]
        self.ignore_list = \
            [i for i in range(len(violation.input_sequence)) if i not in violating_ids]
        self._progress.pass_msg(f"Violating input IDs: {violating_ids}")

        # Run the instruction minimization passes
        for attempt in range(n_attempts):
            self._progress.global_msg(f"Minimization attempt {attempt + 1}/{n_attempts}")
            old_tc = deepcopy(test_case)
            test_case = self._run_instruction_passes(test_case, inputs, violation,
                                                     test_case_outfile)
            if test_case == old_tc:  # break if no progress was made
                break

        # Run the analysis passes
        test_case = self._run_analysis_passes(test_case, inputs, violation, test_case_outfile)

        # Get rid of unused labels
        if enabled_passes.get("enable_label_pass", False):
            self._instruction_passes = [LabelRemovalPass]
            test_case = self._run_instruction_passes(test_case, inputs, violation,
                                                     test_case_outfile)

        # Store the results
        self._progress.pass_start("Storing the results")
        test_case.save(test_case_outfile)

    def _reset(self, enabled_passes: Dict[str, Any]) -> None:
        """
        Prepare the minimizer for a new run: select the enabled passes, clear the ignore
        list, and adjust the global configuration.
        :param enabled_passes: Dictionary of `enable_<pass>` flags (see `run`)
        """
        # Get lists of enabled passes
        self._set_passes(enabled_passes)

        # Reset the ignore list
        self.ignore_list = []

        # Adjust the sample size to reduce non-reproducibility
        CONF.executor_sample_sizes = [CONF.executor_sample_sizes[-1]]

        # Make sure that fuzzing progress is not printed
        if "info" in CONF.logging_modes:
            CONF.logging_modes.remove("info")
            update_logging_after_config_change()

    def _reproduce_org_violation(self, test_case: TestCaseProgram,
                                 inputs: List[InputData]) -> Optional[Violation]:
        """
        Try to reproduce the violation, making up to `CONF.minimizer_retries` attempts.
        :param test_case: The test case to run
        :param inputs: List of inputs to run the test case with
        :return: The first violation found, or None if no attempt produced one
        """
        self._progress.pass_start("Reproducing the violation")
        for _ in range(CONF.minimizer_retries):
            violation = self._fuzzer.fuzzing_round(test_case, inputs, [])
            if violation:
                self._progress.pass_msg("Violation reproduced. Proceeding with minimization")
                return violation
        self._progress.pass_msg("Could not reproduce the violation. Exiting")
        return None

    def _set_passes(self, enabled_passes: Dict[str, Any]) -> None:
        """
        Sort the enabled passes into input, instruction, and analysis passes.
        :param enabled_passes: Dictionary of `enable_<pass>` flags (see `run`)
        """
        passes: List[PassDesc] = \
            [v for k, v in self.pass_map.items() if enabled_passes.get(f"enable_{k}", False)]
        self._input_passes = [
            p.cls_ for p in passes if issubclass(p.cls_, BaseInputMinimizationPass)
        ]
        self._instruction_passes = [
            p.cls_
            for p in passes
            if issubclass(p.cls_, BaseInstructionMinimizationPass) and not p.is_analysis_pass
        ]
        self._analysis_passes = [
            p.cls_
            for p in passes
            if issubclass(p.cls_, BaseInstructionMinimizationPass) and p.is_analysis_pass
        ]

    def _run_input_passes(self, test_case: TestCaseProgram, inputs: List[InputData],
                          org_violation: Violation, outdir: str) -> List[InputData]:
        """
        Run the enabled input passes one after another and save the resulting inputs.
        The result of a pass is adopted only if the violation reproduces with it.
        :param test_case: The test case to run
        :param inputs: The original input sequence
        :param org_violation: The violation reproduced with the original inputs
        :param outdir: Directory to store the resulting inputs in
        :return: The input sequence after the last successfully verified pass
        """
        violation = org_violation

        for pass_cls in self._input_passes:
            # Create the pass object
            pass_ = pass_cls(self._fuzzer, self.instruction_set_spec, self._progress)
            self._progress.pass_start(pass_.name)

            # Run the pass
            new_inputs = pass_.run(test_case, inputs, violation)

            # Recreate the violation with the new input sequence
            new_violation = self._fuzzer.fuzzing_round(test_case, new_inputs, [])
            if new_violation:
                violation = new_violation
                inputs = new_inputs
            else:
                self._progress.pass_msg("[WARNING] Non-reproducible sequence minimization"
                                        ". Rolling back to the previous state")

        # Create the output directory, if not already exists
        if outdir and not os.path.exists(outdir):
            try:
                os.makedirs(outdir)
            except OSError:
                error(f"Creation of the directory {outdir} failed")
            outdir = os.path.abspath(outdir)

        # Store the results
        self._progress.pass_msg(f"Saving new inputs in '{outdir}'")
        for i, input_ in enumerate(inputs):
            input_.save(f"{outdir}/min_input_{i:04}.bin")

        return inputs

    def _run_instruction_passes(self, test_case: TestCaseProgram, inputs: List[InputData],
                                org_violation: Violation, outfile: str) -> TestCaseProgram:
        """
        Run the enabled instruction minimization passes (see `_run_passes`).
        """
        return self._run_passes(self._instruction_passes, test_case, inputs, org_violation,
                                outfile)

    def _run_analysis_passes(self, test_case: TestCaseProgram, inputs: List[InputData],
                             org_violation: Violation, outfile: str) -> TestCaseProgram:
        """
        Run the enabled analysis passes (see `_run_passes`).
        """
        return self._run_passes(self._analysis_passes, test_case, inputs, org_violation, outfile)

    def _run_passes(self, passes: List[Type[BaseInstructionMinimizationPass]],
                    test_case: TestCaseProgram, inputs: List[InputData],
                    org_violation: Violation, outfile: str) -> TestCaseProgram:
        """
        Instantiate the given passes, run them in order, and save the test case
        to `outfile` after each pass.
        :param passes: Classes of the passes to run
        :param test_case: The test case to start from
        :param inputs: List of inputs handed to every pass
        :param org_violation: The violation handed to every pass
        :param outfile: Path to store the intermediate and final test case
        :return: The test case produced by the last pass
        """
        # create pass objects
        pass_objs = [c(self._fuzzer, self.instruction_set_spec, self._progress) for c in passes]
        for pass_obj in pass_objs:
            pass_obj.set_ignore_list(self.ignore_list)
            pass_obj.set_violation(org_violation)

        # run passes
        for pass_obj in pass_objs:
            self._progress.pass_start(pass_obj.name)
            test_case = pass_obj.run(test_case, inputs)
            test_case.save(outfile)

        return test_case


================================================
FILE: rvzr/postprocessing/pass_abc.py
================================================
""" File: Abstract interfaces for minimization passes and common functionality.

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from __future__ import annotations

import abc
import tempfile
from typing import TYPE_CHECKING, List, Final

from ..config import CONF

if TYPE_CHECKING:
    from ..fuzzer import Fuzzer
    from ..isa_spec import InstructionSet
    from ..tc_components.test_case_code import TestCaseProgram
    from ..tc_components.test_case_data import InputData
    from .progress_printer import ProgressPrinter


class BaseMinimizationPass(abc.ABC):
    """ Common state and helpers shared by all minimization passes """
    name: str = ""
    _fuzzer: Final[Fuzzer]
    _instruction_set_spec: Final[InstructionSet]
    _progress: Final[ProgressPrinter]
    _ignore_list: List[int]

    def __init__(self, fuzzer: Fuzzer, instruction_set_spec: InstructionSet,
                 progress: ProgressPrinter):
        self._fuzzer = fuzzer
        self._instruction_set_spec = instruction_set_spec
        self._progress = progress
        self._ignore_list = []

        # ISA-dependent assembly conventions
        is_x86 = CONF.instruction_set == "x86-64"
        self._comment_symbol = "#" if is_x86 else "//"
        self._base_register = "r14" if is_x86 else "x20"

    def set_ignore_list(self, ignore_list: List[int]) -> None:
        """ Store the list of input IDs that the pass should ignore """
        self._ignore_list = ignore_list

    def _get_test_case_from_instructions(self,
                                         instructions: List[str],
                                         path: str = "") -> TestCaseProgram:
        """
        Write the given assembly lines to a file and parse the file into a test case.
        :param instructions: Lines of the assembly file, written out verbatim
        :param path: Destination file; if empty, a new file is created
                     in /tmp/rvzr_minimize and kept after the call
        :return: Test case object produced by the assembly parser
        """
        if not path:
            # reserve a unique file name; the file is reopened for writing below
            with tempfile.NamedTemporaryFile(dir="/tmp/rvzr_minimize", delete=False) as tmp_file:
                path = tmp_file.name

        with open(path, "w+") as asm_file:
            asm_file.writelines(instructions)

        return self._fuzzer.asm_parser.parse_file(path, self._fuzzer.code_gen,
                                                  self._fuzzer.elf_parser)

    def _check_for_violation(self, test_case: TestCaseProgram, inputs: List[InputData],
                             local_ignore_list: List[int]) -> bool:
        """
        Run fuzzing rounds until one reports a violation, making up to
        `CONF.minimizer_retries` attempts.
        :param test_case: The test case to check
        :param inputs: List of inputs to use for verification
        :param local_ignore_list: List of input IDs to ignore
        :return: True if any attempt triggered a violation, False otherwise
        """
        attempts = range(CONF.minimizer_retries)
        # any() stops at the first successful attempt
        return any(
            self._fuzzer.fuzzing_round(test_case, inputs, local_ignore_list) is not None
            for _ in attempts)


================================================
FILE: rvzr/postprocessing/progress_printer.py
================================================
""" File: Printing of the minimization progress

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""


class ProgressPrinter():
    """
    Terminal progress output shared by all minimization classes,
    so that every pass reports its progress in the same format.
    """
    line_width: int = 64
    curr_width: int = 0
    offset: int = 2
    pass_id: int = 0
    progress_bar_on: bool = False

    def pass_start(self, label: str, offset: int = 2) -> None:
        """ Print the header of a new pass and reset the progress bar state """
        self.pass_id = self.pass_id + 1
        self.offset, self.curr_width = offset, 0
        self.progress_bar_on = False
        print(f"[PASS {self.pass_id}] {label}", flush=True)

    def pass_finish(self) -> None:
        """ Terminate the output line of the current pass """
        print()  # finish the line

    def pass_msg(self, msg: str) -> None:
        """ Print an indented message that belongs to the current pass """
        prefix = " " * self.offset + "> "
        print(prefix + msg)
        self.progress_bar_on = False

    def next(self, success: bool) -> None:
        """ Append one mark to the progress bar: '.' on success, '-' otherwise """
        if not self.progress_bar_on:
            # the bar starts on a fresh line
            print()
            self.progress_bar_on = True

        self.curr_width += 1
        if self.curr_width > self.line_width:
            # wrap the bar once the line is full
            print(flush=True)
            self.curr_width = self.offset

        mark = "." if success else "-"
        print(mark, end="", flush=True)

    def global_msg(self, msg: str) -> None:
        """ Print a message that does not belong to any particular pass """
        print("[INFO]", msg)


================================================
FILE: rvzr/py.typed
================================================


================================================
FILE: rvzr/sandbox.py
================================================
"""
File: Constants defining the memory layout for the data and code sandboxes,
      which should be identical between the executor and the model.
      See docs/sandbox.md for more information.

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from __future__ import annotations
from enum import Enum
from typing import Dict, List, Tuple, TYPE_CHECKING

import numpy as np

if TYPE_CHECKING:
    from .tc_components.test_case_code import TestCaseProgram

# Page size in bytes; the sizes of the sandbox areas are expressed in terms of it
PAGE_SIZE = 4096

# Sandbox addresses are plain integers; the aliases only document what an address refers to
SandboxAddr = int
DataAddr = SandboxAddr
CodeAddr = SandboxAddr
# A (data address, code address) pair
BaseAddrTuple = Tuple[DataAddr, CodeAddr]


# ==================================================================================================
# Area Enumerations
# ==================================================================================================
class DataArea(Enum):
    """
    Enumeration class representing data areas in the sandbox.

    The member names double as field names of the data layout:
    SandboxLayout.data_area_size looks an area up as `_DataAreaLayout[area.name]`.
    """
    # NOTE(review): START, REG_INIT and RSP_INIT have no field of the same name in
    # SandboxLayout._DataAreaLayout; presumably they are resolved separately - confirm
    START = 0
    MACRO_STACK = 1
    UNDERFLOW_PAD = 2
    MAIN = 3
    FAULTY = 4
    REG_INIT = 5
    GPR = 6
    SIMD = 7
    OVERFLOW_PAD = 8
    RSP_INIT = 9


class CodeArea(Enum):
    """
    Enumeration class representing code areas in the sandbox.

    MAIN and MACRO share their names with the fields of SandboxLayout._CodeAreaLayout.
    """
    # NOTE(review): START has no field of the same name in SandboxLayout._CodeAreaLayout;
    # presumably it denotes the beginning of the code sandbox - confirm
    START = 0
    MAIN = 1
    MACRO = 2


# ==================================================================================================
# Sandbox Layout Class
# ==================================================================================================
class SandboxLayout:
    """
    Layout of the data and code sandboxes. This class is responsible for ensuring
    consistency of memory layouts between the executor, the model, and the generators.

    Every actor owns one instance of `_DataAreaLayout` in the data sandbox and one instance
    of `_CodeAreaLayout` in the code sandbox. The instances of consecutive actors are placed
    back to back, starting at the base addresses passed to the constructor.
    """
    _data_start: DataAddr
    _data_end: DataAddr
    _code_start: CodeAddr
    _code_end: CodeAddr

    # Lookup tables indexed by actor ID; each entry maps an area to its absolute address
    _data_addresses: List[Dict[DataArea, DataAddr]]
    _code_addresses: List[Dict[CodeArea, CodeAddr]]

    # NOTE: the constants in _DataAreaLayout and _CodeAreaLayout *must* be identical
    # to the actor_data_t and actor_code_t in executor (rvzr/executor_km/include/sandbox_manager.h)
    _DataAreaLayout = np.dtype(
        [
            ('MACRO_STACK', np.uint8, 64),
            ('UNDERFLOW_PAD', np.uint8, PAGE_SIZE - 64),
            ('MAIN', np.uint8, PAGE_SIZE),
            ('FAULTY', np.uint8, PAGE_SIZE),
            ('GPR', np.uint8, 64),  # 8 64-bit GPRs
            ('SIMD', np.uint8, 256),  # 8 256-bit YMMs
            ('OVERFLOW_PAD', np.uint8, PAGE_SIZE - 64 - 256),
        ],
        align=False,
    )

    _CodeAreaLayout = np.dtype(
        [
            ('MAIN', np.uint8, 2 * PAGE_SIZE),
            ('MACRO', np.uint8, PAGE_SIZE),
        ],
        align=False,
    )

    # ==============================================================================================
    # Constant Accessors
    # ==============================================================================================
    @classmethod
    def data_area_size(cls, area: DataArea) -> int:
        """
        Get the size of a specific area in the data sandbox.
        The area must be a field of the data layout; the aliases START, REG_INIT and RSP_INIT
        are not fields and therefore cannot be queried.
        :param area: The area to get the size of.
        :return: The size of the area in bytes.
        """
        return cls._DataAreaLayout[area.name].itemsize

    @classmethod
    def data_area_offset(cls, area: DataArea) -> int:
        """
        Get the offset of a specific area in the data sandbox.
        :param area: The area to get the offset of.
        :return: The offset of the area in bytes, relative to the start of the actor's data.
        """
        if area == DataArea.START:
            return 0
        if area == DataArea.REG_INIT:
            # register initialization values begin with the GPR area
            return cls._DataAreaLayout.fields['GPR'][1]  # type: ignore
        if area == DataArea.RSP_INIT:
            # 8 bytes below the start of FAULTY, i.e., the last 8 bytes of the preceding area
            return cls._DataAreaLayout.fields['FAULTY'][1] - 8  # type: ignore
        return cls._DataAreaLayout.fields[area.name][1]  # type: ignore

    @classmethod
    def data_size_per_actor(cls) -> int:
        """
        Get the size of the data sandbox for a single actor.
        :return: The size of the data sandbox for a single actor in bytes.
        """
        return cls._DataAreaLayout.itemsize

    @classmethod
    def code_area_size(cls, area: CodeArea) -> int:
        """
        Get the size of a specific area in the code sandbox.
        The area must be a field of the code layout; the alias START is not a field and
        therefore cannot be queried.
        :param area: The area to get the size of.
        :return: The size of the area in bytes.
        """
        return cls._CodeAreaLayout[area.name].itemsize

    @classmethod
    def code_area_offset(cls, area: CodeArea) -> int:
        """
        Get the offset of a specific area in the code sandbox.
        :param area: The area to get the offset of.
        :return: The offset of the area in bytes, relative to the start of the actor's code.
        """
        if area == CodeArea.START:
            return 0
        return cls._CodeAreaLayout.fields[area.name][1]  # type: ignore

    @classmethod
    def code_size_per_actor(cls) -> int:
        """
        Get the size of the code sandbox for a single actor.
        :return: The size of the code sandbox for a single actor in bytes.
        """
        return cls._CodeAreaLayout.itemsize

    # ==============================================================================================
    # Object Interface
    # ==============================================================================================
    def __init__(self, bases: BaseAddrTuple, n_actors: int):
        """
        Create a layout for the given number of actors.
        :param bases: base addresses of the data sandbox and of the code sandbox (in this order)
        :param n_actors: number of actors that share the sandboxes
        """
        # Data boundaries
        self._data_start = bases[0]
        self.data_size = self._DataAreaLayout.itemsize * n_actors
        self._data_end = bases[0] + self.data_size
        assert self.data_size % PAGE_SIZE == 0

        # Code boundaries
        self._code_start = bases[1]
        self.code_size = self._CodeAreaLayout.itemsize * n_actors
        self._code_end = bases[1] + self.code_size
        assert self.code_size % PAGE_SIZE == 0

        # Pre-compute data and code addresses
        # Note: This makes sense because we assume that the object will be initialized
        # once and used many times (see get_data_addr and get_code_addr).
        self._data_addresses = []
        for actor_id in range(n_actors):
            actor_data_start = self._data_start + actor_id * self.data_size_per_actor()
            self._data_addresses.append(
                {area: actor_data_start + self.data_area_offset(area) for area in DataArea})
        self._code_addresses = []
        for actor_id in range(n_actors):
            actor_code_start = self._code_start + actor_id * self.code_size_per_actor()
            self._code_addresses.append(
                {area: actor_code_start + self.code_area_offset(area) for area in CodeArea})

    def code_start(self) -> CodeAddr:
        """ Read-only access to the code start address """
        return self._code_start

    def code_end(self) -> CodeAddr:
        """ Read-only access to the code end address (exclusive) """
        return self._code_end

    def data_start(self) -> DataAddr:
        """ Read-only access to the data start address """
        return self._data_start

    def data_end(self) -> DataAddr:
        """ Read-only access to the data end address (exclusive) """
        return self._data_end

    def get_data_addr(self, area: DataArea, actor_id: int) -> DataAddr:
        """
        Get the starting address of a specific area in the data sandbox for a given actor.
        :param area: The area to get the address of.
        :param actor_id: The actor to get the address for.
        :return: The starting address of the area in the data sandbox.
        """
        # Fast path: the address was pre-computed by the constructor
        if 0 <= actor_id < len(self._data_addresses):
            return self._data_addresses[actor_id][area]

        # Actor IDs outside of the pre-computed range are derived with the same formula
        actor_data_start = self._data_start + actor_id * self.data_size_per_actor()
        return actor_data_start + self.data_area_offset(area)

    def get_code_addr(self, area: CodeArea, actor_id: int) -> CodeAddr:
        """
        Get the starting address of a specific area in the code sandbox for a given actor.
        :param area: The area to get the address of.
        :param actor_id: The actor to get the address for.
        :return: The starting address of the area in the code sandbox.
        """
        # Fast path: the address was pre-computed by the constructor
        if 0 <= actor_id < len(self._code_addresses):
            return self._code_addresses[actor_id][area]

        # Actor IDs outside of the pre-computed range are derived with the same formula
        actor_code_start = self._code_start + actor_id * self.code_size_per_actor()
        return actor_code_start + self.code_area_offset(area)

    def get_exit_addr(self, test_case: TestCaseProgram) -> CodeAddr:
        """
        Get the address of the exit instruction in the code sandbox for a given test case.
        The address is computed as the code sandbox start plus the size of the "main" section
        minus one.
        :param test_case: The test case to get the exit address for.
        :return: The exit address
        """
        main_section = test_case.find_section(name="main")
        main_size = main_section.get_elf_data()["size"]
        exit_addr = self._code_start + main_size - 1
        return exit_addr

    def is_data_addr(self, addr: DataAddr) -> bool:
        """
        Check if the given address is within the data sandbox.
        :param addr: The address to check.
        :return: True if the address is within the data sandbox, False otherwise.
        """
        return self._data_start <= addr < self._data_end

    def is_code_addr(self, addr: CodeAddr) -> bool:
        """
        Check if the given address is within the code sandbox.
        :param addr: The address to check.
        :return: True if the address is within the code sandbox, False otherwise.
        """
        return self._code_start <= addr < self._code_end

    def data_addr_to_offset(self, addr: DataAddr) -> DataAddr:
        """
        Convert the given address to an offset within the data sandbox.
        No range check is performed on the address.
        :param addr: The address to convert.
        :return: The offset within the data sandbox.
        """
        return addr - self._data_start

    def code_addr_to_offset(self, addr: CodeAddr) -> CodeAddr:
        """
        Convert the given address to an offset within the code sandbox.
        No range check is performed on the address.
        :param addr: The address to convert.
        :return: The offset within the code sandbox.
        """
        return addr - self._code_start

    def code_addr_to_actor_id(self, addr: CodeAddr) -> int:
        """
        Given a code address, identify the actor ID that the code address belongs to.
        No range check is performed on the address.
        :param addr: Code address
        :return: Actor ID
        """
        return (addr - self._code_start) // self.code_size_per_actor()

    def data_addr_to_actor_id(self, addr: DataAddr) -> int:
        """
        Given a data address, identify the actor ID that the data address belongs to.
        No range check is performed on the address.
        :param addr: Data address
        :return: Actor ID
        """
        return (addr - self._data_start) // self.data_size_per_actor()


================================================
FILE: rvzr/stats.py
================================================
""" File: Global statistics class

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from __future__ import annotations

from typing import Any, Dict


class FuzzingStats:
    """
    Class responsible for storing and managing fuzzing statistics.
    Implements the Borg pattern to share the state between instances: all instances use
    the same attribute dictionary, so a counter updated through one instance is visible
    through every other instance. The class-level values below act as the initial zeros.
    """
    _borg_shared_state: Dict[Any, Any] = {}

    # general counters
    test_cases: int = 0
    num_inputs: int = 0
    eff_classes: int = 0
    single_entry_classes: int = 0
    violations: int = 0
    analysed_test_cases: int = 0
    executor_reruns: int = 0

    # counters reported under "Discarded Test Cases" in __str__
    spec_filter: int = 0
    observ_filter: int = 0
    fast_path: int = 0
    fp_nesting: int = 0
    fp_taint_mistakes: int = 0
    fp_early_priming: int = 0
    fp_large_sample: int = 0
    fp_priming: int = 0

    # Implementation of Borg pattern
    def __init__(self) -> None:
        self.__dict__ = self._borg_shared_state

    def __str__(self) -> str:
        """ Return a multi-line report; all ratios fall back to 0 when their divisor is 0 """
        total_clss = self.eff_classes + self.single_entry_classes
        if self.analysed_test_cases:
            total_clss_per_test_case = total_clss / self.analysed_test_cases
            effective_clss = self.eff_classes / self.analysed_test_cases
        else:
            total_clss_per_test_case = 0
            effective_clss = 0
        iptc = self.num_inputs / self.test_cases if self.test_cases else 0

        lines = [
            f"Test Cases: {self.test_cases}\n",
            f"Inputs per test case: {iptc:.1f}\n",
            f"Violations: {self.violations}\n",
            "Effectiveness: \n",
            f"  Total Cls: {total_clss_per_test_case:.1f}\n",
            f"  Effective Cls: {effective_clss:.1f}\n",
            "Discarded Test Cases:\n",
            f"  Speculation Filter: {self.spec_filter}\n",
            f"  Observation Filter: {self.observ_filter}\n",
            f"  Fast Path: {self.fast_path}\n",
            f"  Max Nesting Check: {self.fp_nesting}\n",
            f"  Tainting Check: {self.fp_taint_mistakes}\n",
            f"  Early Priming Check: {self.fp_early_priming}\n",
            f"  Large Sample Check: {self.fp_large_sample}\n",
            f"  Priming Check: {self.fp_priming}\n",
        ]
        return "".join(lines)

    def get_brief(self) -> str:
        """
        Return a brief one-line summary of the statistics.
        :return: the summary, or an empty string if no test case has been counted yet
        """

        if self.test_cases == 0:
            return ""

        if self.analysed_test_cases:
            all_cls = (self.eff_classes + self.single_entry_classes) // self.analysed_test_cases
            eff_cls = self.eff_classes // self.analysed_test_cases
        else:
            all_cls = 0
            eff_cls = 0

        # test cases may be counted before any input is; avoid dividing by zero in that case
        executor_reruns = self.executor_reruns // self.num_inputs if self.num_inputs else 0

        s = f"Cls:{eff_cls}/{all_cls},"
        s += f"In:{self.num_inputs // self.test_cases},"
        s += f"R:{executor_reruns},"
        s += f"SF:{self.spec_filter},"
        s += f"OF:{self.observ_filter},"
        s += f"Fst:{self.fast_path}," \
             f"CN:{self.fp_nesting}," \
             f"CT:{self.fp_taint_mistakes}," \
             f"P1:{self.fp_early_priming}," \
             f"CS:{self.fp_large_sample}," \
             f"P2:{self.fp_priming}," \
             f"V:{self.violations}"
        return s


================================================
FILE: rvzr/target_desc.py
================================================
"""
File: Architectural details of the target platform,
such as register sizes, register names, and CPU description.

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from __future__ import annotations
from abc import ABC, abstractmethod
from typing import Dict, List, Tuple, NamedTuple, Literal, TYPE_CHECKING
import subprocess

from rvzr.config import CONF, PagePropertyName

if TYPE_CHECKING:
    from .tc_components.instruction import Instruction, RegSize

# ==================================================================================================
# Custom Types
# ==================================================================================================
Vendor = Literal["Intel", "AMD", "ARM", "Unknown"]
RegName = str
RegNormalizedName = str
RegUnicornID = int
PTEBitName = Literal["present", "writable", "non_writable", "user", "write-through",
                     "cache-disable", "accessed", "dirty", "reserved_bit", "executable",
                     "non_executable", "valid"]
PTEBitOffset = int
PTEBitNameMapper = Dict[PagePropertyName, Tuple[PTEBitName, bool]]


# ==================================================================================================
# Use-case Specific Descriptors
# ==================================================================================================
class CPUDesc(NamedTuple):
    """ CPU description. """

    # CPU vendor; one of the values permitted by the `Vendor` literal type
    vendor: Vendor
    # NOTE(review): presumably the numeric model, family, and stepping identifiers of the CPU
    # (e.g., as reported by CPUID) - confirm against the code that constructs CPUDesc
    model: int
    family: int
    stepping: int


class MacroSpec(NamedTuple):
    """
    Macro specification.
    See TargetDesc.macro_specs for the table of macros described with this type.
    """

    # numeric macro ID; TargetDesc.get_macro_spec_from_type looks macros up by this value
    type_: int
    # macro name; in TargetDesc.macro_specs it equals the key the spec is stored under
    name: str
    # descriptors of the four argument slots; unused slots hold an empty string
    args: Tuple[str, str, str, str]


class UnicornTargetDesc:  # pylint: disable=too-few-public-methods
    """
    Target description in the context of a Unicorn-based model.

    The class only declares the attributes; no values are assigned here.
    NOTE(review): presumably the values are provided by architecture-specific subclasses -
    confirm against the target-specific modules.
    """

    usable_registers: List[RegUnicornID]
    """ List of Unicorn register IDs that are used by test cases on the target platform. """

    usable_simd128_registers: List[RegUnicornID]
    """ List of Unicorn SIMD register IDs that are used by test cases on the target platform. """

    reg_str_to_constant: Dict[RegName, RegUnicornID]
    """ Mapping from register names to their Unicorn constants. """

    reg_norm_to_constant: Dict[RegNormalizedName, RegUnicornID]
    """ Mapping from normalized register names to their Unicorn constants. """

    barriers: List[str]
    """ List of instruction names that are considered as speculation barriers """

    flags_register: RegUnicornID
    """ Unicorn register ID of the flags register """

    pc_register: RegUnicornID
    """ Unicorn register ID of the program counter register """

    sp_register: RegUnicornID
    """ Unicorn register ID of the stack pointer register """

    actor_base_register: RegUnicornID
    """ Unicorn register ID of the register that holds the base address of the active actor """


# ==================================================================================================
# Main Target Description
# ==================================================================================================
class TargetDesc(ABC):
    """
    Abstract base of all target description classes.
    It declares the architecture-dependent tables that subclasses are expected to fill in,
    defines the cross-platform macro table, and provides a few shared helpers.
    """

    cpu_desc: CPUDesc
    """ Description of the target CPU. """

    # Table of macro specifications, keyed by macro name.
    # All macros are cross-platform, hence the table is the same for all targets.
    macro_specs: Dict[str, MacroSpec] = {
        # macros with negative IDs are used for generation
        # and are not supposed to reach the final binary
        "random_instructions":
            MacroSpec(-1, "random_instructions", ("int", "int", "", "")),

        # macros with positive IDs are used for execution and can be interpreted by executor/model
        "function":
            MacroSpec(0, "function", ("", "", "", "")),
        "measurement_start":
            MacroSpec(1, "measurement_start", ("", "", "", "")),
        "measurement_end":
            MacroSpec(2, "measurement_end", ("", "", "", "")),
        "fault_handler":
            MacroSpec(3, "fault_handler", ("", "", "", "")),
        "switch":
            MacroSpec(4, "switch", ("actor_id", "function_id", "", "")),
        "set_k2u_target":
            MacroSpec(5, "set_k2u_target", ("actor_id", "function_id", "", "")),
        "switch_k2u":
            MacroSpec(6, "switch_k2u", ("actor_id", "", "", "")),
        "set_u2k_target":
            MacroSpec(7, "set_u2k_target", ("actor_id", "function_id", "", "")),
        "switch_u2k":
            MacroSpec(8, "switch_u2k", ("actor_id", "", "", "")),
        "set_h2g_target":
            MacroSpec(9, "set_h2g_target", ("actor_id", "function_id", "", "")),
        "switch_h2g":
            MacroSpec(10, "switch_h2g", ("actor_id", "", "", "")),
        "set_g2h_target":
            MacroSpec(11, "set_g2h_target", ("actor_id", "function_id", "", "")),
        "switch_g2h":
            MacroSpec(12, "switch_g2h", ("actor_id", "", "", "")),
        "landing_k2u":
            MacroSpec(13, "landing_k2u", ("", "", "", "")),
        "landing_u2k":
            MacroSpec(14, "landing_u2k", ("", "", "", "")),
        "landing_h2g":
            MacroSpec(15, "landing_h2g", ("", "", "", "")),
        "landing_g2h":
            MacroSpec(16, "landing_g2h", ("", "", "", "")),
        # NOTE(review): ID 17 is not assigned in this table - confirm against the executor
        "set_data_permissions":
            MacroSpec(18, "set_data_permissions", ("actor_id", "int", "int", ""))
        # FIXME: macro IDs should not be hardcoded but rather received from the executor
        # or at least we need a test that will check that the IDs match
    }

    uc_target_desc: UnicornTargetDesc
    """ Target description in the context of a Unicorn-based model """

    register_sizes: Dict[RegName, RegSize]
    """ Dictionary mapping register names to their sizes in bits. """

    registers_by_size: Dict[RegSize, List[RegName]]
    """ Dictionary with lists of all registers for a given size. """

    reg_normalized: Dict[RegName, RegNormalizedName]
    """ Mapping from full register names to normalized size-independent names. E.g., rax -> A"""

    reg_denormalized: Dict[RegNormalizedName, Dict[RegSize, RegName]]
    """ Reverse mapping from normalized names to full register names.
    E.g., A -> {64: rax, 32: eax, 16: ax, 8: al} """

    page_property_to_pte_bit_name: PTEBitNameMapper
    """
    Dictionary mapping architecture-independent page property names to architecture-specific
    page table entry bit names together with a bit indicating whether the property is inverted.
    E.g.,
        'writable' -> ('writable', False)
        'executable' -> ('non_executable', True)
    """

    pte_bits: Dict[PTEBitName, Tuple[PTEBitOffset, bool]]
    """
    Dictionary mapping page table entry field names to their bit offsets and their default values.
    """

    page_property_to_vm_pte_bit_name: PTEBitNameMapper
    """
    Dictionary mapping architecture-independent page property names to architecture-specific
    VM page table entry bit names. This is the unified mapping for both Intel EPT and AMD NPT.
    """

    vm_pte_bits: Dict[PTEBitName, Tuple[PTEBitOffset, bool]]
    """
    Dictionary mapping VM page table entry field names to their bit offsets
    and their default values. This is the unified interface for various types of host-to-guest
    page tables, such as Intel EPT and AMD NPT.
    """

    branch_conditions: Dict[str, List[str]]
    """ Dictionary mapping branch instructions to their condition codes. """

    mem_index_registers: List[RegName]
    """ List of registers that can be used as memory index registers. """

    @classmethod
    def get_vendor(cls) -> Vendor:
        """
        Detect the CPU vendor by searching the output of `lscpu` for a known vendor name.
        The names are tried in the order Intel, AMD, ARM; the first one found wins.
        :return: the detected vendor, or "Unknown" if none of the names is found
        """
        lscpu_output = subprocess.check_output("lscpu", shell=True)
        known_vendors: Tuple[Vendor, ...] = ("Intel", "AMD", "ARM")
        for vendor in known_vendors:
            if vendor.encode() in lscpu_output:
                return vendor
        return "Unknown"

    @staticmethod
    @abstractmethod
    def is_unconditional_branch(inst: Instruction) -> bool:
        """ Tell whether the given instruction is an unconditional branch. """

    @staticmethod
    @abstractmethod
    def is_call(inst: Instruction) -> bool:
        """ Tell whether the given instruction is a call. """

    def get_macro_spec_from_type(self, type_: int) -> MacroSpec:
        """
        Look up a macro specification by its numeric macro type.
        :param type_: macro type
        :return: the first specification in `macro_specs` with a matching type
        :raises: KeyError if no macro has the given type
        """
        candidates = (spec for spec in self.macro_specs.values() if spec.type_ == type_)
        found = next(candidates, None)
        if found is None:
            raise KeyError(f"Unknown macro type: {type_}")
        return found

    def _filter_blocked_registers(self) -> Dict[RegSize, List[str]]:
        """
        Build a copy of `registers_by_size` without the blocked registers. Invoked by subclasses.
        A register is kept if it is not in the configured blocklist, or if it is explicitly
        re-enabled through the configured allowlist.
        :return: dictionary with the lists of non-blocked registers for each register size
        """
        return {
            size: [
                reg for reg in registers
                if reg not in CONF.register_blocklist or reg in CONF.register_allowlist
            ] for size, registers in self.registers_by_size.items()
        }


================================================
FILE: rvzr/tc_components/__init__.py
================================================
"""
File: Module containing a collection of classes that represent components
      of a test case (both code and data).

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
# flake8: noqa
# pylint: skip-file

from .actor import *
from .instruction import *
from .test_case_code import *
from .test_case_data import *


================================================
FILE: rvzr/tc_components/actor.py
================================================
"""
File: Classes defining the actor abstraction.

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from __future__ import annotations

from typing import Dict, Tuple, Final, Optional, TYPE_CHECKING
from enum import Enum
import random

from ..target_desc import TargetDesc, PTEBitName, PTEBitOffset

if TYPE_CHECKING:
    from ..config import PageConf, PagePropertyName, ActorConf
    from .test_case_code import CodeSection

    _PTEBitValue = bool
    _PTEDescriptor = Dict[PTEBitName, Tuple[PTEBitOffset, _PTEBitValue]]
    _PropertyMap = Dict[PagePropertyName, Tuple[PTEBitName, bool]]

ActorID = int
ActorName = str
PTEMask = int


class ActorMode(Enum):
    """ Enumeration class representing the execution mode of an actor (host or guest). """
    HOST = 0  # selected by Actor.from_dict when the actor config has mode == "host"
    GUEST = 1  # selected by Actor.from_dict when the actor config has mode == "guest"


class ActorPL(Enum):
    """ Enumeration class representing the privilege level of an actor (kernel or user). """
    KERNEL = 0  # selected by Actor.from_dict when privilege_level == "kernel"
    USER = 1  # selected by Actor.from_dict when privilege_level == "user"


# ==================================================================================================
# Helper Functions to manage actor data properties
# ==================================================================================================
def _create_pte_mask(pte_descriptor: _PTEDescriptor, page_properties_to_set: PageConf,
                     page_property_to_pte_bit_name: _PropertyMap) -> PTEMask:
    """
    Create an architecture-specific page table entry (PTE) bitmask based on the actor's
    architecture-independent data properties. This bitmask is to be used by the executor
    and the model to set page table properties of actors.

    The function takes a dictionary `pte_descriptor` that describes each bit of the PTE for
    the target architecture. Each entry in the dictionary maps a bit name to a tuple containing
    the bit's offset in the PTE and its default value.

    The function modifies the default values based on the `page_properties_to_set` dictionary,
    which specifies the desired properties for the page table entry (this typically originates
    from config.yaml). Only the bits that correspond to a listed property are written into
    the mask.

    As the names of the properties in `page_properties_to_set` may differ from the names used in
    the `pte_descriptor`, the function uses the `page_property_to_pte_bit_name` mapping to
    translate between the two.

    Optionally, if `page_properties_to_set['randomized']` is True, the function introduces
    randomness in the bitmask generation. Each bit that differs from its default has a chance
    of being reset to the default value, with the probability growing with the number of bits
    that differ from their default values. Descriptor bits without a matching property are
    treated as being at their default when this number is computed.

    :param pte_descriptor: dictionary of default values for PTE bits
    :param page_properties_to_set: dictionary of page properties to set
    :param page_property_to_pte_bit_name: mapping from property names to PTE bit names
    :return: bitmask representing the PTE properties
    :raises: AssertionError if the properties dictionary is invalid
    :raises: KeyError if a property maps to a bit that is missing from `pte_descriptor`
    """
    # pylint: disable=too-many-locals  # justification: function is complex but clear

    is_randomized = page_properties_to_set['randomized']

    # First, translate the architecture-independent properties to architecture-specific ones
    arch_specific_properties: Dict[PTEBitName, bool] = {}
    for property_name, value in page_properties_to_set.items():
        if property_name == 'randomized':
            continue
        assert property_name in page_property_to_pte_bit_name, \
            f"Actor data property {property_name} is not supported on this architecture"
        bit_name, is_inverted = page_property_to_pte_bit_name[property_name]
        if is_inverted:
            value = not value
        arch_specific_properties[bit_name] = value

    # If randomization is requested, calculate the probability of a bit being set to default value
    # (an empty descriptor has no bits to randomize, and would make the formula divide by zero)
    probability_of_default = 0.0
    if is_randomized and pte_descriptor:
        # calculate the number of non-default bits; a descriptor bit without a requested
        # property keeps its default and hence does not count
        count_non_default = sum(
            1 for bit_name, (_, default_value) in pte_descriptor.items()
            if arch_specific_properties.get(bit_name, default_value) != default_value)

        # the probability grows with the number of non-default bits
        # we use a formula that maps the probability into the range [0.5, 0.75] to
        # avoid having too low or too high probabilities
        a = count_non_default
        b = len(pte_descriptor)
        probability_of_default = (a / (a + b)) * 0.5 + 0.5

    # create the mask
    mask: PTEMask = 0
    for bit_name, new_value in arch_specific_properties.items():
        # get the bit offset and default value from the PTE descriptor
        bit_offset, default_value = pte_descriptor[bit_name]

        # The new value of the bit is either directly taken from the properties dictionary,
        # or it is randomly set to the default value based on the probability calculated above.
        bit_value: int
        if not is_randomized or new_value == default_value:
            bit_value = new_value
        else:
            set_to_default = random.random() < probability_of_default
            if set_to_default:
                bit_value = default_value
            else:
                bit_value = new_value

        # now set the bit in the mask
        bit_value = 1 if bit_value else 0
        mask |= bit_value << bit_offset
    return mask


# ==================================================================================================
# Actor Class
# ==================================================================================================
class Actor:
    """
    An actor of a test case: a combination of an execution mode, a privilege level,
    page table properties of its data, and (once assigned) a code section.
    """

    mode: Final[ActorMode]
    privilege_level: Final[ActorPL]
    name: Final[ActorName]
    data_properties: Final[PTEMask]
    data_ept_properties: Final[PTEMask]
    observer: Final[bool]
    is_main: Final[bool]

    # set at most once, via assign_code_section
    _code_section: Optional[CodeSection] = None

    # ==============================================================================================
    # Constructors

    def __init__(self,
                 mode: ActorMode,
                 pl: ActorPL,
                 name: ActorName,
                 data_properties: PTEMask = 0,
                 data_ept_properties: PTEMask = 0,
                 is_observer: bool = False) -> None:
        """
        :param mode: execution mode of the actor
        :param pl: privilege level of the actor
        :param name: actor name; the actor named "main" is flagged as the main actor
        :param data_properties: PTE bitmask of the actor's data pages
        :param data_ept_properties: VM PTE bitmask of the actor's data pages
        :param is_observer: value stored in the `observer` attribute
        """
        self.name = name
        self.is_main = name == "main"
        self.mode = mode
        self.privilege_level = pl
        self.observer = is_observer
        self.data_properties = data_properties
        self.data_ept_properties = data_ept_properties

    @classmethod
    def from_dict(cls, actor_dict: ActorConf, target_desc: TargetDesc) -> 'Actor':
        """
        Build an actor from its configuration dictionary.
        :param actor_dict: dictionary of actor properties
        :param target_desc: target description; provides the PTE bit descriptors and mappings
        :return: Actor object
        :raises: ValueError if actor_dict is malformed
        """
        # actor mode of execution
        mode_name = actor_dict['mode']
        for label, candidate_mode in (("host", ActorMode.HOST), ("guest", ActorMode.GUEST)):
            if mode_name == label:
                mode = candidate_mode
                break
        else:
            raise ValueError(f"Invalid actor mode: {actor_dict['mode']}")

        # privilege level
        pl_name = actor_dict['privilege_level']
        for label, candidate_pl in (("kernel", ActorPL.KERNEL), ("user", ActorPL.USER)):
            if pl_name == label:
                pl = candidate_pl
                break
        else:
            raise ValueError(f"Invalid actor privilege level: {actor_dict['privilege_level']}")

        # PTE properties of the actor's data
        pte_mask = _create_pte_mask(
            target_desc.pte_bits,
            actor_dict["data_properties"],
            target_desc.page_property_to_pte_bit_name,
        )
        # EPTE (VM page table) properties of the actor's data
        vm_pte_mask = _create_pte_mask(
            target_desc.vm_pte_bits,
            actor_dict["data_ept_properties"],
            target_desc.page_property_to_vm_pte_bit_name,
        )

        # create the actor
        return Actor(
            mode,
            pl,
            actor_dict["name"],
            data_properties=pte_mask,
            data_ept_properties=vm_pte_mask,
            is_observer=actor_dict["observer"],
        )

    @classmethod
    def create_main(cls) -> 'Actor':
        """
        Build the main actor: a host-mode, kernel-level actor named "main"
        with all remaining properties left at their defaults.
        :return: Actor object
        """
        return Actor(ActorMode.HOST, ActorPL.KERNEL, "main")

    # ==============================================================================================
    # Public methods
    def assign_code_section(self, section: CodeSection) -> None:
        """
        Attach a code section to the actor.
        :param section: the code section to attach
        :raises: AssertionError if a section has already been assigned
        """
        assert self._code_section is None, f"Code section already assigned to actor {self.name}"
        self._code_section = section

    def code_section(self) -> CodeSection:
        """
        Return the code section attached to the actor.
        :raises: AssertionError if no section has been assigned yet
        """
        section = self._code_section
        assert section is not None, f"Code section not assigned to actor {self.name}"
        return section

    def get_id(self) -> ActorID:
        """
        Return the actor ID, which is the ID of the attached code section.
        :return: actor ID
        :raises: AssertionError if the code section or its ID has not been assigned
        """
        section = self._code_section
        assert section is not None, f"Code section not assigned to actor {self.name}"
        section_id = section.id_
        assert section_id is not None, \
            "assign_elf_data was not called on the child CodeSection"
        return section_id


================================================
FILE: rvzr/tc_components/instruction.py
================================================
"""
File: Collection of classes to represent instructions in a test case program and their components.

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from __future__ import annotations

from abc import ABC
from dataclasses import dataclass
from typing import List, Optional, Final, Literal, Union, Type, Tuple, get_args, cast
from typing_extensions import assert_never

from ..instruction_spec import OT, InstructionSpec, OperandSpec

FlagType = Literal['r', 'w', 'r/w', 'r/cw', 'undef']
RegSize = Literal[8, 16, 32, 64, 128, 256]


# ==================================================================================================
# Operands
# ==================================================================================================
@dataclass
class Operand(ABC):
    """ Base class for all operand kinds of an instruction """

    value: str
    """ The value of the operand (e.g., register name, memory address); stored in lower case """

    src: Final[bool]
    """ True if the operand is a source operand """

    dest: Final[bool]
    """ True if the operand is a destination operand """

    has_magic_value: bool = False
    """
    True if the operand value has a special meaning for the parent instruction.
    A special meaning normally implies a separate opcode or encoding,
    e.g., when a shift by 1 is encoded with its own opcode.
    """

    def __init__(self, value: str, src: bool, dest: bool):
        super().__init__()
        self.value = value.lower()
        self.src = src
        self.dest = dest

    @classmethod
    def from_fixed_spec(cls, spec: OperandSpec) -> AnyOperand:  # pylint: disable=r1710,r0911
        """
        Build the Operand subclass instance that matches a fixed operand specification.
        A specification is fixed when none of its fields offers multiple options
        (e.g., it lists at most one possible value); FLAGS specifications are exempt
        because their values describe the individual flags.
        :param spec: The operand specification
        :return: The Operand instance of the type that corresponds to the specification
        """
        # NOTE on pylint disable above:
        # - r1710 - mitigates a false positive due to assert_never
        # - r0911 - the large number of returns is a good design choice here

        kind = spec.type
        assert len(spec.values) <= 1 or kind == OT.FLAGS, \
            f"Attempt to call from_fixed_spec with a non-fixed spec {spec.values}"

        # an empty value list is represented by an empty operand value
        first_value = spec.values[0] if spec.values else ""

        if kind == OT.REG:
            return RegisterOp(first_value, spec.width, spec.src, spec.dest)
        if kind == OT.MEM:
            return MemoryOp(first_value, spec.width, spec.src, spec.dest)
        if kind == OT.IMM:
            return ImmediateOp(first_value, spec.width)
        if kind == OT.LABEL:
            return LabelOp(first_value)
        if kind == OT.AGEN:
            return AgenOp(first_value, spec.width)
        if kind == OT.FLAGS:
            # flags operands take the complete list of values, one per flag
            return FlagsOp(spec.values)
        if kind == OT.COND:
            return CondOp(first_value)
        assert_never(kind)
        # unreachable, hence no return


class RegisterOp(Operand):
    """ Register operand of an instruction; its width must be one of the RegSize values """

    width: Final[RegSize]

    def __init__(self, value: str, width: int, src: bool, dest: bool):
        supported_widths = get_args(RegSize)
        assert width in supported_widths, f"Invalid register width {width} for register {value}"
        self.width = cast(RegSize, width)
        super().__init__(value, src=src, dest=dest)


class MemoryOp(Operand):
    """ Memory operand of an instruction """

    width: Final[int]

    def __init__(self, address: str, width: int, src: bool, dest: bool) -> None:
        self.width = width
        super().__init__(address, src, dest)

    @staticmethod
    def _is_numeric_token(token: str) -> bool:
        """
        Check whether a token of an address expression is a numeric literal
        (decimal, 0x-prefixed hexadecimal, or 0b-prefixed binary).
        :param token: A non-empty, whitespace-stripped token of the address expression
        :return: True if the token is a number rather than a register name
        """
        if token.replace('0x', '').isdigit() or token.replace('0b', '').isdigit():
            return True
        # hexadecimal literals with a-f digits (e.g., 0xff) are not caught by isdigit()
        if token.startswith('0x'):
            try:
                int(token, 16)
            except ValueError:
                return False
            return True
        return False

    def get_base_register(self) -> Optional[RegisterOp]:
        """
        Get the base register of the memory operand, if any.
        E.g., for [rax + 8], return rax.

        The address is split on '+' and '-'; the first token that is neither empty
        nor a numeric literal is taken as the base register. The returned register
        is a source-only operand that reuses the width of the memory operand.
        :return: The base register, or None if there is no base register
        """
        addr = self.value.strip()

        # Split by + and - to find base register
        tokens = [t.strip() for t in addr.replace('-', '+').split('+')]

        # Skip empty tokens (produced by a leading sign or an empty address)
        # and numeric displacements; the first remaining token is the base register
        base = next((t for t in tokens if t and not self._is_numeric_token(t)), None)
        if base is None:
            return None
        return RegisterOp(base.lower(), self.width, True, False)


class ImmediateOp(Operand):
    """ Immediate operand of an instruction; always a source, never a destination """

    width: Final[int]

    def __init__(self, value: str, width: int) -> None:
        self.width = width
        super().__init__(value, src=True, dest=False)


class LabelOp(Operand):
    """ Label operand of an instruction; always a source, never a destination """

    def __init__(self, value: str) -> None:
        super().__init__(value, src=True, dest=False)


class AgenOp(Operand):
    """
    Address generation operand of an instruction (used by LEA instruction);
    always a source, never a destination
    """

    width: Final[int]

    def __init__(self, value: str, width: int) -> None:
        self.width = width
        super().__init__(value, src=True, dest=False)


class FlagsOp(Operand):
    """
    Flags operand of an instruction.
    Holds one access type per flag, in the order given by _flag_names.
    """

    _flag_values: Final[Tuple[str, ...]]
    _flag_names: Final[Tuple[str, ...]] = ("CF", "PF", "AF", "ZF", "SF", "TF", "IF", "DF", "OF")

    def __init__(self, value: Tuple[str, ...]) -> None:
        assert len(value) == len(self._flag_names)
        self._flag_values = value
        super().__init__("FLAGS", src=False, dest=False)

    def __str__(self) -> str:
        # one "<name><access type>" entry per flag, joined by '|'
        entries = [
            f"{self._flag_names[i]}{self._flag_values[i]}" for i in range(len(self._flag_names))
        ]
        return "FLAGS: " + "|".join(entries)

    def _get_flag_list(self, types: List[FlagType]) -> List[str]:
        """
        Collect the names of the flags whose access type is one of the given types.
        :param types: A list of flag types to include
        :return: A list of flag names, in the order of _flag_names
        """
        return [
            self._flag_names[idx]
            for idx, access in enumerate(self._flag_values)
            if access in types
        ]

    def get_flags_by_type(self, type_: Literal['read', 'write', 'overwrite', 'undef']) -> List[str]:
        """
        Get the names of the flags that are accessed in the given way.
        :param type_: Kind of access to select (read, write, overwrite, undef)
        :return: A list of flag names
        """
        selected: List[FlagType]
        if type_ == "read":
            selected = ['r', 'r/w', 'r/cw']
        elif type_ == "write":
            selected = ['w', 'r/w', 'r/cw']
        elif type_ == "overwrite":
            # only unconditional writes count as overwrites
            selected = ['w']
        elif type_ == "undef":
            selected = ['undef']
        else:
            assert_never(type_)

        return self._get_flag_list(selected)


@dataclass
class CondOp(Operand):
    """ Condition operand of an instruction; always a source, never a destination """

    def __init__(self, value: str) -> None:
        super().__init__(value, src=True, dest=False)


# ==================================================================================================
# Operand Modification Interface
# ==================================================================================================
_ValueModifiableOperand = Union[RegisterOp, MemoryOp, ImmediateOp, LabelOp, AgenOp, CondOp]
_SrcDestModifiableOperand = Union[RegisterOp, MemoryOp]
AnyOperand = Union[RegisterOp, MemoryOp, ImmediateOp, LabelOp, AgenOp, CondOp, FlagsOp]


def copy_op_with_value_modification(op: _ValueModifiableOperand,
                                    value: str) -> _ValueModifiableOperand:
    """
    Create a new operand of the same kind as `op` that carries a different value.
    All other properties (width, src, dest), where the kind has them, are taken from `op`.
    :param op: The operand to copy
    :param value: The new value of the operand
    :return: The modified operand
    """
    # operands with a width and configurable data flow
    if isinstance(op, RegisterOp):
        return RegisterOp(value, width=op.width, src=op.src, dest=op.dest)
    if isinstance(op, MemoryOp):
        return MemoryOp(value, width=op.width, src=op.src, dest=op.dest)

    # operands with a width only
    if isinstance(op, ImmediateOp):
        return ImmediateOp(value, width=op.width)
    if isinstance(op, AgenOp):
        return AgenOp(value, width=op.width)

    # operands that consist of the value alone
    if isinstance(op, LabelOp):
        return LabelOp(value)
    if isinstance(op, CondOp):
        return CondOp(value)
    assert_never(op)


def copy_op_with_flow_modification(op: _SrcDestModifiableOperand,
                                   src: Optional[bool] = None,
                                   dest: Optional[bool] = None) -> _SrcDestModifiableOperand:
    """
    Create a new operand with the same value and width as `op`,
    optionally overriding its data-flow properties.
    :param op: The operand to copy
    :param src: If not None, the new src property of the operand
    :param dest: If not None, the new dest property of the operand
    :return: The modified operand
    """
    # fall back to the properties of the original operand when no override is given
    new_src = op.src if src is None else src
    new_dest = op.dest if dest is None else dest

    if isinstance(op, RegisterOp):
        return RegisterOp(op.value, op.width, src=new_src, dest=new_dest)
    if isinstance(op, MemoryOp):
        return MemoryOp(op.value, op.width, src=new_src, dest=new_dest)
    assert_never(op)


# ==================================================================================================
# Instructions and Symbols
# ==================================================================================================
class Instruction:
    """ A single instruction of a test case program, together with its operands """

    # pylint: disable=too-many-instance-attributes
    # NOTE: This is a data container class, so it is expected to have many attributes
    # pylint: disable=too-many-public-methods
    # NOTE: This contains separate accessors for each operand type,
    # so it is expected to have many methods

    name: Final[str]
    """ name: The name of the instruction without any operands """
    category: Final[str]
    """ category: The category of the instruction, e.g., BASE-BINARY. The keyword matches
    the category in the instruction set description file (typically called base.json)"""

    is_control_flow: Final[bool]
    """ is_control_flow: If True, the instruction is a control flow instruction
    (branch, call, return, etc.) """
    is_instrumentation: Final[bool]
    """ is_instrumentation: If True, the instruction is an instrumentation instruction,
    which means that it was inserted by the generator to prevent faults or false positives """
    is_noremove: Final[bool]
    """ is_noremove: If True, the instruction should be skipped while doing minimization passes """
    is_from_template: bool = False
    """ is_from_template: If True, the instruction was directly copied from the template rather
    than being automatically created by the generator. """
    is_macro_placeholder: bool = False
    """ is_macro_placeholder: If True, this instruction is a part of a placeholder that will be
    replaced by a macro call in the executor/model; this instruction is expected to be a NOP.
    For most instructions, this is always False. """

    operands: Final[List[AnyOperand]]
    """ operands: List of explicit operands of the instruction """
    implicit_operands: Final[List[AnyOperand]]
    """ implicit_operands: List of implicit operands, which are not explicitly specified in the
    instruction but are used by the instruction. For example, flags operand in x86 instructions """

    # The value -1 marks a property that has not been assigned yet
    _line_num: int = -1  # line number in the source asm; access via line_num()
    _section_id: int = -1  # section ID in the object file; access via section_id()
    _section_offset: int = -1  # instruction offset in the section; access via section_offset()
    _size: int = -1  # size of the instruction in bytes; access via size()
    _inst_brief: str = ""  # cached brief representation of the instruction

    # ----------------------------------------------------------------------------------------------
    # Constructors

    def __init__(self,
                 name: str,
                 category: str = "",
                 is_control_flow: bool = False,
                 is_instrumentation: bool = False,
                 is_noremove: bool = False) -> None:
        self.operands = []
        self.implicit_operands = []

        self.name = name
        self.category = category
        self.is_control_flow = is_control_flow
        self.is_instrumentation = is_instrumentation
        self.is_noremove = is_noremove

    @classmethod
    def from_spec(cls: Type[Instruction],
                  sp: InstructionSpec,
                  is_instrumentation: bool = False,
                  is_noremove: bool = False) -> Instruction:
        """
        Create an instruction with NO OPERANDS from an instruction specification.
        :param sp: The instruction specification
        :param is_instrumentation: If True, the instruction is an instrumentation instruction
        :param is_noremove: If True, the instruction will be kept during minimization
        :return: The instruction
        """
        return cls(
            sp.name,
            sp.category,
            sp.is_control_flow,
            is_instrumentation=is_instrumentation,
            is_noremove=is_noremove)

    # ----------------------------------------------------------------------------------------------
    # Printing

    def __str__(self) -> str:
        # memory operands are wrapped into square brackets; other operands are printed as is
        rendered = []
        for op in self.operands:
            rendered.append("[" + op.value + "]" if isinstance(op, MemoryOp) else op.value)
        operand_str = ', '.join(rendered)
        return f"{self.name} {operand_str}"

    # ----------------------------------------------------------------------------------------------
    # Operand Management

    def _operand_pool(self, include_implicit: bool) -> List[AnyOperand]:
        """
        Select the operands to search: explicit operands, optionally followed by implicit ones.
        :param include_implicit: If True, append the implicit operands to the explicit ones
        :return: The list of operands, explicit first
        """
        if include_implicit:
            return self.operands + self.implicit_operands
        return self.operands

    def add_op(self, op: AnyOperand, implicit: bool = False) -> Instruction:
        """
        Append an operand to the instruction. Returns the instruction for chaining.
        :param op: Operand to add
        :param implicit: If True, the operand is added to the implicit operands
        :return: The instruction
        """
        target = self.implicit_operands if implicit else self.operands
        target.append(op)
        return self

    def has_mem_operand(self, include_implicit: bool) -> bool:
        """
        Check if the instruction has a memory operand.
        :param include_implicit: If True, include implicit operands in the check
        :return: True if the instruction has a memory operand, False otherwise
        """
        return any(isinstance(op, MemoryOp) for op in self._operand_pool(include_implicit))

    def has_write(self, include_implicit: bool = False) -> bool:
        """
        Check if the instruction has a memory operand that writes to memory.
        :param include_implicit: If True, include implicit operands in the check
        :return: True if the instruction has a memory operand that writes to memory, False otherwise
        """
        return any(
            isinstance(op, MemoryOp) and op.dest for op in self._operand_pool(include_implicit))

    def has_read(self, include_implicit: bool = False) -> bool:
        """
        Check if the instruction has a memory operand that reads from memory.
        :param include_implicit: If True, include implicit operands in the check
        :return: True if the instruction has a memory operand that reads memory, False otherwise
        """
        return any(
            isinstance(op, MemoryOp) and op.src for op in self._operand_pool(include_implicit))

    def get_all_operands(self) -> List[AnyOperand]:
        """
        Get a new list with all operands of the instruction:
        the explicit operands followed by the implicit ones.
        :return: A list of all operands
        """
        return [*self.operands, *self.implicit_operands]

    def get_src_operands(self, include_implicit: bool = False) -> List[AnyOperand]:
        """
        Get a list of source operands of the instruction.
        :param include_implicit: If True, include implicit operands in the list
        :return: A list of source operands
        """
        return [op for op in self._operand_pool(include_implicit) if op.src]

    def get_dest_operands(self, include_implicit: bool = False) -> List[AnyOperand]:
        """
        Get a list of destination operands of the instruction.
        :param include_implicit: If True, include implicit operands in the list
        :return: A list of destination operands
        """
        return [op for op in self._operand_pool(include_implicit) if op.dest]

    def get_mem_operands(self,
                         include_explicit: bool = True,
                         include_implicit: bool = False) -> List[MemoryOp]:
        """
        Get a list of memory operands of the instruction.
        At least one of the two include_* flags must be set.
        :param include_explicit: If True, include explicit operands in the list
        :param include_implicit: If True, include implicit operands in the list
        :return: A list of memory operands, explicit ones first
        """
        assert include_explicit or include_implicit, "At least one of include_explicit or " \
                                                     "include_implicit must be True"
        pool: List[AnyOperand] = []
        if include_explicit:
            pool.extend(self.operands)
        if include_implicit:
            pool.extend(self.implicit_operands)
        return [op for op in pool if isinstance(op, MemoryOp)]

    def get_flags_operand(self) -> Optional[FlagsOp]:
        """
        Get the flags operand of the instruction.
        Implicit operands are searched before the explicit ones.
        :return: The flags operand, or None if the instruction does not have one
        """
        for op in self.implicit_operands + self.operands:
            if isinstance(op, FlagsOp):
                return op
        return None

    def get_reg_operands(self, include_implicit: bool = False) -> List[RegisterOp]:
        """
        Get a list of register operands of the instruction.
        :param include_implicit: If True, include implicit operands in the list
        :return: A list of register operands
        """
        return [op for op in self._operand_pool(include_implicit) if isinstance(op, RegisterOp)]

    def get_cond_operand(self) -> Optional[CondOp]:
        """
        Get the condition operand of the instruction.
        :return: The condition operand, or None if the instruction does not have one
        """
        # not checking implicit operands -> conditions must be explicit
        return next((op for op in self.operands if isinstance(op, CondOp)), None)

    def get_label_operand(self) -> Optional[LabelOp]:
        """
        Get the label operand of the instruction.
        :return: The label operand, or None if the instruction does not have one
        """
        # not checking implicit operands -> labels must be explicit
        return next((op for op in self.operands if isinstance(op, LabelOp)), None)

    def get_imm_operands(self, include_implicit: bool = False) -> List[ImmediateOp]:
        """
        Get a list of immediate operands of the instruction.
        :param include_implicit: If True, include implicit operands in the list
        :return: A list of immediate operands
        """
        return [op for op in self._operand_pool(include_implicit) if isinstance(op, ImmediateOp)]

    def get_agen_operands(self) -> List[AgenOp]:
        """
        Get a list of address generation operands of the instruction.
        :return: A list of address generation operands
        """
        # not checking implicit operands -> agen must be explicit
        return [op for op in self.operands if isinstance(op, AgenOp)]

    # ----------------------------------------------------------------------------------------------
    # Instruction in Assembly
    def assign_line_num(self, line_num: int) -> None:
        """ Record the line of the source file that holds the instruction (can be set once). """
        is_unassigned = self._line_num == -1
        assert is_unassigned, "Line number is already assigned"
        self._line_num = line_num

    def line_num(self) -> int:
        """ Get the line number in the source file where the instruction is located. """
        assigned_line = self._line_num
        assert assigned_line != -1, "Line number is not assigned"
        return assigned_line

    # ----------------------------------------------------------------------------------------------
    # Instruction in Binary
    def assign_binary_properties(self, section_id: int, offset: int, size: int) -> None:
        """
        Record where the instruction ended up in the binary file after it has been assembled.
        Only the section ID is checked to detect a repeated assignment.
        :param section_id: The ID of the section in the object file where the instruction is located
        :param offset: The section offset of the instruction in the object file
        :param size: The size of the instruction in bytes, after it has been assembled
        """
        assert self._section_id == -1, "Instruction properties are already assigned \n" \
            "    (assign_binary_properties() can only be called once)"
        self._section_id, self._section_offset, self._size = section_id, offset, size

    def section_id(self) -> int:
        """ Get the ID of the section in the object file where the instruction is located. """
        assigned_id = self._section_id
        assert assigned_id != -1, "Instruction properties are not assigned \n" \
            "    (assign_binary_properties() must be called before section_id() can be used)"
        return assigned_id

    def section_offset(self) -> int:
        """ Get the section offset of the instruction in the object file. """
        assigned_offset = self._section_offset
        assert assigned_offset != -1, "Instruction properties are not assigned \n" \
            "    (assign_binary_properties() must be called before section_offset() can be used)"
        return assigned_offset

    def size(self) -> int:
        """ Get the size of the instruction in bytes. """
        assigned_size = self._size
        assert assigned_size != -1, "Instruction properties are not assigned \n" \
            "    (assign_binary_properties() must be called before size() can be used)"
        return assigned_size


def copy_inst_with_modification(instruction: Instruction,
                                name: Optional[str] = None,
                                category: Optional[str] = None,
                                is_control_flow: Optional[bool] = None,
                                is_instrumentation: Optional[bool] = None,
                                is_noremove: Optional[bool] = None) -> Instruction:
    """
    Create a new instruction from an existing one, optionally overriding some of its properties.
    Properties passed as None are taken from the original instruction. The operand lists of
    the new instruction are new lists that reference the same operand objects.
    :param instruction: The instruction to copy
    :param name: If not None, the new name of the instruction
    :param category: If not None, the new category of the instruction
    :param is_control_flow: If not None, the new is_control_flow property of the instruction
    :param is_instrumentation: If not None, the new is_instrumentation property of the instruction
    :param is_noremove: If not None, the new is_noremove property of the instruction
    :return: The new modified instruction
    """
    original = instruction
    new_inst = Instruction(
        original.name if name is None else name,
        original.category if category is None else category,
        original.is_control_flow if is_control_flow is None else is_control_flow,
        original.is_instrumentation if is_instrumentation is None else is_instrumentation,
        original.is_noremove if is_noremove is None else is_noremove,
    )

    # properties that cannot be overridden are carried over unchanged
    new_inst.is_from_template = original.is_from_template
    new_inst.is_macro_placeholder = original.is_macro_placeholder
    new_inst.operands.extend(original.operands)
    new_inst.implicit_operands.extend(original.implicit_operands)

    # location of the instruction in the source asm and in the binary
    new_inst._line_num = original._line_num  # pylint: disable=protected-access
    new_inst._section_id = original._section_id  # pylint: disable=protected-access
    new_inst._section_offset = original._section_offset  # pylint: disable=protected-access
    new_inst._size = original._size  # pylint: disable=protected-access

    return new_inst


================================================
FILE: rvzr/tc_components/test_case_binary.py
================================================
"""
File: Classes representing assembled test case code in a binary form (ELF object file).

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from __future__ import annotations

from typing import TYPE_CHECKING, Dict, List, NamedTuple, Final, Optional

from .instruction import Instruction
from ..logs import error

if TYPE_CHECKING:
    from .test_case_code import TestCaseProgram

SectionID = int
SymbolType = int
SymbolOffset = int
MacroArgument = int
InstructionMap = Dict[SectionID, Dict[int, Instruction]]


class SymbolTableEntry(NamedTuple):
    """
    Symbol in a test case symbol table.

    The field order (sid, offset, type_, arg) is significant:
    TestCaseBinary.save_rcbf unpacks entries positionally and writes the four fields
    to the output file in exactly this order.
    """

    sid: SectionID
    """ The ID of the section that contains the symbol """

    offset: SymbolOffset
    """ offset: The offset of the symbol in the actor's section """

    # save_rcbf treats entries with type_ == 0 as function symbols and all other entries
    # as macro symbols; a negative type_ is reported there as an error
    type_: SymbolType
    """ type_: The type of the symbol """

    arg: MacroArgument
    """ arg: The argument of the symbol """


SymbolTable = List[SymbolTableEntry]


class TestCaseBinary:
    """
    A class representing the object ELF file (i.e., compiled assembly) of a test case program
    """

    obj_path: Final[str]
    """ Path to the object file generated from the asm_path """

    _symbol_table: Optional[List[SymbolTableEntry]] = None
    """ List of symbols in the test case program """

    _instruction_map: Optional[InstructionMap] = None
    """ Dictionary mapping section ID + offset to the corresponding Instruction object """

    _parent: TestCaseProgram  # The parent test case program
    _obj_is_assembled: bool = False  # Flag indicating whether the object file has been assembled

    def __init__(self, obj_path: str, parent: TestCaseProgram):
        self.obj_path = obj_path
        self._parent = parent

    def mark_as_assembled(self) -> None:
        """ Mark the object file as assembled """
        self._obj_is_assembled = True

    def to_bytes(self, padded_section_size: int = 0, padding_byte: bytes = b'') -> bytes:
        """ Return the code of all actors' sections, concatenated in the order returned by
        the parent's get_actors(sorted_=True).
        Optionally, pad each section to a specified size with a specified padding byte.

        :param padded_section_size: The size to pad each section to; 0 (default) disables padding
        :param padding_byte: The byte to use for padding; must be a single byte if padding is used
        :return: A single byte string with the (optionally padded) sections concatenated
        :raises: AssertionError if the object file has not been assembled, if padding is requested
                 without a single padding byte, or if a section is larger than the padded size
        """
        assert self._obj_is_assembled, \
            "Attempting to read sections from an non-assembled object file"
        assert padded_section_size == 0 or len(padding_byte) == 1, \
            "padding_byte must be specified as a single byte if pad_to_size is set"

        chunks: List[bytes] = []
        with open(self.obj_path, 'rb') as bin_file:
            for actor in self._parent.get_actors(sorted_=True):

                # Read the section from the object file
                section_data = actor.code_section().get_elf_data()
                offset = section_data["offset"]
                size = section_data["size"]

                bin_file.seek(offset)
                chunks.append(bin_file.read(size))

                # Apply padding; a padded size of 0 means that no padding was requested,
                # so the size check must not be applied in that case
                if padded_section_size == 0:
                    continue
                assert padded_section_size >= size, \
                    "Padded section size is less than to the original section size"
                chunks.append(padding_byte * (padded_section_size - size))

        return b''.join(chunks)

    def get_macro_offset(self, macro_type: int) -> int:
        """ Return the offset of the macro of the given type in its section.
        If there are multiple macros of the same type, the first one is returned.
        :param macro_type: The type of the macro symbol to look for
        :return: The offset of the macro in its section; -1 if not found
        """
        assert self._symbol_table is not None, \
            "assign_elf_data() has not been called on this object"
        for symbol in self._symbol_table:
            if symbol.type_ == macro_type:
                return symbol.offset
        return -1

    def assign_elf_data(self, symbol_table: List[SymbolTableEntry],
                        instruction_map: InstructionMap) -> None:
        """
        Assign the symbol table and instruction map based on the data parsed from the ELF file
        (normally assigned by an ELFParser instance). Can be called only once.
        :param symbol_table: The symbols of the test case program
        :param instruction_map: Mapping of section ID + offset to the Instruction object
        """
        assert self._symbol_table is None, "Attempting to reassign symbol table"
        assert self._instruction_map is None, "Attempting to reassign instruction map"
        self._symbol_table = symbol_table
        self._instruction_map = instruction_map

    def symbol_table(self) -> List[SymbolTableEntry]:
        """ Return the symbol table of the test case program """
        assert self._symbol_table is not None, "Symbol table has not been populated"
        return self._symbol_table

    def instruction_map(self) -> InstructionMap:
        """ Return the instruction map of the test case program """
        assert self._instruction_map is not None, "Instruction map has not been populated"
        return self._instruction_map

    def save_rcbf(self, path: str) -> None:
        """
        Save the test case binary in the RCBF format
        (see docs/devel/binary-formats.md for details).

        The file consists of the following parts, with every number encoded as
        an 8-byte little-endian unsigned integer:
        header (number of actors, number of symbols), per-actor metadata, symbol table,
        per-section metadata, and finally the raw code of each actor's section.
        :param path: The path to save the RCBF file to
        """
        assert self._obj_is_assembled, "Attempting to save an un-assembled object file"
        actors = self._parent.get_actors(sorted_=True)
        symbol_table = self.symbol_table()

        # sanity check
        if any(symbol.type_ < 0 for symbol in symbol_table):
            error("attempt to use template as a test case")

        def u64(*values: int) -> bytes:
            """ Encode each value as an 8-byte little-endian unsigned integer """
            return b''.join(v.to_bytes(8, byteorder='little') for v in values)

        # symbol table order: first functions sorted by argument,
        # then macros sorted by section ID + offset
        function_symbols = sorted((s for s in symbol_table if s.type_ == 0), key=lambda s: s.arg)
        macro_symbols = sorted((s for s in symbol_table if s.type_ != 0),
                               key=lambda s: (s.sid, s.offset))

        # write the RCBF file
        with open(path, 'wb') as f:
            # header: n_actors, n_symbols
            f.write(u64(len(actors), len(symbol_table)))

            # actor metadata
            for actor in actors:
                f.write(
                    u64(
                        actor.get_id(),
                        actor.mode.value,
                        actor.privilege_level.value,
                        actor.data_properties,
                        actor.data_ept_properties,
                        0,  # unused
                    ))

            # symbol table
            for symbol in function_symbols + macro_symbols:
                f.write(u64(symbol.sid, symbol.offset, symbol.type_, symbol.arg))

            # section metadata
            for actor in actors:
                section_data = actor.code_section().get_elf_data()
                f.write(u64(section_data["id"], section_data["size"], 0))

            # code
            with open(self.obj_path, 'rb') as bin_file:
                for actor in actors:
                    section_data = actor.code_section().get_elf_data()
                    bin_file.seek(section_data["offset"])  # type: ignore
                    f.write(bin_file.read(section_data["size"]))


================================================
FILE: rvzr/tc_components/test_case_code.py
================================================
"""
File: Class representing test case code and its components.

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from __future__ import annotations

from typing import List, Dict, Optional, Final, TypedDict, Generator as GeneratorType
from dataclasses import dataclass
import shutil

from .actor import Actor, ActorID, ActorName, ActorPL, ActorMode
from .instruction import Instruction
from .test_case_binary import TestCaseBinary


# ==================================================================================================
# Program Structure: CodeSection -> Function -> BasicBlock -> InstructionNode -> Instruction
# ==================================================================================================
@dataclass
class InstructionNode:
    """
    Node of the doubly-linked list that makes up a basic block.
    Each node wraps exactly one instruction and links to its neighbours.
    """
    instruction: Final[Instruction]
    """ The instruction carried by this node """

    parent: Final[BasicBlock]
    """ The basic block that contains this node """

    next: Optional[InstructionNode] = None
    """ The node that follows this one in the basic block, if any """

    previous: Optional[InstructionNode] = None
    """ The node that precedes this one in the basic block, if any """

    def __init__(self, instruction: Instruction, parent: BasicBlock):
        # A new node always starts unlinked; the links are set by the BasicBlock on insertion
        self.previous = None
        self.next = None
        self.parent = parent
        self.instruction = instruction

    def __str__(self) -> str:
        wrapped = self.instruction
        return str(wrapped)


class BasicBlock:
    """ A labeled sequence of instructions, stored as a doubly-linked list of InstructionNode """

    name: Final[str]
    """ Label of the basic block """

    parent: Final[Optional[Function]]
    """ Function that contains the basic block (None if the block is free-standing) """

    successors: List[BasicBlock]
    """ Basic blocks that may execute right after this one """

    terminators: List[Instruction]
    """ Terminator instructions of the basic block """

    is_exit: Final[bool]
    """ True if the basic block should be treated as the exit block of a function """

    _start: Optional[InstructionNode] = None
    _end: Optional[InstructionNode] = None

    def __init__(self, name: str, parent: Optional[Function] = None, is_exit: bool = False):
        self.successors = []
        self.terminators = []
        self.name = name
        self.parent = parent
        self.is_exit = is_exit

    def __str__(self) -> str:
        return self.name

    def __len__(self) -> int:
        """ Number of instructions in the basic block """
        return sum(1 for _ in self.iter_nodes())

    def __iter__(self) -> GeneratorType[Instruction, None, None]:
        """ Default iterator: yields the instructions (not the nodes) in order """
        for node in self.iter_nodes():
            yield node.instruction

    def iter_nodes(self) -> GeneratorType[InstructionNode, None, None]:
        """ Non-default iterator: yields the linked-list nodes in order """
        node = self._start
        while node is not None:
            yield node
            node = node.next

    def get_owner(self) -> Actor:
        """ Get the actor that owns the basic block (via the parent function's section) """
        function = self.parent
        assert function is not None, "Basic block does not have a parent function"
        return function.parent.owner

    # ----------------------------------------------------------------------------------------------
    # Instruction insertion and deletion
    def insert_after(self, position: Optional[InstructionNode], inst: Instruction) -> None:
        """ Insert an instruction right after a given node of the basic block
        :param position: The node after which the new instruction is placed;
                         if None, the instruction is appended to the end of the basic block
        :param inst: The instruction to insert
        :return: None
        :raises ValueError: If `position` belongs to a different basic block
        """
        new_node = InstructionNode(inst, self)

        # Without an explicit position, the anchor is the current last node
        anchor = position if position is not None else self._end

        # No anchor at all: the block is empty, so the new node becomes its only element
        if anchor is None:
            self._start = new_node
            self._end = new_node
            return

        if anchor.parent != self:
            raise ValueError("`position` not found in the basic block")

        # Splice the new node between the anchor and its former successor
        follower = anchor.next
        new_node.previous = anchor
        anchor.next = new_node
        if follower is None:
            self._end = new_node
        else:
            new_node.next = follower
            follower.previous = new_node

    def insert_before(self, position: Optional[InstructionNode], inst: Instruction) -> None:
        """ Insert an instruction right before a given node of the basic block
        :param position: The node before which the new instruction is placed;
                         if None, the instruction is prepended to the start of the basic block
        :param inst: The instruction to insert
        :return: None
        :raises ValueError: If `position` belongs to a different basic block
        """
        new_node = InstructionNode(inst, self)

        # Without an explicit position, the anchor is the current first node
        anchor = position if position is not None else self._start

        # No anchor at all: the block is empty, so the new node becomes its only element
        if anchor is None:
            self._start = new_node
            self._end = new_node
            return

        if anchor.parent != self:
            raise ValueError(f"instruction {anchor} belongs to {anchor.parent}, not {self}")

        # Splice the new node between the anchor and its former predecessor
        leader = anchor.previous
        new_node.next = anchor
        anchor.previous = new_node
        if leader is None:
            self._start = new_node
        else:
            new_node.previous = leader
            leader.next = new_node

    def delete(self, target: InstructionNode) -> None:
        """
        Unlink a node from the basic block.
        The links stored in the removed node itself are left untouched.
        :param target: The node to delete
        :return: None
        :raises ValueError: If the node does not belong to the basic block
        """
        if target.parent != self:
            raise ValueError("Error deleting an instruction from a BB; instruction not found")

        before, after = target.previous, target.next

        # Fix the forward link (or the block start if the target was the first node)
        if before is None:
            self._start = after
        else:
            before.next = after

        # Fix the backward link (or the block end if the target was the last node)
        if after is None:
            self._end = before
        else:
            after.previous = before

    # ----------------------------------------------------------------------------------------------
    # Instruction access
    def get_first(self, exclude_macros: bool = False) -> Optional[InstructionNode]:
        """
        Get the first node of the basic block
        :param exclude_macros: If True, skip the leading instructions named "macro"
        :return: The first (non-macro) node, or None if there is no such node
        """
        node = self._start
        if exclude_macros:
            while node is not None and node.instruction.name == "macro":
                node = node.next
        return node

    def get_last(self) -> Optional[InstructionNode]:
        """ Get the last node of the basic block
        :return: The last node or None if the basic block is empty
        """
        return self._end

    def find_instruction_node(self, inst: Instruction) -> Optional[InstructionNode]:
        """
        Find the first node of the basic block whose instruction equals a given instruction
        :param inst: The instruction to look for
        :return: The matching node or None if there is no match
        """
        matches = (node for node in self.iter_nodes() if node.instruction == inst)
        return next(matches, None)


class Function:
    """
    Function in the test case code.
    Internally, a function is an ordered list of basic blocks with the following properties:
    * The basic blocks are kept in the order of their appearance in the assembly code.
    * The last basic block is always the exit block of the function; it is created together with
      the function and is expected to contain little-to-no instructions. IMPORTANT: The exit
      block is NOT visited when iterating over the function, it is NOT counted in the function
      length, and it is NOT reachable via indexing.
    """

    name: Final[str]
    """ Name of the function; same as the function label in the assembly code """

    parent: Final[CodeSection]
    """ The code section that contains the function """

    _all_bb: List[BasicBlock]
    """ All basic blocks of the function in asm order; the exit block is always the last one """

    def __init__(self, name: str, parent: CodeSection):
        self.name = name
        self.parent = parent
        exit_label = ".exit_" + name.removeprefix('.function_')
        self._all_bb = [BasicBlock(exit_label, parent=self, is_exit=True)]

    def __len__(self) -> int:
        """ Number of basic blocks in the function, not counting the exit block """
        body = self._all_bb[:-1]
        return len(body)

    def __iter__(self) -> GeneratorType[BasicBlock, None, None]:
        """ Iterate over the basic blocks of the function, skipping the exit block """
        yield from self._all_bb[:-1]

    def __getitem__(self, id_: int) -> BasicBlock:
        """ Get a basic block by its index among the non-exit basic blocks """
        assert len(self._all_bb) > 1, "Function has no non-exit basic blocks"
        return self._all_bb[:-1][id_]

    def append(self, bb: BasicBlock) -> None:
        """ Add a basic block as the last non-exit block (i.e., right before the exit block) """
        self._all_bb.insert(-1, bb)

    def extend(self, bb_list: List[BasicBlock]) -> None:
        """ Add a list of basic blocks after the existing ones, right before the exit block """
        # empty slice located just before the last element (the exit block)
        self._all_bb[-1:-1] = bb_list

    def get_first_bb(self) -> BasicBlock:
        """ Get the first basic block of the function.
        For a function without non-exit basic blocks, this is the exit block.
        """
        return self._all_bb[0]

    def get_exit_bb(self) -> BasicBlock:
        """ Get the exit basic block of the function, i.e., the last block in the list. """
        last_bb = self._all_bb[-1]
        assert last_bb.is_exit, "The last basic block is not marked as an exit block"
        return last_bb

    def get_owner(self) -> Actor:
        """ Get the actor that owns the section containing the function """
        section = self.parent
        return section.owner


class _ELFSectionData(TypedDict):
    """
    Data of a section in the ELF file.
    This is the shape of the dictionary returned by CodeSection.get_elf_data().
    """
    offset: int  # offset of the section in the object file
    size: int  # size of the section in the object file
    id: int  # ID of the section; must match the ID in the ELF file


class CodeSection:
    """
    Section in the test case code.
    A section is an ordered list of functions that belongs to a single actor;
    the functions are kept in the order in which they were appended.
    """

    name: Final[str]
    """ Name of the section; copied from the name of the owner at creation """

    owner: Actor
    """ Actor that owns the section """

    id_: Optional[int] = None
    """ ID of the section; must match the ID in the ELF file """

    _functions: Final[List[Function]]  # Functions that belong to the section
    _bin_offset: Optional[int] = None  # Offset of the section in the object file
    _bin_size: Optional[int] = None  # Size of the section in the object file

    def __init__(self, owner: Actor):
        self.name = owner.name
        self.owner = owner
        owner.assign_code_section(self)
        self._functions = []

    def __iter__(self) -> GeneratorType[Function, None, None]:
        """ Iterate over the functions of the section """
        yield from self._functions

    def __len__(self) -> int:
        """ Number of functions in the section """
        return len(self._functions)

    def __getitem__(self, id_: int) -> Function:
        """ Get a function by its index """
        return self._functions[id_]

    def append(self, func: Function) -> None:
        """ Add a function to the end of the section; function names must be unique """
        assert all(known.name != func.name for known in self._functions), \
            f"Function {func.name} already exists in the section"
        self._functions.append(func)

    def assign_elf_data(self, offset: int, size: int, id_: int) -> None:
        """ Record the ELF data (offset, size, ID) of the section; allowed only once """
        not_assigned_yet = \
            self._bin_offset is None and self._bin_size is None and self.id_ is None
        assert not_assigned_yet, "ELF data is already assigned"
        self.id_ = id_
        self._bin_size = size
        self._bin_offset = offset

    def get_elf_data(self) -> _ELFSectionData:
        """ Get the previously assigned ELF data of the section """
        offset, size, section_id = self._bin_offset, self._bin_size, self.id_
        assert offset is not None and size is not None \
            and section_id is not None, "ELF data is not assigned"
        return {"offset": offset, "size": size, "id": section_id}


# ==================================================================================================
# All Program Information Combined
# ==================================================================================================
# Label of the special basic block that terminates the test case
# (used as the name of TestCaseProgram._tc_exit_bb)
TC_EXIT_LABEL = ".test_case_exit"


class TestCaseProgram:
    """
    A test case program: the assembly file, the (optional) object file produced from it,
    and the structured representation of its code (actors and their code sections).
    """

    generator_seed: int
    """ Seed used to generate the test case program """

    _asm_path: str  # Path to the assembly file with the test case program
    _obj: Optional[TestCaseBinary] = None  # Container of the object file, once assigned
    _obj_is_assembled: bool = False  # Set to True once the object file has been assembled

    _sections: Final[List[CodeSection]]  # Code sections of the test case program
    _actors: Dict[ActorName, Actor]  # Actors of the test case program, indexed by name
    _tc_exit_bb: Final[BasicBlock]  # Special basic block that terminates the test case

    def __init__(self, asm_path: str, seed: int = 0):
        self.generator_seed = seed
        self._asm_path = asm_path
        self._tc_exit_bb = BasicBlock(TC_EXIT_LABEL)

        # every test case starts with the main actor and its (empty) code section
        main_actor = Actor.create_main()
        self._actors = {"main": main_actor}
        self._sections = [CodeSection(main_actor)]

    def __len__(self) -> int:
        """ Number of sections in the test case """
        return len(self._sections)

    def __getitem__(self, id_: int) -> CodeSection:
        """ Get a section by its index """
        return self._sections[id_]

    def get_tc_exit_bb(self) -> BasicBlock:
        """ Get the special basic block that terminates the test case """
        return self._tc_exit_bb

    # ----------------------------------------------------------------------------------------------
    # Iterators
    def __iter__(self) -> GeneratorType[CodeSection, None, None]:
        """ Default iterator: yields the sections of the test case """
        yield from self._sections

    def iter_functions(self) -> GeneratorType[Function, None, None]:
        """ Non-default iterator: yields all functions of the test case, section by section """
        for section in self._sections:
            yield from section

    def iter_basic_blocks(self) -> GeneratorType[BasicBlock, None, None]:
        """
        Non-default iterator:
        yields all basic blocks of the test case, visiting the sections, then their functions,
        then the basic blocks of each function in their stored order
        """
        for function in self.iter_functions():
            yield from function

    # ----------------------------------------------------------------------------------------------
    # ELF file management
    def assign_obj(self, obj_path: str) -> None:
        """
        Attach an object file generated from the assembly file
        :param obj_path: Path to the object file
        :return: None
        :raises AssertionError: If an object file has been assigned before
        """
        assert self._obj is None, "Object file is already assigned"
        self._obj = TestCaseBinary(obj_path, self)

    def mark_as_assembled(self) -> None:
        """ Record that the assigned object file has been assembled """
        obj = self._obj
        assert obj is not None, "Object file is not assigned"
        self._obj_is_assembled = True
        obj.mark_as_assembled()

    def get_obj(self) -> TestCaseBinary:
        """
        Get the assigned TestCaseBinary, i.e., the container of the object file
        generated from the test case program
        """
        obj = self._obj
        assert obj is not None, "Object file is not assigned"
        return obj

    # ----------------------------------------------------------------------------------------------
    # ASM file management
    def reassign_asm_file(self, asm_path: str) -> None:
        """ Point the test case to a different assembly file; not allowed after assembling """
        assert not self._obj_is_assembled, \
            "Attempting to reassign the asm file after it has been assembled"
        self._asm_path = asm_path

    def asm_path(self) -> str:
        """ Get the path to the assigned assembly file """
        return self._asm_path

    def save(self, path: str) -> None:
        """
        Copy the assembly file of the test case to a new location.
        :param path: Destination path
        :return: None
        """
        source = self._asm_path
        shutil.copy2(source, path)

    # ----------------------------------------------------------------------------------------------
    # Actor list management
    def add_actor_with_section(self, actor: Actor, allow_overwrite: bool = False) -> None:
        """
        Register an actor in the test case and make sure it has a code section.

        * A new (non-main) actor receives a fresh, empty CodeSection.
        * The main actor always takes over the first section of the test case.
        * If a non-main actor with the same name is already registered and `allow_overwrite`
          is True, the new actor replaces the old one and takes over its section.

        :param actor: The actor to add
        :param allow_overwrite: Whether an already registered actor may be replaced
        :return: None
        :raises ValueError: If the actor is already registered and `allow_overwrite` is False
        """
        already_registered = actor.name in self._actors
        if already_registered and not allow_overwrite:
            raise ValueError(f"Actor {actor.name} already exists in the test case")

        is_main = actor.is_main
        if is_main:
            assert actor.mode == ActorMode.HOST
            assert actor.privilege_level == ActorPL.KERNEL

        self._actors[actor.name] = actor

        # New actor: create a section for it
        if not is_main and not already_registered:
            self._sections.append(CodeSection(actor))
            return

        # Update of the main actor or of an existing actor: hand over the existing section
        section = self._sections[0] if is_main else self.find_section(actor.name)
        section.owner = actor
        actor.assign_code_section(section)

    def get_actors(self, sorted_: bool = False) -> List[Actor]:
        """
        Get a list of actors.
        :param sorted_: Whether to sort the actors by ID
        :return: A new list with the actors
        """
        actors = list(self._actors.values())
        if sorted_:
            actors.sort(key=lambda actor: actor.get_id())
        return actors

    def find_actor(self,
                   name: Optional[ActorName] = None,
                   actor_id: Optional[ActorID] = None) -> Actor:
        """
        Select an actor either by name or by ID.
        :param name: The name of the actor
        :param actor_id: The ID of the actor
        :return: The actor
        :raises KeyError: If an actor with the given name/ID does not exist in the test case
        :raises AssertionError: If neither name nor ID is provided or if both are provided
        """
        # check interface
        assert name is not None or actor_id is not None, "Either name or ID must be provided"
        assert name is None or actor_id is None, "Only one of name or ID should be provided"

        # select by name
        if name is not None:
            by_name = self._actors.get(name)
            if by_name is None:
                raise KeyError(f"Actor {name} does not exist in the test case")
            return by_name

        # select by ID
        by_id = next((a for a in self._actors.values() if a.get_id() == actor_id), None)
        if by_id is None:
            raise KeyError(f"Actor with ID {actor_id} does not exist in the test case")
        return by_id

    def n_actors(self) -> int:
        """
        Get the number of actors in the test case.
        :return: The number of actors
        """
        return len(self._actors)

    # ==============================================================================================
    # Function and section management
    def get_sections(self) -> List[CodeSection]:
        """ Get the list of sections in the test case (the internal list, not a copy) """
        return self._sections

    def find_section(self, name: str) -> CodeSection:
        """
        Look up a section by name
        :param name: The name of the section
        :return: The first section with a matching name
        :raises KeyError: If the section does not exist in the test case
        """
        for section in self._sections:
            if section.name == name:
                return section
        raise KeyError(f"Section {name} does not exist in the test case")

    def find_function(self, name: str) -> Function:
        """
        Look up a function by name
        :param name: The name of the function
        :return: The first function with a matching name
        :raises KeyError: If the function does not exist in the test case
        """
        for function in self.iter_functions():
            if function.name == name:
                return function
        raise KeyError(f"Function {name} does not exist in the test case")


================================================
FILE: rvzr/tc_components/test_case_data.py
================================================
"""
File: Classes representing test case data (aka input), as well as related and derived classes.

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from __future__ import annotations
from typing import TYPE_CHECKING, Tuple, Optional, List
import numpy as np

from ..sandbox import SandboxLayout, DataArea

if TYPE_CHECKING:
    from .actor import ActorID

# Type alias: input identifiers are plain integers
InputID = int

# ==================================================================================================
# Per-actor input data
# ==================================================================================================

# _ActorInput is a structured data type that describes the input of a single actor.
# It has one field per data area; each field is an array of 64-bit unsigned integers
# whose length is the byte size of the corresponding data area divided by 8.
_ActorInput = np.dtype(
    [
        (field_name, np.uint64, SandboxLayout.data_area_size(data_area) // 8)
        for field_name, data_area in (
            ('main', DataArea.MAIN),
            ('faulty', DataArea.FAULTY),
            ('gpr', DataArea.GPR),
            ('simd', DataArea.SIMD),
            ('padding', DataArea.OVERFLOW_PAD),
        )
    ],
    align=False,
)

# Size (in bytes) of the per-actor input, not counting the 'padding' field
_ACTOR_DATA_SIZE = sum(
    _ActorInput[field_name].itemsize for field_name in ('main', 'faulty', 'gpr', 'simd'))

# ==================================================================================================
# Full input data
# ==================================================================================================
# Type alias: numpy array of 64-bit unsigned integers with any number of dimensions
UINT_NDARRAY = np.ndarray[Tuple[int, ...], np.dtype[np.uint64]]


class InputData(UINT_NDARRAY):
    """
    A single data input for a test case program.
    The executor and the model use this data to initialize the sandbox memory and registers.
    An input is typically produced by the input generator or parsed from a binary file.

    Internally, this class is a fixed-size numpy.ndarray with a few additional
    convenience methods.

    The array is a 1D array of _ActorInput structures, one per actor of the test case program,
    sorted by actor ID. Each _ActorInput structure holds the input data of a single actor,
    and its layout mirrors the layout of the initializable data regions
    of sandbox.py:SandboxLayout.
    Namely, the array is organized as follows:

    |-----|-------------------------------| main
    | A   | sizeof(DataArea.MAIN)         |
    | C   |-------------------------------| faulty
    | T   | sizeof(DataArea.FAULTY)       |
    | O   |-------------------------------| gpr
    | R   | sizeof(DataArea.GPR)          |
    |     |-------------------------------| simd
    | 0   | sizeof(DataArea.SIMD)         |
    |     |-------------------------------| padding
    |     | sizeof(DataArea.OVERFLOW_PAD) |
    |-----|-------------------------------|
    | ... (repeat for n_actors)

    The data of each region can be accessed via the array interface, e.g.,
    actor0_main = Input[0]['main']

    The array contains one _ActorInput structure per actor; viewed as 64-bit integers,
    its size is
        n_actors * (_ActorInput.itemsize // 8)
    """

    seed: int = 0
    """ seed: The seed value used to generate this input """

    # ==============================================================================================
    # Constructors

    def __new__(cls, n_actors: int = 1) -> InputData:
        # The array contents are NOT initialized here; the caller is expected to fill them
        return super().__new__(cls, (n_actors,), _ActorInput, None, 0, None, None)

    def __array_finalize__(self, obj: Optional[UINT_NDARRAY]) -> None:  # type: ignore
        """ Intentionally a no-op: nothing is copied from `obj` into the new array object """

    # ==============================================================================================
    # Class interface

    @classmethod
    def data_size_per_actor(cls) -> int:
        """
        Get the size of the data area of a single actor (the padding is not counted).
        :return: Size, in bytes
        """
        size_in_bytes = _ACTOR_DATA_SIZE
        return size_in_bytes

    @classmethod
    def n_data_entries_per_actor(cls) -> int:
        """
        Get the number of 64-bit entries in the data area of a single actor.

        Note: This is NOT the same value as returned by `data_size_per_actor`,
        because that method counts bytes while this one counts 8-byte array entries.
        :return: Number of entries
        """
        bytes_per_entry = 8
        return _ACTOR_DATA_SIZE // bytes_per_entry

    # ==============================================================================================
    # Object interface

    def __hash__(self) -> int:  # type: ignore
        # the hash covers the complete contents of the array (all regions of all actors)
        raw_contents = self.tobytes()
        return hash(raw_contents)

    def __str__(self) -> str:
        seed = self.seed
        return str(seed)

    def __repr__(self) -> str:
        seed = self.seed
        return str(seed)

    def set_actor_data(self, actor_id: 'ActorID', data: UINT_NDARRAY) -> None:
        """
        Overwrite the input of a single actor.
        :param actor_id: The actor ID
        :param data: 1D array with the new data; its length must be equal to the number
                     of 64-bit words in one _ActorInput structure
        :return: None
        :raises AssertionError: If the data array has an unexpected shape
        """
        expected_shape = (self.itemsize // 8,)
        assert data.shape == expected_shape, \
            "Data shape does not match the expected shape"

        # reinterpret the flat array as an _ActorInput structure and copy it in
        self[actor_id] = data.view(_ActorInput)

        # the padding is not a part of the input, so it is always zeroed
        self[actor_id]['padding'] = 0

    def save(self, path: str) -> None:
        """
        Write the raw bytes of the input into a binary file.
        :param path: The path to the file
        """
        with open(path, 'wb') as out_file:
            out_file.write(self.tobytes())

    def load(self, path: str) -> None:
        """
        Fill the input with the contents of a binary file.
        The file is read as a flat sequence of 64-bit integers, which is then split
        into consecutive per-actor chunks.
        :param path: The path to the file
        """
        words_per_actor = self.itemsize // 8
        with open(path, 'rb') as in_file:
            contents = np.fromfile(in_file, dtype=np.uint64)

        for actor_id in range(self.shape[0]):
            first = actor_id * words_per_actor
            last = first + words_per_actor
            self.linear_view(actor_id)[:] = contents[first:last]

    def linear_view(self, actor_id: ActorID) -> UINT_NDARRAY:
        """
        Get the input of a single actor as a flat array,
        that is, as a 1D array of 64-bit integers.
        :param actor_id: The actor ID
        :return: A linear view of the input for the actor
        """
        actor_record = self[actor_id]
        n_words = actor_record.itemsize // 8
        view: UINT_NDARRAY = actor_record.view((np.uint64, n_words))
        return view


def save_input_sequence_as_rdbf(inputs: List[InputData], path: str) -> None:
    """
    Write a sequence of inputs into a file in the RDBF format
    (see docs/devel/binary-formats.md for details on RDBF format).

    The file consists of a header (number of actors, number of inputs), followed by
    one metadata entry per actor (data size and a reserved zero field), followed by
    the raw bytes of every input. All header and metadata fields are 8-byte
    little-endian integers.

    :param inputs: The input sequence; if empty, the number of actors is recorded as 1
    :param path: The path to save the RDBF file to
    :return: None
    """

    def as_u64(value: int) -> bytes:
        """ Encode an integer as 8 little-endian bytes """
        return value.to_bytes(8, byteorder='little')

    n_actors = len(inputs[0]) if inputs else 1
    with open(path, 'wb') as out_file:
        # header: number of actors, number of inputs
        out_file.write(as_u64(n_actors))
        out_file.write(as_u64(len(inputs)))

        # metadata: per-actor data size + reserved field
        actor_data_size = InputData.data_size_per_actor()
        for _ in range(n_actors):
            out_file.write(as_u64(actor_data_size))
            out_file.write(as_u64(0))

        # data: raw contents of every input, in sequence order
        for input_ in inputs:
            out_file.write(input_.tobytes())


# ==================================================================================================
# Input taint
# ==================================================================================================

# Type alias: one-dimensional numpy array of booleans
BOOL_NDARRAY = np.ndarray[Tuple[int], np.dtype[np.bool_]]

# _ActorInputTaint mirrors _ActorInput field by field:
# every 64-bit entry of _ActorInput has one boolean entry here
_ActorInputTaint = np.dtype(
    [
        (field_name, np.bool_, _ActorInput[field_name].shape[0])
        for field_name in ('main', 'faulty', 'gpr', 'simd', 'padding')
    ],
    align=False,
)


class InputTaint(BOOL_NDARRAY):
    """
    Boolean array of a fixed size that stores the taint status of one test case input.
    Its layout mirrors the layout of the Input class and it has the same number of elements.
    An element set to True marks the corresponding element of the Input array as tainted.

    The array is used to indicate which input elements influence contract traces.
    """

    per_actor_taint_size: int = _ActorInputTaint.itemsize
    """ per_actor_taint_size: The size of the taint area for a single actor """

    def __new__(cls, n_actors: int = 1) -> InputTaint:
        taint = super().__new__(cls, (n_actors,), _ActorInputTaint, None, 0, None, None)
        # a fresh taint starts with nothing tainted
        taint.fill(False)
        return taint

    def __array_finalize__(self, obj: Optional[UINT_NDARRAY]) -> None:  # type: ignore
        """ Intentionally a no-op: the class carries no extra per-instance state """

    def linear_view(self, actor_id: 'ActorID') -> BOOL_NDARRAY:
        """
        Expose the taint of a single actor as a flat, one-dimensional array of booleans.
        :param actor_id: The actor ID
        :return: A linear view of the taint for the actor
        """
        actor_record = self[actor_id]
        flat: BOOL_NDARRAY = actor_record.view((np.bool_, actor_record.itemsize))
        return flat

    def full_linear_view(self) -> np.ndarray[Tuple[int, ...], np.dtype[np.bool_]]:
        """
        Expose the taint of all actors as a single one-dimensional array of booleans.
        :return: A linear view of the taint for all actors
        """
        return self.view(np.bool_)

    def taint_actor_offsets(self, actor_id: 'ActorID', offsets: List[int]) -> None:
        """
        Mark a list of locations in the input of a single actor as tainted. The locations are
        given as offsets in the _ActorInput structure.
        :param actor_id: The actor ID
        :param offsets: A list of offsets
        :return: None
        """
        taint = self.linear_view(actor_id)
        for location in offsets:
            taint[location] = True

    @classmethod
    def taint_offset_from_sandbox_address(cls, sb_address: int) -> int:
        """
        Bridge the mismatch between the sandbox layout (sandbox.py) and the InputTaint layout
        (this class).

        The offset in the InputTaint structure is computed from the sandbox address by
        subtracting the padding that is missing from the taint layout.

        :param sb_address: The sandbox address
        :return: The offset in the InputTaint structure
        """
        actor_id, offset_in_actor = divmod(sb_address, SandboxLayout.data_size_per_actor())
        offset_in_taint = offset_in_actor - SandboxLayout.data_area_size(DataArea.MAIN)
        return offset_in_taint // 8 + (actor_id * cls.per_actor_taint_size)


================================================
FILE: rvzr/traces.py
================================================
"""
File: Classes representing contract and hardware traces as well as derived containers thereof.

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from __future__ import annotations
from collections import Counter

from typing import List, Optional, Final, NamedTuple, Tuple, Dict, Generator, Callable, Literal
from typing_extensions import assert_never

import xxhash
import numpy as np
import numpy.typing as npt

from .tc_components.test_case_data import InputData, InputID
from .tc_components.test_case_code import TestCaseProgram
from .config import CONF

# Register names used when printing register values of traces; the key is the position of the
# value in the trace. One table per instruction set (selected via CONF.instruction_set).
_REG_ID_TO_NAME_X86 = {0: "rax", 1: "rbx", 2: "rcx", 3: "rdx", 4: "rsi", 5: "rdi"}
_REG_ID_TO_NAME_ARM = {0: "x0", 1: "x1", 2: "x2", 3: "x3", 4: "x4", 5: "x5"}

# ==================================================================================================
# Contract Trace
# ==================================================================================================
# Closed set of tags that a contract trace entry can carry (see CTrace.full_str for how each
# tag is printed)
CTraceEntryType = Literal["mem", "pc", "val", "reg", "ind"]


class CTraceEntry(NamedTuple):
    """
    Named tuple that represents a single entry in a contract trace:
    a type tag paired with the integer value of the entry.
    """
    # tag describing what the value represents
    type_: CTraceEntryType
    # the recorded value itself
    value: int


# Contract trace stripped of type tags: only the integer values of the entries
UntypedCTrace = List[int]


class CTrace:
    """
    Class representing a contract trace. It wraps a list of typed entries collected from the
    model, keeps an untyped (integers only) copy of it, and provides comparison and hashing
    interfaces so that traces can be compared for equality and stored in sets or dictionaries.
    All comparisons are performed on the hash of the untyped trace.
    """
    _trace: Final[List[CTraceEntry]]
    _untyped: Final[UntypedCTrace]
    _hash: Final[int]

    _printed_as_l1d_map: bool = False
    """ Flag indicating that the trace should be printed as an L1D map """

    # ==============================================================================================
    # Constructors

    @classmethod
    def empty_trace(cls) -> CTrace:
        """ Produce a dummy CTrace object with empty raw trace """
        return cls([])

    def __init__(self, trace: List[CTraceEntry]) -> None:
        values = [entry.value for entry in trace]
        self._trace = trace
        self._untyped = values
        # the hash covers only the values; the type tags do not contribute to it
        self._hash = xxhash.xxh64(str(values), seed=0).intdigest()

    # ==============================================================================================
    # Printers

    def __str__(self) -> str:
        if self._printed_as_l1d_map:
            # Printing as L1D map was requested: render the trace as a 64-bit bit mask
            # representing the cache state (one position per cache set)
            bitmap = 0
            for address in self._untyped:
                set_index = (address & 0b111111000000) >> 6
                bitmap |= 0x8000000000000000 >> set_index
            return f"{bitmap:064b}".replace("0", ".").replace("1", "^")

        # In all other cases, the hash value alone is printed
        return str(self._hash)

    def full_str(self,
                 m_col: str = "",
                 pc_col: str = "",
                 val_col: str = "",
                 reset_col: str = "") -> str:
        """
        Return a string representation of the complete typed trace.
        Optionally, the colors can be specified for memory addresses, program counters, and values.

        Example output: [mem: 0x100, pc: 0x200, val: 0x300]

        :param m_col: color for memory addresses entries
        :param pc_col: color for program counters entries
        :param val_col: color for values entries
        :param reset_col: color reset string
        :return: colorized string representation of the trace
        """
        assert reset_col or not (m_col or pc_col or val_col), \
            "If any color is set, reset_col must be set as well"

        reg_names = _REG_ID_TO_NAME_X86 if CONF.instruction_set == "x86-64" else _REG_ID_TO_NAME_ARM
        rendered: List[str] = []
        for position, entry in enumerate(self._trace):
            hex_value = hex(entry.value)
            if entry.type_ == "mem":
                rendered.append("mem: " + m_col + hex_value + reset_col)
            elif entry.type_ == "pc":
                rendered.append("pc: " + pc_col + hex_value + reset_col)
            elif entry.type_ == "ind":
                rendered.append("indcall: " + pc_col + hex_value + reset_col)
            elif entry.type_ == "val":
                rendered.append("val: " + val_col + hex_value + reset_col)
            elif entry.type_ == "reg":
                # the register name is selected by the position of the entry in the trace
                rendered.append(reg_names[position] + ": " + hex_value + reset_col)
            else:
                assert_never(entry.type_)
        return "[" + ", ".join(rendered) + "]"

    # ==============================================================================================
    # Public Methods

    def __eq__(self, other: object) -> bool:
        if isinstance(other, CTrace):
            return self._hash == other._hash
        raise NotImplementedError("Cannot compare CTrace with non-CTrace object")

    def __lt__(self, other: CTrace) -> bool:
        return self._hash < other._hash

    def __gt__(self, other: CTrace) -> bool:
        return self._hash > other._hash

    def __len__(self) -> int:
        return len(self._untyped)

    def __hash__(self) -> int:
        return self._hash

    def is_empty(self) -> bool:
        """ Check if the trace was created from an empty list or via `empty_trace()` """
        return len(self) == 0

    def get_untyped(self) -> UntypedCTrace:
        """
        Get a raw trace containing only integers values of the CTrace without type information
        """
        return self._untyped

    def get_typed(self) -> List[CTraceEntry]:
        """ Get the full trace used to construct the CTrace object """
        return self._trace

    def set_printed_as_l1d(self, val: bool = True) -> None:
        """
        Set the flag indicating that the trace should be printed as L1D map.
        This is normally used only for debugging purposes.
        :param val: flag value
        :return: None
        """
        self._printed_as_l1d_map = val


# ==================================================================================================
# Hardware Trace
# ==================================================================================================
# Closed set of hardware trace kinds; the kind selects how an HTrace is printed
HTraceType = Literal["cache", "tsc", "reg"]

# Layout of a single hardware trace sample: the trace value followed by five additional
# readings (named pfc0..pfc4), all stored as unsigned 64-bit integers
RawHTraceSample = np.dtype([
    ("trace", np.uint64),
    ("pfc0", np.uint64),
    ("pfc1", np.uint64),
    ("pfc2", np.uint64),
    ("pfc3", np.uint64),
    ("pfc4", np.uint64),
])
# Array of samples (structured numpy array)
ArrayOfSamples = npt.NDArray[np.void]
# Values of the five pfc fields of one sample
PFCTuple = Tuple[int, int, int, int, int]


class HTrace:
    """
    Class representing a sequence of hardware trace samples. The samples are normally received from
    the executor: It executes a test case program with a given input multiple times, and each
    execution produces a single hardware trace and a set of readings from performance counters.
    The results of such repeated executions are collected into a single HTrace object.

    Equality and hashing are based on a hash of the 'trace' field of the samples only;
    performance counter readings do not take part in comparisons.
    """
    # all samples, as passed to the constructor
    _raw: Final[ArrayOfSamples]
    # hash of the 'trace' field of the samples
    _hash: Final[int]
    # True if every 'trace' value is zero (this includes the case of no samples at all)
    _is_corrupted_or_ignored: Final[bool]
    # lazily computed result of get_max_pfc()
    _max_pfc: Optional[PFCTuple] = None
    # kind of the trace; selects the printing format
    type_: Final[HTraceType]

    # ==============================================================================================
    # Constructors

    @classmethod
    def empty_trace(cls, type_: HTraceType = "cache") -> HTrace:
        """ Get a dummy HTrace object that contains no samples """
        return cls(np.ndarray(0, dtype=RawHTraceSample), type_)

    @classmethod
    def invalid_trace(cls, type_: HTraceType = "cache") -> HTrace:
        """ Get a dummy HTrace object with corrupted hardware trace and zeros for perf counters """
        invalid_sample: npt.NDArray[np.void] = np.zeros(1, dtype=RawHTraceSample)
        return cls(invalid_sample, type_)

    def __init__(self, htrace_samples: ArrayOfSamples, type_: HTraceType = "cache") -> None:
        """
        :param htrace_samples: 1D array of samples with dtype RawHTraceSample
        :param type_: kind of the trace; selects the printing format
        """
        # check that the input has the expected shape
        assert htrace_samples.ndim == 1, "htrace_samples must be a 1D array"
        assert htrace_samples.dtype == RawHTraceSample, "htrace_samples must be of type RawHTrace"

        # store and process the samples
        self._raw = htrace_samples
        # NOTE(review): the hash is taken over str() of the array, and numpy abbreviates the
        # string form of large arrays - confirm that sample counts stay below that threshold
        self._hash = xxhash.xxh64(str(htrace_samples['trace']), seed=0).intdigest()
        self._is_corrupted_or_ignored = all(x == 0 for x in htrace_samples['trace'])
        self.type_ = type_

    # ==============================================================================================
    # Printers

    def __str__(self) -> str:
        return str(self._hash)

    def full_str(self,
                 line_prefix: str = "",
                 region1_col: str = "",
                 region2_col: str = "",
                 reset_col: str = "") -> str:
        """
        Return a string (table) representation of the set of samples used to create this trace

        :param line_prefix: string to prepend to each line
        :param region1_col: color for odd 8-bit groups (used only for cache traces)
        :param region2_col: color for even 8-bit groups (used only for cache traces)
        :param reset_col: color reset string (used only for cache traces)
        :return: string representation of the trace; only the prefix if the trace is empty
        """
        # Nothing to print if the trace is empty
        if self.is_empty():
            return line_prefix
        if self.type_ == "cache":
            return self._full_cache_str(line_prefix, region1_col, region2_col, reset_col)
        if self.type_ == "tsc":
            return self._full_tsc_str(line_prefix)
        if self.type_ == "reg":
            return self._full_arch_str(line_prefix)

        assert_never(self.type_)
        return ""  # pylint: disable=unreachable

    def _full_arch_str(self, line_prefix: str) -> str:
        """ Return a string representation of an architectural trace.
        The six fields of the (single) sample are printed as six register values.
        Example output:
        [rax:0x00000000000001, rbx:0x00000000000002, rcx:0x00000000000003, rdx:0x00000000000004,
        rsi:0x00000000000005, rdi:0x00000000000006]
        """
        assert len(self._raw) == 1, "Invalid trace shape"
        s = line_prefix
        reg_names = _REG_ID_TO_NAME_X86 if CONF.instruction_set == "x86-64" else _REG_ID_TO_NAME_ARM
        s += "["
        s += f"{reg_names[0]}: 0x{self._raw[0]['trace']:x}, "
        s += f"{reg_names[1]}: 0x{self._raw[0]['pfc0']:x}, "
        s += f"{reg_names[2]}: 0x{self._raw[0]['pfc1']:x}, "
        s += f"{reg_names[3]}: 0x{self._raw[0]['pfc2']:x}, "
        s += f"{reg_names[4]}: 0x{self._raw[0]['pfc3']:x}, "
        s += f"{reg_names[5]}: 0x{self._raw[0]['pfc4']:x}"
        s += "]"
        return s

    def _full_tsc_str(self, line_prefix: str) -> str:
        """ Return a string representation of a TSC trace.
        Each distinct value is printed once (most frequent first) with its number of occurrences.
        Example output:
        00000001 [16]
        00000002 [16]
        """
        s = ""
        # only the lower 56 bits of the value are printed
        mask = np.uint64(0xFFFFFFFFFFFFFF)
        counter = Counter(self._raw['trace'])
        trace_distribution = sorted(counter.items(), key=lambda x: x[1], reverse=True)
        for t, c in trace_distribution:
            masked = t & mask
            s += f"{line_prefix}{masked:08} [{c}]\n"
        return s

    def _full_cache_str(self, line_prefix: str, r1_col: str, r2_col: str, reset_col: str) -> str:
        """ Return a string representation of a cache trace
        Each distinct value is printed once (most frequent first) as a 64-character bit map,
        followed by its number of occurrences. The colors alternate between 8-bit groups.
        Example output:
            .....^..................^....................................... [16]
            ........................^....................................... [16]
        """
        s = ""
        counter = Counter(self._raw['trace'])
        trace_distribution = sorted(counter.items(), key=lambda x: x[1], reverse=True)
        for t, c in trace_distribution:
            line = f"{t:064b}"
            line = line.replace("0", ".").replace("1", "^")
            line = r1_col + line[0:8] + r2_col + line[8:16] \
                + r1_col + line[16:24] + r2_col + line[24:32] \
                + r1_col + line[32:40] + r2_col + line[40:48] \
                + r1_col + line[48:56] + r2_col + line[56:64] \
                + reset_col + line[64:]
            s += f"{line_prefix}{line} [{c}]\n"
        return s

    def full_pair_str(self,
                      other: HTrace,
                      r1_col: str = "",
                      r2_col: str = "",
                      res_col: str = "") -> str:
        """
        Return a string representation of two sample distributions side-by-side

        :param other: the trace to print next to this one; must be of the same type
        :param r1_col: color for odd 8-bit groups (used only for cache traces)
        :param r2_col: color for even 8-bit groups (used only for cache traces)
        :param res_col: color reset string (used only for cache traces)
        :return: table with one row per distinct trace value
        :raises NotImplementedError: if this trace is an architectural ("reg") trace
        """
        if self.type_ == "cache":
            assert other.type_ == "cache"
            return self._full_cache_pair_str(other, r1_col, r2_col, res_col)
        if self.type_ == "tsc":
            assert other.type_ == "tsc"
            return self._full_tsc_pair_str(other)
        if self.type_ == "reg":
            raise NotImplementedError("Cannot compare architectural traces")

        assert_never(self.type_)
        return ""  # pylint: disable=unreachable

    def _full_tsc_pair_str(self, other: HTrace) -> str:
        """ Return a string representation of two TSC sample distributions side-by-side
        Example output:
        00000001        |16     | 8      |
        00000002        |16     | 24     |
        """
        # only the lower 56 bits of the value are printed
        mask = np.uint64(0xFFFFFFFFFFFFFF)
        c1 = Counter(self.get_raw_traces())
        c2 = Counter(other.get_raw_traces())
        keys = set(c1.keys()) | set(c2.keys())
        # order by the count in this trace first, then by the count in the other trace
        traces = sorted(keys, key=lambda x: (c1[x] << 10000) + c2[x], reverse=True)

        final_str = ""
        for t in traces:
            # The counters are keyed by the raw value, so the masked value must be used for
            # printing only; looking the counts up by the masked value would miss them
            masked = t & mask
            final_str += f"{masked:08} | {c1[t]:<6} | {c2[t]:<6} |\n"
        return final_str

    def _full_cache_pair_str(self, other: HTrace, r1_col: str, r2_col: str, res_col: str) -> str:
        """ Return a string representation of two cache sample distributions side-by-side
        Example output:
        .....^..................^....................................... |16     | 8      |
        .....^.......................................................... |16     | 24     |
        """
        c1 = Counter(self.get_raw_traces())
        c2 = Counter(other.get_raw_traces())
        keys = set(c1.keys()) | set(c2.keys())
        # order by the count in this trace first, then by the count in the other trace
        traces = sorted(keys, key=lambda x: (c1[x] << 10000) + c2[x], reverse=True)

        final_str = ""
        for t in traces:
            s = f"{t:064b}"
            s = s.replace("0", ".").replace("1", "^")
            s = r1_col + s[0:8] + r2_col + s[8:16] \
                + r1_col + s[16:24] + r2_col + s[24:32] \
                + r1_col + s[32:40] + r2_col + s[40:48] \
                + r1_col + s[48:56] + r2_col + s[56:64] \
                + res_col + s[64:]
            final_str += s + f" | {c1[t]:<6} | {c2[t]:<6}|\n"
        return final_str

    # ==============================================================================================
    # Public Methods

    def __eq__(self, other: object) -> bool:
        if not isinstance(other, HTrace):
            raise NotImplementedError("Cannot compare HTrace with non-HTrace object")
        return self._hash == other._hash

    def __len__(self) -> int:
        return len(self._raw)

    def __hash__(self) -> int:
        return self._hash

    def merge(self, other: HTrace) -> HTrace:
        """
        Merge two HTrace objects into a single HTrace object
        :param other: HTrace object to merge with
        :return: A new HTrace object that contains all samples from both objects;
                 it has the type of this object
        """
        samples = np.concatenate([self._raw, other._raw])  # pylint: disable=protected-access
        return HTrace(samples, self.type_)

    def is_empty(self) -> bool:
        """ Check if the trace was created from an empty sample or via `empty_trace()` """
        return len(self) == 0

    def is_corrupted_or_ignored(self) -> bool:
        """
        Check if the trace was created from a corrupted sample.
        A corrupted sample is a sample where all trace values are zero, which is the way the
        executor signals that the trace was not collected properly.
        Note that a trace without any samples is reported as corrupted as well.
        """
        return self._is_corrupted_or_ignored

    def get_raw_readings(self) -> ArrayOfSamples:
        """ Get all raw readings used to construct the HTrace object (including both the trace and
        the performance counters) """
        return self._raw

    def get_raw_traces(self) -> npt.NDArray[np.uint64]:
        """ Get all raw traces in the HTrace object (does NOT include performance counters) """
        return self._raw['trace']

    def sample_size(self) -> int:
        """ Get the number of htrace samples in the HTrace object """
        return len(self._raw)

    def get_max_pfc(self) -> PFCTuple:
        """
        Get the performance counter readings of the sample that has the largest pfc0 value.
        All five values are taken from that one sample (they are not per-counter maximums).
        If no sample has a non-zero pfc0, a tuple of zeros is returned.
        The result is computed on the first call and cached.
        """
        if self._max_pfc is None:
            new_max_pfc = (0, 0, 0, 0, 0)
            for sample in self._raw:
                if sample['pfc0'] > new_max_pfc[0]:
                    new_max_pfc = (int(sample['pfc0']), int(sample['pfc1']), int(sample['pfc2']),
                                   int(sample['pfc3']), int(sample['pfc4']))
            self._max_pfc = new_max_pfc
        return self._max_pfc


# ==================================================================================================
# Trace Containers
# ==================================================================================================
class TraceBundle(NamedTuple):
    """
    Container for a set of measurements produced by executing a test case with a given input on
    the model and on the executor. It contains the input ID, the input itself, the contract
    trace, and the hardware trace.
    """
    # identifier of the input
    input_id: InputID
    # the input data
    input_: InputData
    # contract trace of the input
    ctrace: CTrace
    # hardware trace of the input
    htrace: HTrace


# Signature of a predicate that decides whether two hardware traces are equivalent
HWEquivalenceFunction = Callable[[HTrace, HTrace], bool]


def _default_eq_function(htrace1: HTrace, htrace2: HTrace) -> bool:
    """
    Default equivalence function that compares hardware traces for equality

    :param htrace1: first hardware trace
    :param htrace2: second hardware trace
    :return: result of `htrace1 == htrace2`
    """
    return htrace1 == htrace2


class HardwareEqClass:
    """
    Container for a set of TraceBundles that are hardware-equivalent;
    that is, all TraceBundles in the list have similar hardware trace.
    Note that the notion of similarity is configurable and defined by CONF.analyser
    """

    htrace: Final[HTrace]
    """ hardware trace that all measurements in the equivalence class share """

    measurements: Final[List[TraceBundle]]
    """ a list of TraceBundles that are hardware-equivalent """

    # ==============================================================================================
    # Constructors

    def __init__(self, measurements: List[TraceBundle]) -> None:
        # the hardware trace of the first measurement represents the whole class
        self.htrace = measurements[0].htrace
        self.measurements = measurements

    @classmethod
    def build_hw_classes(
        cls,
        measurements: List[TraceBundle],
        equivalence_function: HWEquivalenceFunction = _default_eq_function
    ) -> List[HardwareEqClass]:
        """
        Partition a list of measurements into hardware equivalence classes.
        :param measurements: a list of measurements
        :param equivalence_function: a function that compares two hardware traces and returns True
                if they are equivalent (i.e., they are similar enough to be considered the same)
        :return: List of hardware classes formed from the input measurements
        """
        # One representative htrace per class found so far; the bundles of a class are
        # stored under the hash of its representative
        representatives: List[HTrace] = []
        bundles_by_hash: Dict[int, List[TraceBundle]] = {}

        for bundle in measurements:
            candidate = bundle.htrace

            # join the first existing class whose representative is equivalent
            for representative in representatives:
                if equivalence_function(candidate, representative):
                    bundles_by_hash[hash(representative)].append(bundle)
                    break
            else:
                # no equivalent class exists (also covers the very first measurement)
                representatives.append(candidate)
                bundles_by_hash[hash(candidate)] = [bundle]

        # Wrap every group into a HardwareEqClass object
        return [cls(group) for group in bundles_by_hash.values()]

    # ==============================================================================================
    # Public Methods

    def __len__(self) -> int:
        return len(self.measurements)

    def __iter__(self) -> Generator[TraceBundle, None, None]:
        for bundle in self.measurements:
            yield bundle

    def __getitem__(self, index: int) -> TraceBundle:
        return self.measurements[index]

    def __eq__(self, other: object) -> bool:
        """
        Compare two hardware equivalence classes for equality.
        Two classes are equal if they have the same hardware trace and the same measurements.
        """
        if isinstance(other, HardwareEqClass):
            return self.htrace == other.htrace and self.measurements == other.measurements
        raise NotImplementedError("Cannot compare HardwareEqClass with object of another type")


class ContractEqClass:
    """
    ContractEqClass is a container for a set of TraceBundles that are contract-equivalent;
    that is, all TraceBundles in the list have the same contract trace.
    """

    ctrace: Final[CTrace]
    """ contract trace that all measurements in the equivalence class share """

    measurements: Final[List[TraceBundle]]
    """ list of TraceBundles that are contract-equivalent """

    _hw_classes: Optional[List[HardwareEqClass]] = None

    # ==============================================================================================
    # Constructors

    def __init__(self, measurements: List[TraceBundle]) -> None:
        # the contract trace of the first measurement represents the whole class
        self.ctrace = measurements[0].ctrace
        self.measurements = measurements

        # check that all measurements have the same contract trace
        assert all(bundle.ctrace == self.ctrace for bundle in measurements), \
            "All measurements must have the same ctrace"

    @classmethod
    def build_contract_classes(cls, measurements: List[TraceBundle]) -> List[ContractEqClass]:
        """
        Partition a list of measurements into contract equivalence classes
        :param measurements: a list of measurements
        :return: List of contract classes formed from the input measurements
        """
        # Group the measurements by the hash of their contract trace
        bundles_by_hash: Dict[int, List[TraceBundle]] = {}
        for bundle in measurements:
            bundles_by_hash.setdefault(hash(bundle.ctrace), []).append(bundle)

        # Wrap every group into a ContractEqClass object
        return [cls(group) for group in bundles_by_hash.values()]

    def __len__(self) -> int:
        return len(self.measurements)

    def set_hw_classes(self, hw_classes: List[HardwareEqClass]) -> None:
        """
        Set the hardware equivalence classes for this contract equivalence class.
        The classes can be set only once.
        :param hw_classes: a list of hardware equivalence classes
        """
        assert self._hw_classes is None, "Attempting to set hardware equivalence classes twice"
        self._hw_classes = hw_classes

    def set_trivial_hw_classes(self) -> None:
        """
        Set the hardware equivalence classes for this contract equivalence class by directly
        comparing hardware traces for equality. The classes can be set only once.
        """
        assert self._hw_classes is None, "Attempting to set hardware equivalence classes twice"
        self._hw_classes = HardwareEqClass.build_hw_classes(self.measurements)

    def get_hw_classes(self) -> List[HardwareEqClass]:
        """
        Get the list of all hardware equivalence classes in the contract equivalence class.
        The classes must have been set beforehand.
        """
        classes = self._hw_classes
        assert classes is not None, "Hardware equivalence classes not set"
        return classes


class Violation(ContractEqClass):
    """
    Violation is a special type of equivalence class that represents a violation of a contract.
    It is a container for a list of measurements (TraceBundle) that triggered the violation
    as well as a complete sequence of inputs that triggered the violation and the test case program.
    """

    input_sequence: List[InputData]
    """ complete sequence of inputs that triggered the violation """

    test_case_code: Final[TestCaseProgram]
    """ test case program that triggered the violation """

    # ==============================================================================================
    # Constructors

    def __init__(self, measurements: List[TraceBundle], input_sequence: List[InputData],
                 test_case_code: TestCaseProgram) -> None:
        """
        :param measurements: measurements that triggered the violation
        :param input_sequence: complete sequence of inputs that triggered the violation
        :param test_case_code: test case program that triggered the violation
        """
        super().__init__(measurements)
        self.input_sequence = input_sequence
        self.test_case_code = test_case_code

    @classmethod
    def from_contract_eq_class(cls, eq_class: ContractEqClass, input_sequence: List[InputData],
                               test_case_code: TestCaseProgram) -> Violation:
        """
        Create a Violation object from a ContractEqClass object.
        The hardware equivalence classes of the ContractEqClass must have been set already.
        :param eq_class: ContractEquivalenceClass object
        :param input_sequence: complete sequence of inputs that triggered the violation
        :param test_case_code: test case program that triggered the violation
        :return: Violation object
        """
        violation = cls(eq_class.measurements, input_sequence, test_case_code)
        violation.set_hw_classes(eq_class.get_hw_classes())
        return violation

    @classmethod
    def pseudo_violation_from_inputs(cls, input_sequence: List[InputData],
                                     test_case_code: TestCaseProgram) -> Violation:
        """
        Create a pseudo-violation object from a list of inputs.

        This interface is used by the variants of the fuzzer that rely on non-standard definition
        of violations (e.g., ArchFuzzer). Such fuzzers may not produce traces, yet they still
        have to return a violation object from the analyser.

        Every input gets a measurement with empty contract and hardware traces, and every
        measurement is placed into a hardware equivalence class of its own.

        :param input_sequence: inputs that triggered the pseudo-violation
        :param test_case_code: test case program that triggered the pseudo-violation
        :return: Violation object
        """
        measurements = []
        hw_classes = []
        for i, input_ in enumerate(input_sequence):
            bundle = TraceBundle(InputID(i), input_, CTrace.empty_trace(), HTrace.empty_trace())
            measurements.append(bundle)
            hw_classes.append(HardwareEqClass([bundle]))
        violation = cls(measurements, input_sequence, test_case_code)
        violation.set_hw_classes(hw_classes)
        return violation

    # ==============================================================================================
    # Public Methods
    def full_str(self, region1_col: str = "", region2_col: str = "", reset_col: str = "") -> str:
        """
        Return a string representation of the violation, including the contract and hardware
        traces of all measurements in the violation

        :param region1_col: color for odd 8-bit groups of hardware traces
        :param region2_col: color for even 8-bit groups of hardware traces
        :param reset_col: color reset string
        :return: multi-line description of the violation
        """
        # pylint: disable=too-many-locals  # justification: the method is clear enough as is

        s = "Violation Details:\n"

        # Four cases to consider:
        hw_classes = self._hw_classes

        # 1. No hardware equivalence classes (set_hw_classes() was never called, or it was
        #    called with an empty list)
        if not hw_classes:
            s += f"  Contract trace: (hash {self.ctrace})\n"
            s += f"    {self.ctrace.full_str()} \n"
            s += "  Hardware traces:\n"
            for measurement in self.measurements:
                s += measurement.htrace.full_str("    ") + "\n"
            return s

        # 2. Only one hardware class in the violation (normally the case for ArchFuzzer)
        if len(hw_classes) == 1:
            s += "  Special Case: Single-input violation\n"
            s += f"  Input ID: {self.measurements[0].input_id}\n"
            s += f"  Contract trace: (hash {self.ctrace})\n"
            s += f"    {self.ctrace.full_str()} \n"
            s += "  Hardware traces:\n"
            s += f"    {hw_classes[0].htrace.full_str()} \n"
            return s

        # 3. If there are two HW classes, print them side by side for improved readability
        if len(hw_classes) == 2:
            inputs1 = [m.input_id for m in hw_classes[0]]
            inputs2 = [m.input_id for m in hw_classes[1]]
            htrace1 = hw_classes[0][0].htrace
            htrace2 = hw_classes[1][0].htrace
            trace_table = htrace1.full_pair_str(htrace2, region1_col, region2_col, reset_col)

            # The table is empty when neither trace has samples (e.g., in a pseudo-violation);
            # there is nothing to align the header to, so fall through to the generic printer
            table_lines = trace_table.splitlines()
            if table_lines:
                line_width = max(len(line) for line in table_lines)
                assert line_width > 19, "Invalid trace table"
                trace_width = line_width - 19

                header = "\n" + "-" * line_width + "\n"
                header += f"{'HTrace':^{trace_width}} | ID:{inputs1[0]:<3} | ID:{inputs2[0]:<3}|\n"
                header += "-" * line_width + "\n"
                s += header + trace_table
                return s

        # 4. Otherwise (more than two HW classes, or no table to print), print each HW class
        #    separately
        for hw_class in hw_classes:
            inputs = [measurement.input_id for measurement in hw_class]
            s += "  Inputs "
            # up to four inputs are listed in full; longer lists are truncated
            s += f"{inputs}\n" if len(inputs) <= 4 else f"{inputs[:4]} (+ {len(inputs) - 4} )\n"
            s += hw_class.htrace.full_str("    ", region1_col, region2_col, reset_col)
        s += "\n"
        return s


================================================
FILE: rvzr/unicorn.pyi
================================================
"""
mypy stub for unicorn
"""
# pylint: disable=missing-docstring, unused-argument
from typing import Optional, Callable, Any, Generator, Tuple


class Uc(object):

    def __init__(self, arch: int, mode: int):
        ...

    def emu_start(self, begin: int, until: int, timeout: int = 0, count: int = 0) -> None:
        ...

    def emu_stop(self) -> None:
        ...

    def reg_read(self, reg_id: int, opt: Optional[int] = None) -> int:
        ...

    def reg_write(self, reg_id: int, value: int) -> None:
        ...

    def msr_read(self, msr_id: int) -> int:
        ...

    def msr_write(self, msr_id: int, value: int) -> None:
        ...

    def mem_read(self, address: int, size: int) -> bytearray:
        ...

    def mem_write(self, address: int, data: bytes) -> None:
        ...

    def mem_map(self, address: int, size: int, perms: int = ...) -> None:
        ...

    def mem_map_ptr(self, address: int, size: int, perms: int, ptr: int) -> None:
        ...

    def mem_unmap(self, address: int, size: int) -> None:
        ...

    def mem_protect(self, address: int, size: int, perms: int = ...) -> None:
        ...

    def query(self, query_mode: int) -> int:
        ...

    def hook_add(self,
                 htype: int,
                 callback: Callable[['Uc', int, int, int, int, Any], None]
                 | Callable[['Uc', int, int, Any], None],
                 user_data: Any = None,
                 begin: int = 1,
                 end: int = 0,
                 arg1: int = 0) -> None:
        ...

    def hook_del(self, h: int) -> None:
        ...

    def context_save(self) -> object:
        ...

    def context_update(self, context: object) -> None:
        ...

    def context_restore(self, context: object) -> None:
        ...

    def mem_regions(self) -> Generator[Tuple[int, int], None, None]:
        ...


class UcError(Exception):
    # Error type raised by the unicorn binding.
    # Upstream derives it from `Exception` (not directly from `BaseException`), so a
    # plain `except Exception` handler also catches it; the stub now reflects that.
    # `errno` holds the integer error code attached to the exception
    # (presumably one of the UC_ERR_* constants -- confirm against the binding).
    errno: int


# Constants
# Module-level names declared for the type checker. Each is typed as a plain `int`
# and carries no value here (this is a stub); they are grouped by name prefix.
# -- UC_API_* / UC_VERSION_*: version numbers
UC_API_MAJOR: int
UC_API_MINOR: int
UC_VERSION_MAJOR: int
UC_VERSION_MINOR: int
UC_VERSION_EXTRA: int
# -- UC_*_SCALE
# NOTE(review): "MILISECOND" (single L) presumably mirrors the upstream spelling --
# verify before renaming, since the stub must match the real module's names.
UC_SECOND_SCALE: int
UC_MILISECOND_SCALE: int
# -- UC_ARCH_*: same type as the `arch` parameter of Uc.__init__
UC_ARCH_ARM: int
UC_ARCH_ARM64: int
UC_ARCH_MIPS: int
UC_ARCH_X86: int
UC_ARCH_PPC: int
UC_ARCH_SPARC: int
UC_ARCH_M68K: int
UC_ARCH_MAX: int
# -- UC_MODE_*: same type as the `mode` parameter of Uc.__init__
UC_MODE_LITTLE_ENDIAN: int
UC_MODE_BIG_ENDIAN: int
UC_MODE_ARM: int
UC_MODE_THUMB: int
UC_MODE_MCLASS: int
UC_MODE_V8: int
UC_MODE_ARM926: int
UC_MODE_ARM946: int
UC_MODE_ARM1176: int
UC_MODE_MICRO: int
UC_MODE_MIPS3: int
UC_MODE_MIPS32R6: int
UC_MODE_MIPS32: int
UC_MODE_MIPS64: int
UC_MODE_16: int
UC_MODE_32: int
UC_MODE_64: int
UC_MODE_PPC32: int
UC_MODE_PPC64: int
UC_MODE_QPX: int
UC_MODE_SPARC32: int
UC_MODE_SPARC64: int
UC_MODE_V9: int
# -- UC_ERR_*: error codes
UC_ERR_OK: int
UC_ERR_NOMEM: int
UC_ERR_ARCH: int
UC_ERR_HANDLE: int
UC_ERR_MODE: int
UC_ERR_VERSION: int
UC_ERR_READ_UNMAPPED: int
UC_ERR_WRITE_UNMAPPED: int
UC_ERR_FETCH_UNMAPPED: int
UC_ERR_HOOK: int
UC_ERR_INSN_INVALID: int
UC_ERR_MAP: int
UC_ERR_WRITE_PROT: int
UC_ERR_READ_PROT: int
UC_ERR_FETCH_PROT: int
UC_ERR_ARG: int
UC_ERR_READ_UNALIGNED: int
UC_ERR_WRITE_UNALIGNED: int
UC_ERR_FETCH_UNALIGNED: int
UC_ERR_HOOK_EXIST: int
UC_ERR_RESOURCE: int
UC_ERR_EXCEPTION: int
# -- UC_MEM_*: memory access kinds
UC_MEM_READ: int
UC_MEM_WRITE: int
UC_MEM_FETCH: int
UC_MEM_READ_UNMAPPED: int
UC_MEM_WRITE_UNMAPPED: int
UC_MEM_FETCH_UNMAPPED: int
UC_MEM_WRITE_PROT: int
UC_MEM_READ_PROT: int
UC_MEM_FETCH_PROT: int
UC_MEM_READ_AFTER: int
# -- UC_HOOK_*: same type as the `htype` parameter of Uc.hook_add
UC_HOOK_INTR: int
UC_HOOK_INSN: int
UC_HOOK_CODE: int
UC_HOOK_BLOCK: int
UC_HOOK_MEM_READ_UNMAPPED: int
UC_HOOK_MEM_WRITE_UNMAPPED: int
UC_HOOK_MEM_FETCH_UNMAPPED: int
UC_HOOK_MEM_READ_PROT: int
UC_HOOK_MEM_WRITE_PROT: int
UC_HOOK_MEM_FETCH_PROT: int
UC_HOOK_MEM_READ: int
UC_HOOK_MEM_WRITE: int
UC_HOOK_MEM_FETCH: int
UC_HOOK_MEM_READ_AFTER: int
UC_HOOK_INSN_INVALID: int
UC_HOOK_MEM_UNMAPPED: int
UC_HOOK_MEM_PROT: int
UC_HOOK_MEM_READ_INVALID: int
UC_HOOK_MEM_WRITE_INVALID: int
UC_HOOK_MEM_FETCH_INVALID: int
UC_HOOK_MEM_INVALID: int
UC_HOOK_MEM_VALID: int
# -- UC_QUERY_*: same type as the `query_mode` parameter of Uc.query
UC_QUERY_MODE: int
UC_QUERY_PAGE_SIZE: int
UC_QUERY_ARCH: int
UC_QUERY_TIMEOUT: int
# -- UC_PROT_*: same type as the `perms` parameter of Uc.mem_map / Uc.mem_protect
UC_PROT_NONE: int
UC_PROT_READ: int
UC_PROT_WRITE: int
UC_PROT_EXEC: int
UC_PROT_ALL: int

# X86 registers
# UC_X86_REG_* names, each declared as a plain `int` -- the same type as the
# `reg_id` parameter of Uc.reg_read / Uc.reg_write. No values are given (stub file).
UC_X86_REG_INVALID: int
# -- legacy-named registers (8/16/32/64-bit names, segment registers, flags, IP)
UC_X86_REG_AH: int
UC_X86_REG_AL: int
UC_X86_REG_AX: int
UC_X86_REG_BH: int
UC_X86_REG_BL: int
UC_X86_REG_BP: int
UC_X86_REG_BPL: int
UC_X86_REG_BX: int
UC_X86_REG_CH: int
UC_X86_REG_CL: int
UC_X86_REG_CS: int
UC_X86_REG_CX: int
UC_X86_REG_DH: int
UC_X86_REG_DI: int
UC_X86_REG_DIL: int
UC_X86_REG_DL: int
UC_X86_REG_DS: int
UC_X86_REG_DX: int
UC_X86_REG_EAX: int
UC_X86_REG_EBP: int
UC_X86_REG_EBX: int
UC_X86_REG_ECX: int
UC_X86_REG_EDI: int
UC_X86_REG_EDX: int
UC_X86_REG_EFLAGS: int
UC_X86_REG_EIP: int
UC_X86_REG_EIZ: int
UC_X86_REG_ES: int
UC_X86_REG_ESI: int
UC_X86_REG_ESP: int
UC_X86_REG_FPSW: int
UC_X86_REG_FS: int
UC_X86_REG_GS: int
UC_X86_REG_IP: int
UC_X86_REG_RAX: int
UC_X86_REG_RBP: int
UC_X86_REG_RBX: int
UC_X86_REG_RCX: int
UC_X86_REG_RDI: int
UC_X86_REG_RDX: int
UC_X86_REG_RIP: int
UC_X86_REG_RIZ: int
UC_X86_REG_RSI: int
UC_X86_REG_RSP: int
UC_X86_REG_SI: int
UC_X86_REG_SIL: int
UC_X86_REG_SP: int
UC_X86_REG_SPL: int
UC_X86_REG_SS: int
# -- CR0..CR15
UC_X86_REG_CR0: int
UC_X86_REG_CR1: int
UC_X86_REG_CR2: int
UC_X86_REG_CR3: int
UC_X86_REG_CR4: int
UC_X86_REG_CR5: int
UC_X86_REG_CR6: int
UC_X86_REG_CR7: int
UC_X86_REG_CR8: int
UC_X86_REG_CR9: int
UC_X86_REG_CR10: int
UC_X86_REG_CR11: int
UC_X86_REG_CR12: int
UC_X86_REG_CR13: int
UC_X86_REG_CR14: int
UC_X86_REG_CR15: int
# -- DR0..DR15
UC_X86_REG_DR0: int
UC_X86_REG_DR1: int
UC_X86_REG_DR2: int
UC_X86_REG_DR3: int
UC_X86_REG_DR4: int
UC_X86_REG_DR5: int
UC_X86_REG_DR6: int
UC_X86_REG_DR7: int
UC_X86_REG_DR8: int
UC_X86_REG_DR9: int
UC_X86_REG_DR10: int
UC_X86_REG_DR11: int
UC_X86_REG_DR12: int
UC_X86_REG_DR13: int
UC_X86_REG_DR14: int
UC_X86_REG_DR15: int
# -- FP0..FP7
UC_X86_REG_FP0: int
UC_X86_REG_FP1: int
UC_X86_REG_FP2: int
UC_X86_REG_FP3: int
UC_X86_REG_FP4: int
UC_X86_REG_FP5: int
UC_X86_REG_FP6: int
UC_X86_REG_FP7: int
# -- K0..K7
UC_X86_REG_K0: int
UC_X86_REG_K1: int
UC_X86_REG_K2: int
UC_X86_REG_K3: int
UC_X86_REG_K4: int
UC_X86_REG_K5: int
UC_X86_REG_K6: int
UC_X86_REG_K7: int
# -- MM0..MM7
UC_X86_REG_MM0: int
UC_X86_REG_MM1: int
UC_X86_REG_MM2: int
UC_X86_REG_MM3: int
UC_X86_REG_MM4: int
UC_X86_REG_MM5: int
UC_X86_REG_MM6: int
UC_X86_REG_MM7: int
# -- R8..R15
UC_X86_REG_R8: int
UC_X86_REG_R9: int
UC_X86_REG_R10: int
UC_X86_REG_R11: int
UC_X86_REG_R12: int
UC_X86_REG_R13: int
UC_X86_REG_R14: int
UC_X86_REG_R15: int
# -- ST0..ST7
UC_X86_REG_ST0: int
UC_X86_REG_ST1: int
UC_X86_REG_ST2: int
UC_X86_REG_ST3: int
UC_X86_REG_ST4: int
UC_X86_REG_ST5: int
UC_X86_REG_ST6: int
UC_X86_REG_ST7: int
# -- XMM0..XMM31
UC_X86_REG_XMM0: int
UC_X86_REG_XMM1: int
UC_X86_REG_XMM2: int
UC_X86_REG_XMM3: int
UC_X86_REG_XMM4: int
UC_X86_REG_XMM5: int
UC_X86_REG_XMM6: int
UC_X86_REG_XMM7: int
UC_X86_REG_XMM8: int
UC_X86_REG_XMM9: int
UC_X86_REG_XMM10: int
UC_X86_REG_XMM11: int
UC_X86_REG_XMM12: int
UC_X86_REG_XMM13: int
UC_X86_REG_XMM14: int
UC_X86_REG_XMM15: int
UC_X86_REG_XMM16: int
UC_X86_REG_XMM17: int
UC_X86_REG_XMM18: int
UC_X86_REG_XMM19: int
UC_X86_REG_XMM20: int
UC_X86_REG_XMM21: int
UC_X86_REG_XMM22: int
UC_X86_REG_XMM23: int
UC_X86_REG_XMM24: int
UC_X86_REG_XMM25: int
UC_X86_REG_XMM26: int
UC_X86_REG_XMM27: int
UC_X86_REG_XMM28: int
UC_X86_REG_XMM29: int
UC_X86_REG_XMM30: int
UC_X86_REG_XMM31: int
# -- YMM0..YMM31
UC_X86_REG_YMM0: int
UC_X86_REG_YMM1: int
UC_X86_REG_YMM2: int
UC_X86_REG_YMM3: int
UC_X86_REG_YMM4: int
UC_X86_REG_YMM5: int
UC_X86_REG_YMM6: int
UC_X86_REG_YMM7: int
UC_X86_REG_YMM8: int
UC_X86_REG_YMM9: int
UC_X86_REG_YMM10: int
UC_X86_REG_YMM11: int
UC_X86_REG_YMM12: int
UC_X86_REG_YMM13: int
UC_X86_REG_YMM14: int
UC_X86_REG_YMM15: int
UC_X86_REG_YMM16: int
UC_X86_REG_YMM17: int
UC_X86_REG_YMM18: int
UC_X86_REG_YMM19: int
UC_X86_REG_YMM20: int
UC_X86_REG_YMM21: int
UC_X86_REG_YMM22: int
UC_X86_REG_YMM23: int
UC_X86_REG_YMM24: int
UC_X86_REG_YMM25: int
UC_X86_REG_YMM26: int
UC_X86_REG_YMM27: int
UC_X86_REG_YMM28: int
UC_X86_REG_YMM29: int
UC_X86_REG_YMM30: int
UC_X86_REG_YMM31: int
# -- ZMM0..ZMM31
UC_X86_REG_ZMM0: int
UC_X86_REG_ZMM1: int
UC_X86_REG_ZMM2: int
UC_X86_REG_ZMM3: int
UC_X86_REG_ZMM4: int
UC_X86_REG_ZMM5: int
UC_X86_REG_ZMM6: int
UC_X86_REG_ZMM7: int
UC_X86_REG_ZMM8: int
UC_X86_REG_ZMM9: int
UC_X86_REG_ZMM10: int
UC_X86_REG_ZMM11: int
UC_X86_REG_ZMM12: int
UC_X86_REG_ZMM13: int
UC_X86_REG_ZMM14: int
UC_X86_REG_ZMM15: int
UC_X86_REG_ZMM16: int
UC_X86_REG_ZMM17: int
UC_X86_REG_ZMM18: int
UC_X86_REG_ZMM19: int
UC_X86_REG_ZMM20: int
UC_X86_REG_ZMM21: int
UC_X86_REG_ZMM22: int
UC_X86_REG_ZMM23: int
UC_X86_REG_ZMM24: int
UC_X86_REG_ZMM25: int
UC_X86_REG_ZMM26: int
UC_X86_REG_ZMM27: int
UC_X86_REG_ZMM28: int
UC_X86_REG_ZMM29: int
UC_X86_REG_ZMM30: int
UC_X86_REG_ZMM31: int
# -- R8..R15 with B / D / W suffixes
UC_X86_REG_R8B: int
UC_X86_REG_R9B: int
UC_X86_REG_R10B: int
UC_X86_REG_R11B: int
UC_X86_REG_R12B: int
UC_X86_REG_R13B: int
UC_X86_REG_R14B: int
UC_X86_REG_R15B: int
UC_X86_REG_R8D: int
UC_X86_REG_R9D: int
UC_X86_REG_R10D: int
UC_X86_REG_R11D: int
UC_X86_REG_R12D: int
UC_X86_REG_R13D: int
UC_X86_REG_R14D: int
UC_X86_REG_R15D: int
UC_X86_REG_R8W: int
UC_X86_REG_R9W: int
UC_X86_REG_R10W: int
UC_X86_REG_R11W: int
UC_X86_REG_R12W: int
UC_X86_REG_R13W: int
UC_X86_REG_R14W: int
UC_X86_REG_R15W: int
# -- remaining register ids; UC_X86_REG_ENDING is the last name in the list
UC_X86_REG_IDTR: int
UC_X86_REG_GDTR: int
UC_X86_REG_LDTR: int
UC_X86_REG_TR: int
UC_X86_REG_FPCW: int
UC_X86_REG_FPTAG: int
UC_X86_REG_MSR: int
UC_X86_REG_MXCSR: int
UC_X86_REG_FS_BASE: int
UC_X86_REG_GS_BASE: int
UC_X86_REG_ENDING: int

# X86 instructions

UC_X86_INS_INVALID: int
UC_X86_INS_AAA: int
UC_X86_INS_AAD: int
UC_X86_INS_AAM: int
UC_X86_INS_AAS: int
UC_X86_INS_FABS: int
UC_X86_INS_ADC: int
UC_X86_INS_ADCX: int
UC_X86_INS_ADD: int
UC_X86_INS_ADDPD: int
UC_X86_INS_ADDPS: int
UC_X86_INS_ADDSD: int
UC_X86_INS_ADDSS: int
UC_X86_INS_ADDSUBPD: int
UC_X86_INS_ADDSUBPS: int
UC_X86_INS_FADD: int
UC_X86_INS_FIADD: int
UC_X86_INS_FADDP: int
UC_X86_INS_ADOX: int
UC_X86_INS_AESDECLAST: int
UC_X86_INS_AESDEC: int
UC_X86_INS_AESENCLAST: int
UC_X86_INS_AESENC: int
UC_X86_INS_AESIMC: int
UC_X86_INS_AESKEYGENASSIST: int
UC_X86_INS_AND: int
UC_X86_INS_ANDN: int
UC_X86_INS_ANDNPD: int
UC_X86_INS_ANDNPS: int
UC_X86_INS_ANDPD: int
UC_X86_INS_ANDPS: int
UC_X86_INS_ARPL: int
UC_X86_INS_BEXTR: int
UC_X86_INS_BLCFILL: int
UC_X86_INS_BLCI: int
UC_X86_INS_BLCIC: int
UC_X86_INS_BLCMSK: int
UC_X86_INS_BLCS: int
UC_X86_INS_BLENDPD: int
UC_X86_INS_BLENDPS: int
UC_X86_INS_BLENDVPD: int
UC_X86_INS_BLENDVPS: int
UC_X86_INS_BLSFILL: int
UC_X86_INS_BLSI: int
UC_X86_INS_BLSIC: int
UC_X86_INS_BLSMSK: int
UC_X86_INS_BLSR: int
UC_X86_INS_BOUND: int
UC_X86_INS_BSF: int
UC_X86_INS_BSR: int
UC_X86_INS_BSWAP: int
UC_X86_INS_BT: int
UC_X86_INS_BTC: int
UC_X86_INS_BTR: int
UC_X86_INS_BTS: int
UC_X86_INS_BZHI: int
UC_X86_INS_CALL: int
UC_X86_INS_CBW: int
UC_X86_INS_CDQ: int
UC_X86_INS_CDQE: int
UC_X86_INS_FCHS: int
UC_X86_INS_CLAC: int
UC_X86_INS_CLC: int
UC_X86_INS_CLD: int
UC_X86_INS_CLFLUSH: int
UC_X86_INS_CLFLUSHOPT: int
UC_X86_INS_CLGI: int
UC_X86_INS_CLI: int
UC_X86_INS_CLTS: int
UC_X86_INS_CLWB: int
UC_X86_INS_CMC: int
UC_X86_INS_CMOVA: int
UC_X86_INS_CMOVAE: int
UC_X86_INS_CMOVB: int
UC_X86_INS_CMOVBE: int
UC_X86_INS_FCMOVBE: int
UC_X86_INS_FCMOVB: int
UC_X86_INS_CMOVE: int
UC_X86_INS_FCMOVE: int
UC_X86_INS_CMOVG: int
UC_X86_INS_CMOVGE: int
UC_X86_INS_CMOVL: int
UC_X86_INS_CMOVLE: int
UC_X86_INS_FCMOVNBE: int
UC_X86_INS_FCMOVNB: int
UC_X86_INS_CMOVNE: int
UC_X86_INS_FCMOVNE: int
UC_X86_INS_CMOVNO: int
UC_X86_INS_CMOVNP: int
UC_X86_INS_FCMOVNU: int
UC_X86_INS_CMOVNS: int
UC_X86_INS_CMOVO: int
UC_X86_INS_CMOVP: int
UC_X86_INS_FCMOVU: int
UC_X86_INS_CMOVS: int
UC_X86_INS_CMP: int
UC_X86_INS_CMPPD: int
UC_X86_INS_CMPPS: int
UC_X86_INS_CMPSB: int
UC_X86_INS_CMPSD: int
UC_X86_INS_CMPSQ: int
UC_X86_INS_CMPSS: int
UC_X86_INS_CMPSW: int
UC_X86_INS_CMPXCHG16B: int
UC_X86_INS_CMPXCHG: int
UC_X86_INS_CMPXCHG8B: int
UC_X86_INS_COMISD: int
UC_X86_INS_COMISS: int
UC_X86_INS_FCOMP: int
UC_X86_INS_FCOMPI: int
UC_X86_INS_FCOMI: int
UC_X86_INS_FCOM: int
UC_X86_INS_FCOS: int
UC_X86_INS_CPUID: int
UC_X86_INS_CQO: int
UC_X86_INS_CRC32: int
UC_X86_INS_CVTDQ2PD: int
UC_X86_INS_CVTDQ2PS: int
UC_X86_INS_CVTPD2DQ: int
UC_X86_INS_CVTPD2PS: int
UC_X86_INS_CVTPS2DQ: int
UC_X86_INS_CVTPS2PD: int
UC_X86_INS_CVTSD2SI: int
UC_X86_INS_CVTSD2SS: int
UC_X86_INS_CVTSI2SD: int
UC_X86_INS_CVTSI2SS: int
UC_X86_INS_CVTSS2SD: int
UC_X86_INS_CVTSS2SI: int
UC_X86_INS_CVTTPD2DQ: int
UC_X86_INS_CVTTPS2DQ: int
UC_X86_INS_CVTTSD2SI: int
UC_X86_INS_CVTTSS2SI: int
UC_X86_INS_CWD: int
UC_X86_INS_CWDE: int
UC_X86_INS_DAA: int
UC_X86_INS_DAS: int
UC_X86_INS_DATA16: int
UC_X86_INS_DEC: int
UC_X86_INS_DIV: int
UC_X86_INS_DIVPD: int
UC_X86_INS_DIVPS: int
UC_X86_INS_FDIVR: int
UC_X86_INS_FIDIVR: int
UC_X86_INS_FDIVRP: int
UC_X86_INS_DIVSD: int
UC_X86_INS_DIVSS: int
UC_X86_INS_FDIV: int
UC_X86_INS_FIDIV: int
UC_X86_INS_FDIVP: int
UC_X86_INS_DPPD: int
UC_X86_INS_DPPS: int
UC_X86_INS_RET: int
UC_X86_INS_ENCLS: int
UC_X86_INS_ENCLU: int
UC_X86_INS_ENTER: int
UC_X86_INS_EXTRACTPS: int
UC_X86_INS_EXTRQ: int
UC_X86_INS_F2XM1: int
UC_X86_INS_LCALL: int
UC_X86_INS_LJMP: int
UC_X86_INS_FBLD: int
UC_X86_INS_FBSTP: int
UC_X86_INS_FCOMPP: int
UC_X86_INS_FDECSTP: int
UC_X86_INS_FEMMS: int
UC_X86_INS_FFREE: int
UC_X86_INS_FICOM: int
UC_X86_INS_FICOMP: int
UC_X86_INS_FINCSTP: int
UC_X86_INS_FLDCW: int
UC_X86_INS_FLDENV: int
UC_X86_INS_FLDL2E: int
UC_X86_INS_FLDL2T: int
UC_X86_INS_FLDLG2: int
UC_X86_INS_FLDLN2: int
UC_X86_INS_FLDPI: int
UC_X86_INS_FNCLEX: int
UC_X86_INS_FNINIT: int
UC_X86_INS_FNOP: int
UC_X86_INS_FNSTCW: int
UC_X86_INS_FNSTSW: int
UC_X86_INS_FPATAN: int
UC_X86_INS_FPREM: int
UC_X86_INS_FPREM1: int
UC_X86_INS_FPTAN: int
UC_X86_INS_FFREEP: int
UC_X86_INS_FRNDINT: int
UC_X86_INS_FRSTOR: int
UC_X86_INS_FNSAVE: int
UC_X86_INS_FSCALE: int
UC_X86_INS_FSETPM: int
UC_X86_INS_FSINCOS: int
UC_X86_INS_FNSTENV: int
UC_X86_INS_FXAM: int
UC_X86_INS_FXRSTOR: int
UC_X86_INS_FXRSTOR64: int
UC_X86_INS_FXSAVE: int
UC_X86_INS_FXSAVE64: int
UC_X86_INS_FXTRACT: int
UC_X86_INS_FYL2X: int
UC_X86_INS_FYL2XP1: int
UC_X86_INS_MOVAPD: int
UC_X86_INS_MOVAPS: int
UC_X86_INS_ORPD: int
UC_X86_INS_ORPS: int
UC_X86_INS_VMOVAPD: int
UC_X86_INS_VMOVAPS: int
UC_X86_INS_XORPD: int
UC_X86_INS_XORPS: int
UC_X86_INS_GETSEC: int
UC_X86_INS_HADDPD: int
UC_X86_INS_HADDPS: int
UC_X86_INS_HLT: int
UC_X86_INS_HSUBPD: int
UC_X86_INS_HSUBPS: int
UC_X86_INS_IDIV: int
UC_X86_INS_FILD: int
UC_X86_INS_IMUL: int
UC_X86_INS_IN: int
UC_X86_INS_INC: int
UC_X86_INS_INSB: int
UC_X86_INS_INSERTPS: int
UC_X86_INS_INSERTQ: int
UC_X86_INS_INSD: int
UC_X86_INS_INSW: int
UC_X86_INS_INT: int
UC_X86_INS_INT1: int
UC_X86_INS_INT3: int
UC_X86_INS_INTO: int
UC_X86_INS_INVD: int
UC_X86_INS_INVEPT: int
UC_X86_INS_INVLPG: int
UC_X86_INS_INVLPGA: int
UC_X86_INS_INVPCID: int
UC_X86_INS_INVVPID: int
UC_X86_INS_IRET: int
UC_X86_INS_IRETD: int
UC_X86_INS_IRETQ: int
UC_X86_INS_FISTTP: int
UC_X86_INS_FIST: int
UC_X86_INS_FISTP: int
UC_X86_INS_UCOMISD: int
UC_X86_INS_UCOMISS: int
UC_X86_INS_VCOMISD: int
UC_X86_INS_VCOMISS: int
UC_X86_INS_VCVTSD2SS: int
UC_X86_INS_VCVTSI2SD: int
UC_X86_INS_VCVTSI2SS: int
UC_X86_INS_VCVTSS2SD: int
UC_X86_INS_VCVTTSD2SI: int
UC_X86_INS_VCVTTSD2USI: int
UC_X86_INS_VCVTTSS2SI: int
UC_X86_INS_VCVTTSS2USI: int
UC_X86_INS_VCVTUSI2SD: int
UC_X86_INS_VCVTUSI2SS: int
UC_X86_INS_VUCOMISD: int
UC_X86_INS_VUCOMISS: int
UC_X86_INS_JAE: int
UC_X86_INS_JA: int
UC_X86_INS_JBE: int
UC_X86_INS_JB: int
UC_X86_INS_JCXZ: int
UC_X86_INS_JECXZ: int
UC_X86_INS_JE: int
UC_X86_INS_JGE: int
UC_X86_INS_JG: int
UC_X86_INS_JLE: int
UC_X86_INS_JL: int
UC_X86_INS_JMP: int
UC_X86_INS_JNE: int
UC_X86_INS_JNO: int
UC_X86_INS_JNP: int
UC_X86_INS_JNS: int
UC_X86_INS_JO: int
UC_X86_INS_JP: int
UC_X86_INS_JRCXZ: int
UC_X86_INS_JS: int
UC_X86_INS_KANDB: int
UC_X86_INS_KANDD: int
UC_X86_INS_KANDNB: int
UC_X86_INS_KANDND: int
UC_X86_INS_KANDNQ: int
UC_X86_INS_KANDNW: int
UC_X86_INS_KANDQ: int
UC_X86_INS_KANDW: int
UC_X86_INS_KMOVB: int
UC_X86_INS_KMOVD: int
UC_X86_INS_KMOVQ: int
UC_X86_INS_KMOVW: int
UC_X86_INS_KNOTB: int
UC_X86_INS_KNOTD: int
UC_X86_INS_KNOTQ: int
UC_X86_INS_KNOTW: int
UC_X86_INS_KORB: int
UC_X86_INS_KORD: int
UC_X86_INS_KORQ: int
UC_X86_INS_KORTESTB: int
UC_X86_INS_KORTESTD: int
UC_X86_INS_KORTESTQ: int
UC_X86_INS_KORTESTW: int
UC_X86_INS_KORW: int
UC_X86_INS_KSHIFTLB: int
UC_X86_INS_KSHIFTLD: int
UC_X86_INS_KSHIFTLQ: int
UC_X86_INS_KSHIFTLW: int
UC_X86_INS_KSHIFTRB: int
UC_X86_INS_KSHIFTRD: int
UC_X86_INS_KSHIFTRQ: int
UC_X86_INS_KSHIFTRW: int
UC_X86_INS_KUNPCKBW: int
UC_X86_INS_KXNORB: int
UC_X86_INS_KXNORD: int
UC_X86_INS_KXNORQ: int
UC_X86_INS_KXNORW: int
UC_X86_INS_KXORB: int
UC_X86_INS_KXORD: int
UC_X86_INS_KXORQ: int
UC_X86_INS_KXORW: int
UC_X86_INS_LAHF: int
UC_X86_INS_LAR: int
UC_X86_INS_LDDQU: int
UC_X86_INS_LDMXCSR: int
UC_X86_INS_LDS: int
UC_X86_INS_FLDZ: int
UC_X86_INS_FLD1: int
UC_X86_INS_FLD: int
UC_X86_INS_LEA: int
UC_X86_INS_LEAVE: int
UC_X86_INS_LES: int
UC_X86_INS_LFENCE: int
UC_X86_INS_LFS: int
UC_X86_INS_LGDT: int
UC_X86_INS_LGS: int
UC_X86_INS_LIDT: int
UC_X86_INS_LLDT: int
UC_X86_INS_LMSW: int
UC_X86_INS_OR: int
UC_X86_INS_SUB: int
UC_X86_INS_XOR: int
UC_X86_INS_LODSB: int
UC_X86_INS_LODSD: int
UC_X86_INS_LODSQ: int
UC_X86_INS_LODSW: int
UC_X86_INS_LOOP: int
UC_X86_INS_LOOPE: int
UC_X86_INS_LOOPNE: int
UC_X86_INS_RETF: int
UC_X86_INS_RETFQ: int
UC_X86_INS_LSL: int
UC_X86_INS_LSS: int
UC_X86_INS_LTR: int
UC_X86_INS_XADD: int
UC_X86_INS_LZCNT: int
UC_X86_INS_MASKMOVDQU: int
UC_X86_INS_MAXPD: int
UC_X86_INS_MAXPS: int
UC_X86_INS_MAXSD: int
UC_X86_INS_MAXSS: int
UC_X86_INS_MFENCE: int
UC_X86_INS_MINPD: int
UC_X86_INS_MINPS: int
UC_X86_INS_MINSD: int
UC_X86_INS_MINSS: int
UC_X86_INS_CVTPD2PI: int
UC_X86_INS_CVTPI2PD: int
UC_X86_INS_CVTPI2PS: int
UC_X86_INS_CVTPS2PI: int
UC_X86_INS_CVTTPD2PI: int
UC_X86_INS_CVTTPS2PI: int
UC_X86_INS_EMMS: int
UC_X86_INS_MASKMOVQ: int
UC_X86_INS_MOVD: int
UC_X86_INS_MOVDQ2Q: int
UC_X86_INS_MOVNTQ: int
UC_X86_INS_MOVQ2DQ: int
UC_X86_INS_MOVQ: int
UC_X86_INS_PABSB: int
UC_X86_INS_PABSD: int
UC_X86_INS_PABSW: int
UC_X86_INS_PACKSSDW: int
UC_X86_INS_PACKSSWB: int
UC_X86_INS_PACKUSWB: int
UC_X86_INS_PADDB: int
UC_X86_INS_PADDD: int
UC_X86_INS_PADDQ: int
UC_X86_INS_PADDSB: int
UC_X86_INS_PADDSW: int
UC_X86_INS_PADDUSB: int
UC_X86_INS_PADDUSW: int
UC_X86_INS_PADDW: int
UC_X86_INS_PALIGNR: int
UC_X86_INS_PANDN: int
UC_X86_INS_PAND: int
UC_X86_INS_PAVGB: int
UC_X86_INS_PAVGW: int
UC_X86_INS_PCMPEQB: int
UC_X86_INS_PCMPEQD: int
UC_X86_INS_PCMPEQW: int
UC_X86_INS_PCMPGTB: int
UC_X86_INS_PCMPGTD: int
UC_X86_INS_PCMPGTW: int
UC_X86_INS_PEXTRW: int
UC_X86_INS_PHADDSW: int
UC_X86_INS_PHADDW: int
UC_X86_INS_PHADDD: int
UC_X86_INS_PHSUBD: int
UC_X86_INS_PHSUBSW: int
UC_X86_INS_PHSUBW: int
UC_X86_INS_PINSRW: int
UC_X86_INS_PMADDUBSW: int
UC_X86_INS_PMADDWD: int
UC_X86_INS_PMAXSW: int
UC_X86_INS_PMAXUB: int
UC_X86_INS_PMINSW: int
UC_X86_INS_PMINUB: int
UC_X86_INS_PMOVMSKB: int
UC_X86_INS_PMULHRSW: int
UC_X86_INS_PMULHUW: int
UC_X86_INS_PMULHW: int
UC_X86_INS_PMULLW: int
UC_X86_INS_PMULUDQ: int
UC_X86_INS_POR: int
UC_X86_INS_PSADBW: int
UC_X86_INS_PSHUFB: int
UC_X86_INS_PSHUFW: int
UC_X86_INS_PSIGNB: int
UC_X86_INS_PSIGND: int
UC_X86_INS_PSIGNW: int
UC_X86_INS_PSLLD: int
UC_X86_INS_PSLLQ: int
UC_X86_INS_PSLLW: int
UC_X86_INS_PSRAD: int
UC_X86_INS_PSRAW: int
UC_X86_INS_PSRLD: int
UC_X86_INS_PSRLQ: int
UC_X86_INS_PSRLW: int
UC_X86_INS_PSUBB: int
UC_X86_INS_PSUBD: int
UC_X86_INS_PSUBQ: int
UC_X86_INS_PSUBSB: int
UC_X86_INS_PSUBSW: int
UC_X86_INS_PSUBUSB: int
UC_X86_INS_PSUBUSW: int
UC_X86_INS_PSUBW: int
UC_X86_INS_PUNPCKHBW: int
UC_X86_INS_PUNPCKHDQ: int
UC_X86_INS_PUNPCKHWD: int
UC_X86_INS_PUNPCKLBW: int
UC_X86_INS_PUNPCKLDQ: int
UC_X86_INS_PUNPCKLWD: int
UC_X86_INS_PXOR: int
UC_X86_INS_MONITOR: int
UC_X86_INS_MONTMUL: int
UC_X86_INS_MOV: int
UC_X86_INS_MOVABS: int
UC_X86_INS_MOVBE: int
UC_X86_INS_MOVDDUP: int
UC_X86_INS_MOVDQA: int
UC_X86_INS_MOVDQU: int
UC_X86_INS_MOVHLPS: int
UC_X86_INS_MOVHPD: int
UC_X86_INS_MOVHPS: int
UC_X86_INS_MOVLHPS: int
UC_X86_INS_MOVLPD: int
UC_X86_INS_MOVLPS: int
UC_X86_INS_MOVMSKPD: int
UC_X86_INS_MOVMSKPS: int
UC_X86_INS_MOVNTDQA: int
UC_X86_INS_MOVNTDQ: int
UC_X86_INS_MOVNTI: int
UC_X86_INS_MOVNTPD: int
UC_X86_INS_MOVNTPS: int
UC_X86_INS_MOVNTSD: int
UC_X86_INS_MOVNTSS: int
UC_X86_INS_MOVSB: int
UC_X86_INS_MOVSD: int
UC_X86_INS_MOVSHDUP: int
UC_X86_INS_MOVSLDUP: int
UC_X86_INS_MOVSQ: int
UC_X86_INS_MOVSS: int
UC_X86_INS_MOVSW: int
UC_X86_INS_MOVSX: int
UC_X86_INS_MOVSXD: int
UC_X86_INS_MOVUPD: int
UC_X86_INS_MOVUPS: int
UC_X86_INS_MOVZX: int
UC_X86_INS_MPSADBW: int
UC_X86_INS_MUL: int
UC_X86_INS_MULPD: int
UC_X86_INS_MULPS: int
UC_X86_INS_MULSD: int
UC_X86_INS_MULSS: int
UC_X86_INS_MULX: int
UC_X86_INS_FMUL: int
UC_X86_INS_FIMUL: int
UC_X86_INS_FMULP: int
UC_X86_INS_MWAIT: int
UC_X86_INS_NEG: int
UC_X86_INS_NOP: int
UC_X86_INS_NOT: int
UC_X86_INS_OUT: int
UC_X86_INS_OUTSB: int
UC_X86_INS_OUTSD: int
UC_X86_INS_OUTSW: int
UC_X86_INS_PACKUSDW: int
UC_X86_INS_PAUSE: int
UC_X86_INS_PAVGUSB: int
UC_X86_INS_PBLENDVB: int
UC_X86_INS_PBLENDW: int
UC_X86_INS_PCLMULQDQ: int
UC_X86_INS_PCMPEQQ: int
UC_X86_INS_PCMPESTRI: int
UC_X86_INS_PCMPESTRM: int
UC_X86_INS_PCMPGTQ: int
UC_X86_INS_PCMPISTRI: int
UC_X86_INS_PCMPISTRM: int
UC_X86_INS_PCOMMIT: int
UC_X86_INS_PDEP: int
UC_X86_INS_PEXT: int
UC_X86_INS_PEXTRB: int
UC_X86_INS_PEXTRD: int
UC_X86_INS_PEXTRQ: int
UC_X86_INS_PF2ID: int
UC_X86_INS_PF2IW: int
UC_X86_INS_PFACC: int
UC_X86_INS_PFADD: int
UC_X86_INS_PFCMPEQ: int
UC_X86_INS_PFCMPGE: int
UC_X86_INS_PFCMPGT: int
UC_X86_INS_PFMAX: int
UC_X86_INS_PFMIN: int
UC_X86_INS_PFMUL: int
UC_X86_INS_PFNACC: int
UC_X86_INS_PFPNACC: int
UC_X86_INS_PFRCPIT1: int
UC_X86_INS_PFRCPIT2: int
UC_X86_INS_PFRCP: int
UC_X86_INS_PFRSQIT1: int
UC_X86_INS_PFRSQRT: int
UC_X86_INS_PFSUBR: int
UC_X86_INS_PFSUB: int
UC_X86_INS_PHMINPOSUW: int
UC_X86_INS_PI2FD: int
UC_X86_INS_PI2FW: int
UC_X86_INS_PINSRB: int
UC_X86_INS_PINSRD: int
UC_X86_INS_PINSRQ: int
UC_X86_INS_PMAXSB: int
UC_X86_INS_PMAXSD: int
UC_X86_INS_PMAXUD: int
UC_X86_INS_PMAXUW: int
UC_X86_INS_PMINSB: int
UC_X86_INS_PMINSD: int
UC_X86_INS_PMINUD: int
UC_X86_INS_PMINUW: int
UC_X86_INS_PMOVSXBD: int
UC_X86_INS_PMOVSXBQ: int
UC_X86_INS_PMOVSXBW: int
UC_X86_INS_PMOVSXDQ: int
UC_X86_INS_PMOVSXWD: int
UC_X86_INS_PMOVSXWQ: int
UC_X86_INS_PMOVZXBD: int
UC_X86_INS_PMOVZXBQ: int
UC_X86_INS_PMOVZXBW: int
UC_X86_INS_PMOVZXDQ: int
UC_X86_INS_PMOVZXWD: int
UC_X86_INS_PMOVZXWQ: int
UC_X86_INS_PMULDQ: int
UC_X86_INS_PMULHRW: int
UC_X86_INS_PMULLD: int
UC_X86_INS_POP: int
UC_X86_INS_POPAW: int
UC_X86_INS_POPAL: int
UC_X86_INS_POPCNT: int
UC_X86_INS_POPF: int
UC_X86_INS_POPFD: int
UC_X86_INS_POPFQ: int
UC_X86_INS_PREFETCH: int
UC_X86_INS_PREFETCHNTA: int
UC_X86_INS_PREFETCHT0: int
UC_X86_INS_PREFETCHT1: int
UC_X86_INS_PREFETCHT2: int
UC_X86_INS_PREFETCHW: int
UC_X86_INS_PSHUFD: int
UC_X86_INS_PSHUFHW: int
UC_X86_INS_PSHUFLW: int
UC_X86_INS_PSLLDQ: int
UC_X86_INS_PSRLDQ: int
UC_X86_INS_PSWAPD: int
UC_X86_INS_PTEST: int
UC_X86_INS_PUNPCKHQDQ: int
UC_X86_INS_PUNPCKLQDQ: int
UC_X86_INS_PUSH: int
UC_X86_INS_PUSHAW: int
UC_X86_INS_PUSHAL: int
UC_X86_INS_PUSHF: int
UC_X86_INS_PUSHFD: int
UC_X86_INS_PUSHFQ: int
UC_X86_INS_RCL: int
UC_X86_INS_RCPPS: int
UC_X86_INS_RCPSS: int
UC_X86_INS_RCR: int
UC_X86_INS_RDFSBASE: int
UC_X86_INS_RDGSBASE: int
UC_X86_INS_RDMSR: int
UC_X86_INS_RDPMC: int
UC_X86_INS_RDRAND: int
UC_X86_INS_RDSEED: int
UC_X86_INS_RDTSC: int
UC_X86_INS_RDTSCP: int
UC_X86_INS_ROL: int
UC_X86_INS_ROR: int
UC_X86_INS_RORX: int
UC_X86_INS_ROUNDPD: int
UC_X86_INS_ROUNDPS: int
UC_X86_INS_ROUNDSD: int
UC_X86_INS_ROUNDSS: int
UC_X86_INS_RSM: int
UC_X86_INS_RSQRTPS: int
UC_X86_INS_RSQRTSS: int
UC_X86_INS_SAHF: int
UC_X86_INS_SAL: int
UC_X86_INS_SALC: int
UC_X86_INS_SAR: int
UC_X86_INS_SARX: int
UC_X86_INS_SBB: int
UC_X86_INS_SCASB: int
UC_X86_INS_SCASD: int
UC_X86_INS_SCASQ: int
UC_X86_INS_SCASW: int
UC_X86_INS_SETAE: int
UC_X86_INS_SETA: int
UC_X86_INS_SETBE: int
UC_X86_INS_SETB: int
UC_X86_INS_SETE: int
UC_X86_INS_SETGE: int
UC_X86_INS_SETG: int
UC_X86_INS_SETLE: int
UC_X86_INS_SETL: int
UC_X86_INS_SETNE: int
UC_X86_INS_SETNO: int
UC_X86_INS_SETNP: int
UC_X86_INS_SETNS: int
UC_X86_INS_SETO: int
UC_X86_INS_SETP: int
UC_X86_INS_SETS: int
UC_X86_INS_SFENCE: int
UC_X86_INS_SGDT: int
UC_X86_INS_SHA1MSG1: int
UC_X86_INS_SHA1MSG2: int
UC_X86_INS_SHA1NEXTE: int
UC_X86_INS_SHA1RNDS4: int
UC_X86_INS_SHA256MSG1: int
UC_X86_INS_SHA256MSG2: int
UC_X86_INS_SHA256RNDS2: int
UC_X86_INS_SHL: int
UC_X86_INS_SHLD: int
UC_X86_INS_SHLX: int
UC_X86_INS_SHR: int
UC_X86_INS_SHRD: int
UC_X86_INS_SHRX: int
UC_X86_INS_SHUFPD: int
UC_X86_INS_SHUFPS: int
UC_X86_INS_SIDT: int
UC_X86_INS_FSIN: int
UC_X86_INS_SKINIT: int
UC_X86_INS_SLDT: int
UC_X86_INS_SMSW: int
UC_X86_INS_SQRTPD: int
UC_X86_INS_SQRTPS: int
UC_X86_INS_SQRTSD: int
UC_X86_INS_SQRTSS: int
UC_X86_INS_FSQRT: int
UC_X86_INS_STAC: int
UC_X86_INS_STC: int
UC_X86_INS_STD: int
UC_X86_INS_STGI: int
UC_X86_INS_STI: int
UC_X86_INS_STMXCSR: int
UC_X86_INS_STOSB: int
UC_X86_INS_STOSD: int
UC_X86_INS_STOSQ: int
UC_X86_INS_STOSW: int
UC_X86_INS_STR: int
UC_X86_INS_FST: int
UC_X86_INS_FSTP: int
UC_X86_INS_FSTPNCE: int
UC_X86_INS_FXCH: int
UC_X86_INS_SUBPD: int
UC_X86_INS_SUBPS: int
UC_X86_INS_FSUBR: int
UC_X86_INS_FISUBR: int
UC_X86_INS_FSUBRP: int
UC_X86_INS_SUBSD: int
UC_X86_INS_SUBSS: int
UC_X86_INS_FSUB: int
UC_X86_INS_FISUB: int
UC_X86_INS_FSUBP: int
UC_X86_INS_SWAPGS: int
UC_X86_INS_SYSCALL: int
UC_X86_INS_SYSENTER: int
UC_X86_INS_SYSEXIT: int
UC_X86_INS_SYSRET: int
UC_X86_INS_T1MSKC: int
UC_X86_INS_TEST: int
UC_X86_INS_UD2: int
UC_X86_INS_FTST: int
UC_X86_INS_TZCNT: int
UC_X86_INS_TZMSK: int
UC_X86_INS_FUCOMPI: int
UC_X86_INS_FUCOMI: int
UC_X86_INS_FUCOMPP: int
UC_X86_INS_FUCOMP: int
UC_X86_INS_FUCOM: int
UC_X86_INS_UD2B: int
UC_X86_INS_UNPCKHPD: int
UC_X86_INS_UNPCKHPS: int
UC_X86_INS_UNPCKLPD: int
UC_X86_INS_UNPCKLPS: int
UC_X86_INS_VADDPD: int
UC_X86_INS_VADDPS: int
UC_X86_INS_VADDSD: int
UC_X86_INS_VADDSS: int
UC_X86_INS_VADDSUBPD: int
UC_X86_INS_VADDSUBPS: int
UC_X86_INS_VAESDECLAST: int
UC_X86_INS_VAESDEC: int
UC_X86_INS_VAESENCLAST: int
UC_X86_INS_VAESENC: int
UC_X86_INS_VAESIMC: int
UC_X86_INS_VAESKEYGENASSIST: int
UC_X86_INS_VALIGND: int
UC_X86_INS_VALIGNQ: int
UC_X86_INS_VANDNPD: int
UC_X86_INS_VANDNPS: int
UC_X86_INS_VANDPD: int
UC_X86_INS_VANDPS: int
UC_X86_INS_VBLENDMPD: int
UC_X86_INS_VBLENDMPS: int
UC_X86_INS_VBLENDPD: int
UC_X86_INS_VBLENDPS: int
UC_X86_INS_VBLENDVPD: int
UC_X86_INS_VBLENDVPS: int
UC_X86_INS_VBROADCASTF128: int
UC_X86_INS_VBROADCASTI32X4: int
UC_X86_INS_VBROADCASTI64X4: int
UC_X86_INS_VBROADCASTSD: int
UC_X86_INS_VBROADCASTSS: int
UC_X86_INS_VCMPPD: int
UC_X86_INS_VCMPPS: int
UC_X86_INS_VCMPSD: int
UC_X86_INS_VCMPSS: int
UC_X86_INS_VCOMPRESSPD: int
UC_X86_INS_VCOMPRESSPS: int
UC_X86_INS_VCVTDQ2PD: int
UC_X86_INS_VCVTDQ2PS: int
UC_X86_INS_VCVTPD2DQX: int
UC_X86_INS_VCVTPD2DQ: int
UC_X86_INS_VCVTPD2PSX: int
UC_X86_INS_VCVTPD2PS: int
UC_X86_INS_VCVTPD2UDQ: int
UC_X86_INS_VCVTPH2PS: int
UC_X86_INS_VCVTPS2DQ: int
UC_X86_INS_VCVTPS2PD: int
UC_X86_INS_VCVTPS2PH: int
UC_X86_INS_VCVTPS2UDQ: int
UC_X86_INS_VCVTSD2SI: int
UC_X86_INS_VCVTSD2USI: int
UC_X86_INS_VCVTSS2SI: int
UC_X86_INS_VCVTSS2USI: int
UC_X86_INS_VCVTTPD2DQX: int
UC_X86_INS_VCVTTPD2DQ: int
UC_X86_INS_VCVTTPD2UDQ: int
UC_X86_INS_VCVTTPS2DQ: int
UC_X86_INS_VCVTTPS2UDQ: int
UC_X86_INS_VCVTUDQ2PD: int
UC_X86_INS_VCVTUDQ2PS: int
UC_X86_INS_VDIVPD: int
UC_X86_INS_VDIVPS: int
UC_X86_INS_VDIVSD: int
UC_X86_INS_VDIVSS: int
UC_X86_INS_VDPPD: int
UC_X86_INS_VDPPS: int
UC_X86_INS_VERR: int
UC_X86_INS_VERW: int
UC_X86_INS_VEXP2PD: int
UC_X86_INS_VEXP2PS: int
UC_X86_INS_VEXPANDPD: int
UC_X86_INS_VEXPANDPS: int
UC_X86_INS_VEXTRACTF128: int
UC_X86_INS_VEXTRACTF32X4: int
UC_X86_INS_VEXTRACTF64X4: int
UC_X86_INS_VEXTRACTI128: int
UC_X86_INS_VEXTRACTI32X4: int
UC_X86_INS_VEXTRACTI64X4: int
UC_X86_INS_VEXTRACTPS: int
UC_X86_INS_VFMADD132PD: int
UC_X86_INS_VFMADD132PS: int
UC_X86_INS_VFMADDPD: int
UC_X86_INS_VFMADD213PD: int
UC_X86_INS_VFMADD231PD: int
UC_X86_INS_VFMADDPS: int
UC_X86_INS_VFMADD213PS: int
UC_X86_INS_VFMADD231PS: int
UC_X86_INS_VFMADDSD: int
UC_X86_INS_VFMADD213SD: int
UC_X86_INS_VFMADD132SD: int
UC_X86_INS_VFMADD231SD: int
UC_X86_INS_VFMADDSS: int
UC_X86_INS_VFMADD213SS: int
UC_X86_INS_VFMADD132SS: int
UC_X86_INS_VFMADD231SS: int
UC_X86_INS_VFMADDSUB132PD: int
UC_X86_INS_VFMADDSUB132PS: int
UC_X86_INS_VFMADDSUBPD: int
UC_X86_INS_VFMADDSUB213PD: int
UC_X86_INS_VFMADDSUB231PD: int
UC_X86_INS_VFMADDSUBPS: int
UC_X86_INS_VFMADDSUB213PS: int
UC_X86_INS_VFMADDSUB231PS: int
UC_X86_INS_VFMSUB132PD: int
UC_X86_INS_VFMSUB132PS: int
UC_X86_INS_VFMSUBADD132PD: int
UC_X86_INS_VFMSUBADD132PS: int
UC_X86_INS_VFMSUBADDPD: int
UC_X86_INS_VFMSUBADD213PD: int
UC_X86_INS_VFMSUBADD231PD: int
UC_X86_INS_VFMSUBADDPS: int
UC_X86_INS_VFMSUBADD213PS: int
UC_X86_INS_VFMSUBADD231PS: int
UC_X86_INS_VFMSUBPD: int
UC_X86_INS_VFMSUB213PD: int
UC_X86_INS_VFMSUB231PD: int
UC_X86_INS_VFMSUBPS: int
UC_X86_INS_VFMSUB213PS: int
UC_X86_INS_VFMSUB231PS: int
UC_X86_INS_VFMSUBSD: int
UC_X86_INS_VFMSUB213SD: int
UC_X86_INS_VFMSUB132SD: int
UC_X86_INS_VFMSUB231SD: int
UC_X86_INS_VFMSUBSS: int
UC_X86_INS_VFMSUB213SS: int
UC_X86_INS_VFMSUB132SS: int
UC_X86_INS_VFMSUB231SS: int
UC_X86_INS_VFNMADD132PD: int
UC_X86_INS_VFNMADD132PS: int
UC_X86_INS_VFNMADDPD: int
UC_X86_INS_VFNMADD213PD: int
UC_X86_INS_VFNMADD231PD: int
UC_X86_INS_VFNMADDPS: int
UC_X86_INS_VFNMADD213PS: int
UC_X86_INS_VFNMADD231PS: int
UC_X86_INS_VFNMADDSD: int
UC_X86_INS_VFNMADD213SD: int
UC_X86_INS_VFNMADD132SD: int
UC_X86_INS_VFNMADD231SD: int
UC_X86_INS_VFNMADDSS: int
UC_X86_INS_VFNMADD213SS: int
UC_X86_INS_VFNMADD132SS: int
UC_X86_INS_VFNMADD231SS: int
UC_X86_INS_VFNMSUB132PD: int
UC_X86_INS_VFNMSUB132PS: int
UC_X86_INS_VFNMSUBPD: int
UC_X86_INS_VFNMSUB213PD: int
UC_X86_INS_VFNMSUB231PD: int
UC_X86_INS_VFNMSUBPS: int
UC_X86_INS_VFNMSUB213PS: int
UC_X86_INS_VFNMSUB231PS: int
UC_X86_INS_VFNMSUBSD: int
UC_X86_INS_VFNMSUB213SD: int
UC_X86_INS_VFNMSUB132SD: int
UC_X86_INS_VFNMSUB231SD: int
UC_X86_INS_VFNMSUBSS: int
UC_X86_INS_VFNMSUB213SS: int
UC_X86_INS_VFNMSUB132SS: int
UC_X86_INS_VFNMSUB231SS: int
UC_X86_INS_VFRCZPD: int
UC_X86_INS_VFRCZPS: int
UC_X86_INS_VFRCZSD: int
UC_X86_INS_VFRCZSS: int
UC_X86_INS_VORPD: int
UC_X86_INS_VORPS: int
UC_X86_INS_VXORPD: int
UC_X86_INS_VXORPS: int
UC_X86_INS_VGATHERDPD: int
UC_X86_INS_VGATHERDPS: int
UC_X86_INS_VGATHERPF0DPD: int
UC_X86_INS_VGATHERPF0DPS: int
UC_X86_INS_VGATHERPF0QPD: int
UC_X86_INS_VGATHERPF0QPS: int
UC_X86_INS_VGATHERPF1DPD: int
UC_X86_INS_VGATHERPF1DPS: int
UC_X86_INS_VGATHERPF1QPD: int
UC_X86_INS_VGATHERPF1QPS: int
UC_X86_INS_VGATHERQPD: int
UC_X86_INS_VGATHERQPS: int
UC_X86_INS_VHADDPD: int
UC_X86_INS_VHADDPS: int
UC_X86_INS_VHSUBPD: int
UC_X86_INS_VHSUBPS: int
UC_X86_INS_VINSERTF128: int
UC_X86_INS_VINSERTF32X4: int
UC_X86_INS_VINSERTF32X8: int
UC_X86_INS_VINSERTF64X2: int
UC_X86_INS_VINSERTF64X4: int
UC_X86_INS_VINSERTI128: int
UC_X86_INS_VINSERTI32X4: int
UC_X86_INS_VINSERTI32X8: int
UC_X86_INS_VINSERTI64X2: int
UC_X86_INS_VINSERTI64X4: int
UC_X86_INS_VINSERTPS: int
UC_X86_INS_VLDDQU: int
UC_X86_INS_VLDMXCSR: int
UC_X86_INS_VMASKMOVDQU: int
UC_X86_INS_VMASKMOVPD: int
UC_X86_INS_VMASKMOVPS: int
UC_X86_INS_VMAXPD: int
UC_X86_INS_VMAXPS: int
UC_X86_INS_VMAXSD: int
UC_X86_INS_VMAXSS: int
UC_X86_INS_VMCALL: int
UC_X86_INS_VMCLEAR: int
UC_X86_INS_VMFUNC: int
UC_X86_INS_VMINPD: int
UC_X86_INS_VMINPS: int
UC_X86_INS_VMINSD: int
UC_X86_INS_VMINSS: int
UC_X86_INS_VMLAUNCH: int
UC_X86_INS_VMLOAD: int
UC_X86_INS_VMMCALL: int
UC_X86_INS_VMOVQ: int
UC_X86_INS_VMOVDDUP: int
UC_X86_INS_VMOVD: int
UC_X86_INS_VMOVDQA32: int
UC_X86_INS_VMOVDQA64: int
UC_X86_INS_VMOVDQA: int
UC_X86_INS_VMOVDQU16: int
UC_X86_INS_VMOVDQU32: int
UC_X86_INS_VMOVDQU64: int
UC_X86_INS_VMOVDQU8: int
UC_X86_INS_VMOVDQU: int
UC_X86_INS_VMOVHLPS: int
UC_X86_INS_VMOVHPD: int
UC_X86_INS_VMOVHPS: int
UC_X86_INS_VMOVLHPS: int
UC_X86_INS_VMOVLPD: int
UC_X86_INS_VMOVLPS: int
UC_X86_INS_VMOVMSKPD: int
UC_X86_INS_VMOVMSKPS: int
UC_X86_INS_VMOVNTDQA: int
UC_X86_INS_VMOVNTDQ: int
UC_X86_INS_VMOVNTPD: int
UC_X86_INS_VMOVNTPS: int
UC_X86_INS_VMOVSD: int
UC_X86_INS_VMOVSHDUP: int
UC_X86_INS_VMOVSLDUP: int
UC_X86_INS_VMOVSS: int
UC_X86_INS_VMOVUPD: int
UC_X86_INS_VMOVUPS: int
UC_X86_INS_VMPSADBW: int
UC_X86_INS_VMPTRLD: int
UC_X86_INS_VMPTRST: int
UC_X86_INS_VMREAD: int
UC_X86_INS_VMRESUME: int
UC_X86_INS_VMRUN: int
UC_X86_INS_VMSAVE: int
UC_X86_INS_VMULPD: int
UC_X86_INS_VMULPS: int
UC_X86_INS_VMULSD: int
UC_X86_INS_VMULSS: int
UC_X86_INS_VMWRITE: int
UC_X86_INS_VMXOFF: int
UC_X86_INS_VMXON: int
UC_X86_INS_VPABSB: int
UC_X86_INS_VPABSD: int
UC_X86_INS_VPABSQ: int
UC_X86_INS_VPABSW: int
UC_X86_INS_VPACKSSDW: int
UC_X86_INS_VPACKSSWB: int
UC_X86_INS_VPACKUSDW: int
UC_X86_INS_VPACKUSWB: int
UC_X86_INS_VPADDB: int
UC_X86_INS_VPADDD: int
UC_X86_INS_VPADDQ: int
UC_X86_INS_VPADDSB: int
UC_X86_INS_VPADDSW: int
UC_X86_INS_VPADDUSB: int
UC_X86_INS_VPADDUSW: int
UC_X86_INS_VPADDW: int
UC_X86_INS_VPALIGNR: int
UC_X86_INS_VPANDD: int
UC_X86_INS_VPANDND: int
UC_X86_INS_VPANDNQ: int
UC_X86_INS_VPANDN: int
UC_X86_INS_VPANDQ: int
UC_X86_INS_VPAND: int
UC_X86_INS_VPAVGB: int
UC_X86_INS_VPAVGW: int
UC_X86_INS_VPBLENDD: int
UC_X86_INS_VPBLENDMB: int
UC_X86_INS_VPBLENDMD: int
UC_X86_INS_VPBLENDMQ: int
UC_X86_INS_VPBLENDMW: int
UC_X86_INS_VPBLENDVB: int
UC_X86_INS_VPBLENDW: int
UC_X86_INS_VPBROADCASTB: int
UC_X86_INS_VPBROADCASTD: int
UC_X86_INS_VPBROADCASTMB2Q: int
UC_X86_INS_VPBROADCASTMW2D: int
UC_X86_INS_VPBROADCASTQ: int
UC_X86_INS_VPBROADCASTW: int
UC_X86_INS_VPCLMULQDQ: int
UC_X86_INS_VPCMOV: int
UC_X86_INS_VPCMPB: int
UC_X86_INS_VPCMPD: int
UC_X86_INS_VPCMPEQB: int
UC_X86_INS_VPCMPEQD: int
UC_X86_INS_VPCMPEQQ: int
UC_X86_INS_VPCMPEQW: int
UC_X86_INS_VPCMPESTRI: int
UC_X86_INS_VPCMPESTRM: int
UC_X86_INS_VPCMPGTB: int
UC_X86_INS_VPCMPGTD: int
UC_X86_INS_VPCMPGTQ: int
UC_X86_INS_VPCMPGTW: int
UC_X86_INS_VPCMPISTRI: int
UC_X86_INS_VPCMPISTRM: int
UC_X86_INS_VPCMPQ: int
UC_X86_INS_VPCMPUB: int
UC_X86_INS_VPCMPUD: int
UC_X86_INS_VPCMPUQ: int
UC_X86_INS_VPCMPUW: int
UC_X86_INS_VPCMPW: int
UC_X86_INS_VPCOMB: int
UC_X86_INS_VPCOMD: int
UC_X86_INS_VPCOMPRESSD: int
UC_X86_INS_VPCOMPRESSQ: int
UC_X86_INS_VPCOMQ: int
UC_X86_INS_VPCOMUB: int
UC_X86_INS_VPCOMUD: int
UC_X86_INS_VPCOMUQ: int
UC_X86_INS_VPCOMUW: int
UC_X86_INS_VPCOMW: int
UC_X86_INS_VPCONFLICTD: int
UC_X86_INS_VPCONFLICTQ: int
UC_X86_INS_VPERM2F128: int
UC_X86_INS_VPERM2I128: int
UC_X86_INS_VPERMD: int
UC_X86_INS_VPERMI2D: int
UC_X86_INS_VPERMI2PD: int
UC_X86_INS_VPERMI2PS: int
UC_X86_INS_VPERMI2Q: int
UC_X86_INS_VPERMIL2PD: int
UC_X86_INS_VPERMIL2PS: int
UC_X86_INS_VPERMILPD: int
UC_X86_INS_VPERMILPS: int
UC_X86_INS_VPERMPD: int
UC_X86_INS_VPERMPS: int
UC_X86_INS_VPERMQ: int
UC_X86_INS_VPERMT2D: int
UC_X86_INS_VPERMT2PD: int
UC_X86_INS_VPERMT2PS: int
UC_X86_INS_VPERMT2Q: int
UC_X86_INS_VPEXPANDD: int
UC_X86_INS_VPEXPANDQ: int
UC_X86_INS_VPEXTRB: int
UC_X86_INS_VPEXTRD: int
UC_X86_INS_VPEXTRQ: int
UC_X86_INS_VPEXTRW: int
UC_X86_INS_VPGATHERDD: int
UC_X86_INS_VPGATHERDQ: int
UC_X86_INS_VPGATHERQD: int
UC_X86_INS_VPGATHERQQ: int
UC_X86_INS_VPHADDBD: int
UC_X86_INS_VPHADDBQ: int
UC_X86_INS_VPHADDBW: int
UC_X86_INS_VPHADDDQ: int
UC_X86_INS_VPHADDD: int
UC_X86_INS_VPHADDSW: int
UC_X86_INS_VPHADDUBD: int
UC_X86_INS_VPHADDUBQ: int
UC_X86_INS_VPHADDUBW: int
UC_X86_INS_VPHADDUDQ: int
UC_X86_INS_VPHADDUWD: int
UC_X86_INS_VPHADDUWQ: int
UC_X86_INS_VPHADDWD: int
UC_X86_INS_VPHADDWQ: int
UC_X86_INS_VPHADDW: int
UC_X86_INS_VPHMINPOSUW: int
UC_X86_INS_VPHSUBBW: int
UC_X86_INS_VPHSUBDQ: int
UC_X86_INS_VPHSUBD: int
UC_X86_INS_VPHSUBSW: int
UC_X86_INS_VPHSUBWD: int
UC_X86_INS_VPHSUBW: int
UC_X86_INS_VPINSRB: int
UC_X86_INS_VPINSRD: int
UC_X86_INS_VPINSRQ: int
UC_X86_INS_VPINSRW: int
UC_X86_INS_VPLZCNTD: int
UC_X86_INS_VPLZCNTQ: int
UC_X86_INS_VPMACSDD: int
UC_X86_INS_VPMACSDQH: int
UC_X86_INS_VPMACSDQL: int
UC_X86_INS_VPMACSSDD: int
UC_X86_INS_VPMACSSDQH: int
UC_X86_INS_VPMACSSDQL: int
UC_X86_INS_VPMACSSWD: int
UC_X86_INS_VPMACSSWW: int
UC_X86_INS_VPMACSWD: int
UC_X86_INS_VPMACSWW: int
UC_X86_INS_VPMADCSSWD: int
UC_X86_INS_VPMADCSWD: int
UC_X86_INS_VPMADDUBSW: int
UC_X86_INS_VPMADDWD: int
UC_X86_INS_VPMASKMOVD: int
UC_X86_INS_VPMASKMOVQ: int
UC_X86_INS_VPMAXSB: int
UC_X86_INS_VPMAXSD: int
UC_X86_INS_VPMAXSQ: int
UC_X86_INS_VPMAXSW: int
UC_X86_INS_VPMAXUB: int
UC_X86_INS_VPMAXUD: int
UC_X86_INS_VPMAXUQ: int
UC_X86_INS_VPMAXUW: int
UC_X86_INS_VPMINSB: int
UC_X86_INS_VPMINSD: int
UC_X86_INS_VPMINSQ: int
UC_X86_INS_VPMINSW: int
UC_X86_INS_VPMINUB: int
UC_X86_INS_VPMINUD: int
UC_X86_INS_VPMINUQ: int
UC_X86_INS_VPMINUW: int
UC_X86_INS_VPMOVDB: int
UC_X86_INS_VPMOVDW: int
UC_X86_INS_VPMOVM2B: int
UC_X86_INS_VPMOVM2D: int
UC_X86_INS_VPMOVM2Q: int
UC_X86_INS_VPMOVM2W: int
UC_X86_INS_VPMOVMSKB: int
UC_X86_INS_VPMOVQB: int
UC_X86_INS_VPMOVQD: int
UC_X86_INS_VPMOVQW: int
UC_X86_INS_VPMOVSDB: int
UC_X86_INS_VPMOVSDW: int
UC_X86_INS_VPMOVSQB: int
UC_X86_INS_VPMOVSQD: int
UC_X86_INS_VPMOVSQW: int
UC_X86_INS_VPMOVSXBD: int
UC_X86_INS_VPMOVSXBQ: int
UC_X86_INS_VPMOVSXBW: int
UC_X86_INS_VPMOVSXDQ: int
UC_X86_INS_VPMOVSXWD: int
UC_X86_INS_VPMOVSXWQ: int
UC_X86_INS_VPMOVUSDB: int
UC_X86_INS_VPMOVUSDW: int
UC_X86_INS_VPMOVUSQB: int
UC_X86_INS_VPMOVUSQD: int
UC_X86_INS_VPMOVUSQW: int
UC_X86_INS_VPMOVZXBD: int
UC_X86_INS_VPMOVZXBQ: int
UC_X86_INS_VPMOVZXBW: int
UC_X86_INS_VPMOVZXDQ: int
UC_X86_INS_VPMOVZXWD: int
UC_X86_INS_VPMOVZXWQ: int
UC_X86_INS_VPMULDQ: int
UC_X86_INS_VPMULHRSW: int
UC_X86_INS_VPMULHUW: int
UC_X86_INS_VPMULHW: int
UC_X86_INS_VPMULLD: int
UC_X86_INS_VPMULLQ: int
UC_X86_INS_VPMULLW: int
UC_X86_INS_VPMULUDQ: int
UC_X86_INS_VPORD: int
UC_X86_INS_VPORQ: int
UC_X86_INS_VPOR: int
UC_X86_INS_VPPERM: int
UC_X86_INS_VPROTB: int
UC_X86_INS_VPROTD: int
UC_X86_INS_VPROTQ: int
UC_X86_INS_VPROTW: int
UC_X86_INS_VPSADBW: int
UC_X86_INS_VPSCATTERDD: int
UC_X86_INS_VPSCATTERDQ: int
UC_X86_INS_VPSCATTERQD: int
UC_X86_INS_VPSCATTERQQ: int
UC_X86_INS_VPSHAB: int
UC_X86_INS_VPSHAD: int
UC_X86_INS_VPSHAQ: int
UC_X86_INS_VPSHAW: int
UC_X86_INS_VPSHLB: int
UC_X86_INS_VPSHLD: int
UC_X86_INS_VPSHLQ: int
UC_X86_INS_VPSHLW: int
UC_X86_INS_VPSHUFB: int
UC_X86_INS_VPSHUFD: int
UC_X86_INS_VPSHUFHW: int
UC_X86_INS_VPSHUFLW: int
UC_X86_INS_VPSIGNB: int
UC_X86_INS_VPSIGND: int
UC_X86_INS_VPSIGNW: int
UC_X86_INS_VPSLLDQ: int
UC_X86_INS_VPSLLD: int
UC_X86_INS_VPSLLQ: int
UC_X86_INS_VPSLLVD: int
UC_X86_INS_VPSLLVQ: int
UC_X86_INS_VPSLLW: int
UC_X86_INS_VPSRAD: int
UC_X86_INS_VPSRAQ: int
UC_X86_INS_VPSRAVD: int
UC_X86_INS_VPSRAVQ: int
UC_X86_INS_VPSRAW: int
UC_X86_INS_VPSRLDQ: int
UC_X86_INS_VPSRLD: int
UC_X86_INS_VPSRLQ: int
UC_X86_INS_VPSRLVD: int
UC_X86_INS_VPSRLVQ: int
UC_X86_INS_VPSRLW: int
UC_X86_INS_VPSUBB: int
UC_X86_INS_VPSUBD: int
UC_X86_INS_VPSUBQ: int
UC_X86_INS_VPSUBSB: int
UC_X86_INS_VPSUBSW: int
UC_X86_INS_VPSUBUSB: int
UC_X86_INS_VPSUBUSW: int
UC_X86_INS_VPSUBW: int
UC_X86_INS_VPTESTMD: int
UC_X86_INS_VPTESTMQ: int
UC_X86_INS_VPTESTNMD: int
UC_X86_INS_VPTESTNMQ: int
UC_X86_INS_VPTEST: int
UC_X86_INS_VPUNPCKHBW: int
UC_X86_INS_VPUNPCKHDQ: int
UC_X86_INS_VPUNPCKHQDQ: int
UC_X86_INS_VPUNPCKHWD: int
UC_X86_INS_VPUNPCKLBW: int
UC_X86_INS_VPUNPCKLDQ: int
UC_X86_INS_VPUNPCKLQDQ: int
UC_X86_INS_VPUNPCKLWD: int
UC_X86_INS_VPXORD: int
UC_X86_INS_VPXORQ: int
UC_X86_INS_VPXOR: int
UC_X86_INS_VRCP14PD: int
UC_X86_INS_VRCP14PS: int
UC_X86_INS_VRCP14SD: int
UC_X86_INS_VRCP14SS: int
UC_X86_INS_VRCP28PD: int
UC_X86_INS_VRCP28PS: int
UC_X86_INS_VRCP28SD: int
UC_X86_INS_VRCP28SS: int
UC_X86_INS_VRCPPS: int
UC_X86_INS_VRCPSS: int
UC_X86_INS_VRNDSCALEPD: int
UC_X86_INS_VRNDSCALEPS: int
UC_X86_INS_VRNDSCALESD: int
UC_X86_INS_VRNDSCALESS: int
UC_X86_INS_VROUNDPD: int
UC_X86_INS_VROUNDPS: int
UC_X86_INS_VROUNDSD: int
UC_X86_INS_VROUNDSS: int
UC_X86_INS_VRSQRT14PD: int
UC_X86_INS_VRSQRT14PS: int
UC_X86_INS_VRSQRT14SD: int
UC_X86_INS_VRSQRT14SS: int
UC_X86_INS_VRSQRT28PD: int
UC_X86_INS_VRSQRT28PS: int
UC_X86_INS_VRSQRT28SD: int
UC_X86_INS_VRSQRT28SS: int
UC_X86_INS_VRSQRTPS: int
UC_X86_INS_VRSQRTSS: int
UC_X86_INS_VSCATTERDPD: int
UC_X86_INS_VSCATTERDPS: int
UC_X86_INS_VSCATTERPF0DPD: int
UC_X86_INS_VSCATTERPF0DPS: int
UC_X86_INS_VSCATTERPF0QPD: int
UC_X86_INS_VSCATTERPF0QPS: int
UC_X86_INS_VSCATTERPF1DPD: int
UC_X86_INS_VSCATTERPF1DPS: int
UC_X86_INS_VSCATTERPF1QPD: int
UC_X86_INS_VSCATTERPF1QPS: int
UC_X86_INS_VSCATTERQPD: int
UC_X86_INS_VSCATTERQPS: int
UC_X86_INS_VSHUFPD: int
UC_X86_INS_VSHUFPS: int
UC_X86_INS_VSQRTPD: int
UC_X86_INS_VSQRTPS: int
UC_X86_INS_VSQRTSD: int
UC_X86_INS_VSQRTSS: int
UC_X86_INS_VSTMXCSR: int
UC_X86_INS_VSUBPD: int
UC_X86_INS_VSUBPS: int
UC_X86_INS_VSUBSD: int
UC_X86_INS_VSUBSS: int
UC_X86_INS_VTESTPD: int
UC_X86_INS_VTESTPS: int
UC_X86_INS_VUNPCKHPD: int
UC_X86_INS_VUNPCKHPS: int
UC_X86_INS_VUNPCKLPD: int
UC_X86_INS_VUNPCKLPS: int
UC_X86_INS_VZEROALL: int
UC_X86_INS_VZEROUPPER: int
UC_X86_INS_WAIT: int
UC_X86_INS_WBINVD: int
UC_X86_INS_WRFSBASE: int
UC_X86_INS_WRGSBASE: int
UC_X86_INS_WRMSR: int
UC_X86_INS_XABORT: int
UC_X86_INS_XACQUIRE: int
UC_X86_INS_XBEGIN: int
UC_X86_INS_XCHG: int
UC_X86_INS_XCRYPTCBC: int
UC_X86_INS_XCRYPTCFB: int
UC_X86_INS_XCRYPTCTR: int
UC_X86_INS_XCRYPTECB: int
UC_X86_INS_XCRYPTOFB: int
UC_X86_INS_XEND: int
UC_X86_INS_XGETBV: int
UC_X86_INS_XLATB: int
UC_X86_INS_XRELEASE: int
UC_X86_INS_XRSTOR: int
UC_X86_INS_XRSTOR64: int
UC_X86_INS_XRSTORS: int
UC_X86_INS_XRSTORS64: int
UC_X86_INS_XSAVE: int
UC_X86_INS_XSAVE64: int
UC_X86_INS_XSAVEC: int
UC_X86_INS_XSAVEC64: int
UC_X86_INS_XSAVEOPT: int
UC_X86_INS_XSAVEOPT64: int
UC_X86_INS_XSAVES: int
UC_X86_INS_XSAVES64: int
UC_X86_INS_XSETBV: int
UC_X86_INS_XSHA1: int
UC_X86_INS_XSHA256: int
UC_X86_INS_XSTORE: int
UC_X86_INS_XTEST: int
UC_X86_INS_FDISI8087_NOP: int
UC_X86_INS_FENI8087_NOP: int
UC_X86_INS_ENDING: int


================================================
FILE: tests/.coveragerc
================================================
[run]
omit =
    */__init__.py
    cli.py

[report]
exclude_lines =
    pragma: no cover
    assert_never

exclude_also =
    if TYPE_CHECKING:
    def _parse_args
    def _km_write
    def _is_smt_enabled
    def _can_set_reserved
    def _is_kernel_module_installed
    def _configure_kernel_module
    def _read_trace
    def _rewind_km_output_to_end
    if not skip_setup:
    # unit_model_dr
    def _check_if_installed
    if type_id not in _TRACE_ID_TO_NAME
    .*# pylint: disable=unreachable
    .*NotImplementedError


================================================
FILE: tests/.gitignore
================================================
*.o
*.patched.asm


================================================
FILE: tests/__init__.py
================================================


================================================
FILE: tests/acceptance.bats
================================================
#!/usr/bin/env bats
# set -o errexit -o pipefail -o nounset

# Set PRESERVE_TMP to a non-zero value to keep the per-test temporary directory.
PRESERVE_TMP=${PRESERVE_TMP:-0}
# Numeric CPU model of the first core. The pattern is anchored on the exact
# "model" key so that "model name" entries can never be picked up by accident.
CPU_MODEL=$(grep -m 1 -E '^model[[:space:]]*:' /proc/cpuinfo | cut -d: -f2 | tr -d ' ')

# ------------------------------------------------------------------------------
# Helper functions
# ------------------------------------------------------------------------------
function setup() {
    # Runs before every test: detects the host CPU and derives the paths and
    # command prefixes used by the tests below.

    # Match the "Vendor ID:" and "Architecture:" fields at the start of a line.
    # A bare `grep Vendor` also matches the "BIOS Vendor ID:" line printed by
    # newer lscpu versions, which would turn VENDOR into a multi-line value and
    # break the comparisons in intel_only/amd_only.
    VENDOR="$(lscpu | grep -E '^[[:space:]]*Vendor ID:' | head -n 1 | awk '{print $3}')"
    ARCH="$(lscpu | grep -E '^[[:space:]]*Architecture:' | head -n 1 | awk '{print $2}')"

    PROJECT_ROOT="$(cd "$(dirname "$BATS_TEST_FILENAME")/../" >/dev/null 2>&1 && pwd)"

    # Per-architecture locations of the assembly templates, configs and ISA spec
    if [ "$ARCH" == "x86_64" ]; then
        ASM_DIR="$PROJECT_ROOT/tests/x86_tests/asm"
        CONF_DIR="$PROJECT_ROOT/tests/x86_tests/configs"
        ISA="$PROJECT_ROOT/base.json"
        if [ ! -f "$ISA" ]; then
            echo "Could not find 'base.json' in $ISA"
            echo "Follow the instructions in README.md to download it, and copy into this directory."
            # Fail the setup explicitly instead of relying on errexit
            return 1
        fi
    elif [ "$ARCH" == "aarch64" ]; then
        ASM_DIR="$PROJECT_ROOT/tests/arm64/asm"
        CONF_DIR="$PROJECT_ROOT/tests/arm64/configs"
        ISA="$PROJECT_ROOT/tests/arm64/min_arm64.json"
    fi

    # Command prefixes: plain CLI, CLI under `python3 -OO`, and the common fuzzing invocation
    cli="$PROJECT_ROOT/revizor.py"
    cli_opt="python3 -OO $PROJECT_ROOT/revizor.py"
    fuzz_opt="$cli fuzz -s $ISA --save-violations f -I $CONF_DIR"

    # tmp directory for tests
    TEST_DIR=$(mktemp -d)
}

function teardown() {
    # Runs after every test: removes the per-test temporary directory unless
    # PRESERVE_TMP is set to a non-zero value.
    # TEST_DIR may be unset if setup failed before creating it, hence the guard;
    # quoting keeps paths with spaces or glob characters intact.
    if [ "$PRESERVE_TMP" -eq 0 ] && [ -n "${TEST_DIR:-}" ]; then
        rm -rf -- "$TEST_DIR"
    fi
}

function assert_violation() {
    # Run the given command line and succeed only if it reports a contract
    # violation, i.e. it exits with status 1 and prints the violation banner.
    local command_line="$*"

    run bash -c "$command_line"

    # Diagnostics; Bats shows them only when the test fails
    echo "Command: $command_line"
    echo "Exit code: $status"
    echo "Output: '$output'"

    [[ "$status" -eq 1 ]] || return 1
    [[ "$output" == *"=== Violations detected ==="* ]]
}

function assert_no_violation() {
    # Run the given command line and succeed only if it exits with status 0
    # and does not print the violation banner.
    local command_line="$*"

    run bash -c "$command_line"

    # Diagnostics; Bats shows them only when the test fails
    printf '%s\n' "Command: $command_line" "Exit code: $status" "Output: '$output'"

    if [[ "$status" -ne 0 ]]; then
        return 1
    fi
    [[ "$output" != *"=== Violations detected ==="* ]]
}

function assert_violation_or_arch_fail() {
    # Run the given command line and succeed if it reports either an
    # architectural mismatch or a contract violation.
    local command_line="$*"

    run bash -c "$command_line"

    # Diagnostics; Bats shows them only when the test fails
    echo "Command: $command_line"
    echo "Exit code: $status"
    echo "Output: '$output'"

    # An architectural mismatch is accepted regardless of the exit status
    case "$output" in
        *" Architectural mismatch "*) return 0 ;;
    esac

    # Otherwise the same criteria as assert_violation apply
    [[ "$status" -eq 1 ]] || return 1
    [[ "$output" == *"=== Violations detected ==="* ]]
}

function intel_only() {
    # Skip the calling test unless the CPU vendor is GenuineIntel.
    [ "$VENDOR" == "GenuineIntel" ] || skip "Intel-specific test"
}

function amd_only() {
    # Skip the calling test unless the CPU vendor is AuthenticAMD.
    [ "$VENDOR" == "AuthenticAMD" ] || skip "AMD-specific test"
}

function x86_only() {
    # Skip the calling test unless the host architecture is x86_64.
    if [ "$ARCH" == "x86_64" ]; then
        return 0
    fi
    skip "x86-specific test"
}

function arm_only() {
    # Skip the calling test unless the host architecture is aarch64.
    if [ "$ARCH" == "aarch64" ]; then
        return 0
    fi
    skip "ARM-specific test"
}

# ------------------------------------------------------------------------------
# Tests
# ------------------------------------------------------------------------------

@test "Architectural Test: Model and Executor are initialized with the same values (registers)" {
    assert_no_violation "$fuzz_opt -t $ASM_DIR/model_match.asm -c $CONF_DIR/arch.yaml -i 20"
}

@test "Architectural Test: Model and Executor are initialized with the same values (memory)" {
    assert_no_violation "$fuzz_opt -t $ASM_DIR/model_match_memory.asm -c $CONF_DIR/arch.yaml -i 20"
}

@test "Architectural Test: Model and Executor are initialized with the same values (flags)" {
    assert_no_violation "$fuzz_opt -t $ASM_DIR/model_flags_match.asm -c $CONF_DIR/arch.yaml -i 20"
}

@test "Architectural Test: Model and Executor are initialized with the same values (SIMD registers)" {
    x86_only
    assert_no_violation "$fuzz_opt -t $ASM_DIR/model_match_xmm.asm -c $CONF_DIR/arch.yaml -i 20"
}

@test "Architectural Test/Unicorn: 100 Random Test Cases" {
    assert_no_violation "$fuzz_opt -c $CONF_DIR/arch.yaml -n 100 -i 10"
}

@test "Architectural Test/DR: 100 Random Test Cases" {
    x86_only
    # Probe the DynamoRIO installation by running a trivial command (`ls /dev/null`)
    # under drrun with libdr_model.so loaded; skip the test when the probe fails.
    if ! ~/.local/dynamorio/drrun -c ~/.local/dynamorio/libdr_model.so -- ls /dev/null; then
        skip "DynamoRIO is not installed"
    fi
    # Random test cases with the arch-dr.yaml config; no violation is expected
    assert_no_violation "$fuzz_opt -c $CONF_DIR/arch-dr.yaml -n 100 -i 10"
}

@test "ArchDiff Test: 10 Random Test Cases" {
    assert_no_violation "$fuzz_opt -c $CONF_DIR/archdiff.yaml -n 10 -i 10"
}

@test "Test Basics: Sequence of direct jumps" {
    assert_no_violation "$fuzz_opt -c $CONF_DIR/ct-seq.yaml -t $ASM_DIR/direct_jumps.asm -i 100"
}

@test "Test Basics: Sequence of calls" {
    assert_no_violation "$fuzz_opt -c $CONF_DIR/ct-seq.yaml -t $ASM_DIR/calls.asm -i 100"
}

@test "Detection [spectre-type]: Spectre V1; load variant" {
    assert_violation "$fuzz_opt -t $ASM_DIR/spectre_v1.asm -c $CONF_DIR/ct-seq.yaml  -i 20"
    assert_no_violation "$fuzz_opt -t $ASM_DIR/spectre_v1.asm -c $CONF_DIR/ct-cond.yaml -i 20"
}

@test "Detection [spectre-type]: Spectre V1; store variant" {
    intel_only
    assert_violation "$fuzz_opt -t $ASM_DIR/spectre_v1.1.asm -c $CONF_DIR/ct-seq.yaml -i 20"
    assert_no_violation "$fuzz_opt -t $ASM_DIR/spectre_v1.1.asm -c $CONF_DIR/ct-cond.yaml -i 20"
}

@test "Detection [spectre-type]: Spectre V1; nested variant" {
    x86_only
    assert_violation "$fuzz_opt -t $ASM_DIR/spectre_v1_n2.asm -c $CONF_DIR/ct-seq.yaml -i 20"
    assert_no_violation "$fuzz_opt -t $ASM_DIR/spectre_v1_n2.asm -c $CONF_DIR/ct-cond.yaml -i 20"
}

@test "Detection [spectre-type]: Spectre V2 (BTI)" {
    x86_only
    assert_violation "$fuzz_opt -t $ASM_DIR/spectre_v2.asm -c $CONF_DIR/ct-seq.yaml -i 10 -n 100"
}

@test "Detection [spectre-type]: Spectre V4 (SSBP)" {
    x86_only
    # The detection config must report a violation, the verification config must not
    assert_violation "$fuzz_opt -t $ASM_DIR/spectre_v4.asm -c $CONF_DIR/ssbp-detect.yaml -i 100"
    assert_no_violation "$fuzz_opt -t $ASM_DIR/spectre_v4.asm -c $CONF_DIR/ssbp-verif.yaml  -i 100"

    # Run with the default config to test the SSBP patch (it is enabled by default):
    # no violation is expected
    assert_no_violation "$fuzz_opt -t $ASM_DIR/spectre_v4.asm -c $CONF_DIR/ct-seq.yaml -i 100"
}

@test "Detection [spectre-type]: Spectre V5 (return misprediction)" {
    x86_only
    assert_violation "$fuzz_opt -t $ASM_DIR/spectre_ret.asm -c $CONF_DIR/ct-seq.yaml -i 10"
}

@test "Detection [meltdown-type]: #DE-zero speculation" {
    x86_only
    assert_violation "$fuzz_opt -t $ASM_DIR/fault-div-zero-speculation.asm -c $CONF_DIR/div-detect.yaml -i 3"
    # assert_no_violation "$fuzz_opt -t $ASM_DIR/fault-div-zero-speculation.asm -c $CONF_DIR/div-verif.yaml -i 3"
}

@test "Detection [meltdown-type]: #DE-overflow speculation" {
    x86_only
    assert_violation "$fuzz_opt -t $ASM_DIR/fault-div-overflow-speculation.asm -c $CONF_DIR/div-detect.yaml -i 3"
    # assert_no_violation "$fuzz_opt -t $ASM_DIR/fault-div-overflow-speculation.asm -c $CONF_DIR/div-verif.yaml -i 3"
}

@test "Detection [meltdown-type]: #PF-present speculation" {
    intel_only
    # CPU_MODEL is the numeric "model" field read from /proc/cpuinfo at file load time
    if [ $CPU_MODEL -ge 140 ]; then
        skip "Meltdown is patched on Intel CPU models >= 140"
    fi
    # The detection config must report a violation, the verification config must not
    assert_violation "$fuzz_opt -t $ASM_DIR/fault_load.asm -c $CONF_DIR/l1tf-p.yaml -i 5"
    assert_no_violation "$fuzz_opt -t $ASM_DIR/fault_load.asm -c $CONF_DIR/l1tf-p-verif.yaml -i 5"
}

@test "Detection [meltdown-type]: #PF-writable speculation" {
    intel_only
    # CPU_MODEL is the numeric "model" field read from /proc/cpuinfo at file load time
    if [ $CPU_MODEL -ge 140 ]; then
        skip "Meltdown is patched on Intel CPU models >= 140"
    fi
    # NOTE(review): this test reuses the l1tf-p configs of the #PF-present test and
    # differs only in the template (fault_rmw.asm) - confirm that this is intended
    assert_violation "$fuzz_opt -t $ASM_DIR/fault_rmw.asm -c $CONF_DIR/l1tf-p.yaml -i 5"
    assert_no_violation "$fuzz_opt -t $ASM_DIR/fault_rmw.asm -c $CONF_DIR/l1tf-p-verif.yaml -i 5"
}

@test "Detection [meltdown-type]: #PF-smap speculation" {
    intel_only
    # The test is meaningful only when the CPU advertises the smap flag;
    # give the skip a reason so that it is visible in the test report
    if ! grep -q "smap" /proc/cpuinfo; then
        skip "SMAP is not listed in /proc/cpuinfo"
    fi
    # Note: an arch. violation is expected here if SMAP is disabled in the kernel
    assert_violation_or_arch_fail "$fuzz_opt -t $ASM_DIR/fault_load.asm -c $CONF_DIR/meltdown.yaml -i 5"
    assert_no_violation "$fuzz_opt -t $ASM_DIR/fault_load.asm -c $CONF_DIR/meltdown-verif.yaml -i 5"
}

@test "Sequential handling: #DB-instruction" {
    x86_only
    assert_no_violation "$fuzz_opt -t $ASM_DIR/fault_INT1.asm -c $CONF_DIR/exceptions.yaml -i 100"
}

@test "Sequential handling: #BP" {
    x86_only
    assert_no_violation "$fuzz_opt -t $ASM_DIR/fault_INT3.asm -c $CONF_DIR/exceptions.yaml -i 100"
}

@test "Sequential handling: #UD" {
    x86_only
    assert_no_violation "$fuzz_opt -t $ASM_DIR/fault_UD.asm -c $CONF_DIR/exceptions.yaml -i 100"
}

@test "Detection [meltdown-type]: Out-of-order Undefined Instruction Exception" {
    arm_only
    assert_violation "$fuzz_opt -t $ASM_DIR/fault_undefined_opcode.asm -c $CONF_DIR/ct-seq.yaml -i 20"
}

@test "Feature: Storing and loading test cases" {
    x86_only
    # Both commands use cli_opt, i.e. they run the CLI under `python3 -OO`.
    # Step 1: generate one test case with two inputs into the per-test tmp directory
    assert_no_violation "$cli_opt generate -s $ISA -c $CONF_DIR/ct-seq.yaml -w $TEST_DIR -n 1 -i 2"
    # Step 2: reproduce the stored program (tc0) with the stored input files
    assert_no_violation "$cli_opt reproduce -s $ISA -c $CONF_DIR/ct-seq.yaml -t $TEST_DIR/tc0/program.asm -i $TEST_DIR/tc0/input*.bin"
}

@test "Architectural Test: Multi-actor test case" {
    assert_no_violation "$fuzz_opt -t $ASM_DIR/actor_switch.asm -c $CONF_DIR/arch-actors.yaml -i 20"
}

@test "Architectural Test: Fault Handling" {
    assert_no_violation "$fuzz_opt -t $ASM_DIR/macro_fault_handler.asm -c $CONF_DIR/arch-faults.yaml -i 20"
}

@test "Feature: Fault Handling" {
    # Runs the fault-handler template with a single input and inspects the raw output
    # instead of using the assert_* helpers.
    local cmd="$fuzz_opt -t $ASM_DIR/macro_fault_handler.asm -c $CONF_DIR/fault-handler.yaml -i 1"
    run bash -c "$cmd"
    echo "Command: $cmd"
    echo "Exit code: $status"
    echo "Output: '$output'"
    # Passes only on a clean exit whose output contains this exact pattern
    # (presumably a dumped hardware trace - TODO confirm against fault-handler.yaml)
    [[ "$status" -eq 0 && "$output" = *"^.......^...^..................................................^"* ]]
}

@test "Feature: VMX/SVM" {
    x86_only
    amd_only  # see https://github.com/microsoft/side-channel-fuzzer/issues/122

    # The test needs hardware virtualization support (vmx or svm CPU flag)
    if ! grep -q -e "vmx" -e "svm" /proc/cpuinfo; then
        skip "neither vmx nor svm is listed in /proc/cpuinfo"
    fi

    # Enable HPA/GPA collisions in the executor via its sysfs knob before fuzzing
    echo "1" >/sys/rvzr_executor/enable_hpa_gpa_collisions
    assert_no_violation "$fuzz_opt -t $ASM_DIR/vm_switch.asm -c $CONF_DIR/vm-switch.yaml -i 20"

    # echo "Testing page table allocation..."
    # run cat /sys/rvzr_executor/dbg_guest_page_tables
    # if [ $status -ne 0 ]; then
    #     echo "Page table allocation test failed: $output"
    # fi
    # Checks the status of the most recent `run`; kept so that the debug block
    # above is asserted on when it is re-enabled
    [[ $status -eq 0 ]]
}


================================================
FILE: tests/arm64/asm/actor_switch.asm
================================================
.section .data.main

.function_start:
    mov x0, #1

    .macro.switch.actor2.function_1:
# end of function_start
# --------------------------------------------------------------------------------------------------

.function_fin:
    .bb0:
    nop
# end of function_fin
# --------------------------------------------------------------------------------------------------

.section .data.actor2
.function_1:
    mov x1, #2

    .macro.switch.main.function_fin:
# end of function_1
# --------------------------------------------------------------------------------------------------

.test_case_exit:


================================================
FILE: tests/arm64/asm/asm_basic.asm
================================================
.section .data.main

.function_0:
.bb_0:

isb  // instrumentation

  // line with a comment

adc w11, w20, w10  // register operands
and x13, x13, #0b1111111000000     // immediate operand
add x13, x13, x20 // instrumentation
ldrh w23, [x13], #-115 // memory operand

b.ne .bb_main.1
  .bb_main.1:
    adc w1, w2, w3  // indentation
    and x20, x20, #0b1111111000000
    add x20, x20, x20
        ldrh w28, [ x20],     #-143    // extra spaces


.test_case_exit:


================================================
FILE: tests/arm64/asm/asm_multiactor.asm
================================================
.section .data.main

.function_0:
nop
nop

.section .data.guest_1
.function_1:
nop

.section .data.main
.function_2:
.bb0:
nop

// .section exit
.test_case_exit:


================================================
FILE: tests/arm64/asm/asm_symbol.asm
================================================
.section .data.main

.macro.measurement_start: nop; nop; nop

nop

.macro.measurement_end: nop; nop; nop

and x0, x0, #1

.function_1:

nop

.section .data.guest_1
.function_2:
nop


.test_case_exit:


================================================
FILE: tests/arm64/asm/calls.asm
================================================
.section .data.main
.function_0:
bl .function_1
.function_1:
bl .function_2
.function_2:
bl .function_3
.function_3:
bl .function_4
.function_4:
bl .function_5
.function_5:
bl .function_6
.function_6:
bl .function_7
.function_7:
bl .function_8
.function_8:
bl .function_9
.function_9:
bl .function_10
.function_10:
.test_case_exit:


================================================
FILE: tests/arm64/asm/direct_jumps.asm
================================================
.section .data.main
b .1
.1:
b .2
.2:
b .3
.3:
b .4
.4:
b .5
.5:
b .6
.6:
b .7
.7:
b .8
.8:
b .9
.9:
b .10
.10:
b .11
.11:
b .12
.12:
b .13
.13:
b .14
.14:
b .15
.15:
b .16
.16:
b .17
.17:
b .18
.18:
b .19
.19:
b .20
.20:
b .21
.21:
b .22
.22:
b .23
.23:
b .24
.24:
b .25
.25:
b .26
.26:
b .27
.27:
b .28
.28:
b .29
.29:
b .30
.30:
b .31
.31:
b .32
.32:
b .33
.33:
b .34
.34:
b .35
.35:
b .36
.36:
b .37
.37:
b .38
.38:
b .39
.39:
b .40
.40:
b .41
.41:
b .42
.42:
b .43
.43:
b .44
.44:
b .45
.45:
b .46
.46:
b .47
.47:
b .48
.48:
b .49
.49:
b .50
.50:
.test_case_exit:


================================================
FILE: tests/arm64/asm/fault-div-zero-speculation.asm
================================================
.section .data.main

mov x2, #1
mov x1, #0
udiv x3, x2, x1

and x3, x3, #0b1111111111111
add x3, x3, #0x100
ldr x0, [x20, x3]

.test_case_exit:


================================================
FILE: tests/arm64/asm/fault_undefined_opcode.asm
================================================
.section .data.main

// instrumentation to prevent page faults
and x0, x0, #0b1111111111111

// undefined instruction to trigger Undefined Instruction exception
udf #0

// this instruction should not be executed architecturally but may be executed transiently
ldr x1, [x20, x0]

.test_case_exit:


================================================
FILE: tests/arm64/asm/macro_fault_handler.asm
================================================
.section .data.main
.function_main_0:

ldr x0, [x20, #0x300]
mov x0, #0
brk #0x20
mov x1, #1

.macro.fault_handler:
ldr x2, [x20, #0x200]
ldr x2, [x20, #0xff8]
mov x2, #2


.test_case_exit:


================================================
FILE: tests/arm64/asm/model_flags_match.asm
================================================
.section .data.main

// base values
mov x4, #1
mov x5, #0

// flag check
csel x0, x4, x5, mi  // n == 1
csel x1, x4, x5, eq  // z == 1
csel x2, x4, x5, cs  // c == 1
csel x3, x4, x5, vs  // v == 1

.test_case_exit:


================================================
FILE: tests/arm64/asm/model_match.asm
================================================
.section .data.main

// empty - leaving initial reg values unchanged

.test_case_exit:


================================================
FILE: tests/arm64/asm/model_match_memory.asm
================================================
.section .data.main

ldr x0, [x2]  // main page
ldr x1, [x20, 4096]  // faulty page
add x0, x0, x1

ldr x1, [x20, -8]  // underflow pad
ldr x2, [x20, 4096 + 4096 + 320]  // overflow pad
add x1, x1, x2

ldr x2, [x20, 4096 + 4096]  // reg init
ldr x3, [x20, 4096 + 4096 + 48]  // patched flags
ldr x4, [x20, 4096 + 4096 + 64]  // simd init
mov x5, x20

.test_case_exit:


================================================
FILE: tests/arm64/asm/model_match_xmm.asm
================================================
.section .data.main
mov x0, v0.d[0]
mov x1, v1.d[0]
mov x2, v2.d[0]
mov x3, v3.d[0]
mov x4, v4.d[0]
mov x5, v5.d[0]
.test_case_exit:


================================================
FILE: tests/arm64/asm/spectre_v1.asm
================================================
.section .data.main
.function_main:

# reduce the entropy of x0
and x0, x0, #0b111111000000

# delay the cond. jump
add x1, x1, x0
add x1, x1, #1
add x1, x1, x0
add x1, x1, #1
add x1, x1, x0
add x1, x1, #1
add x1, x1, x0
add x1, x1, #1
add x1, x1, x0
add x1, x1, #1
add x1, x1, x0
add x1, x1, #1
add x1, x1, x0
add x1, x1, #1
add x1, x1, x0
add x1, x1, #1

# reduce the entropy in x1
and x1, x1, #0b1000000

# misprediction
cmp x1, #0
b.eq .l1

.l0:
# x1 != 0
    add x2, x20, x0
    ldr x0, [x2], #0
    b .l2
.l1:
# x1 == 0
.l2:

.test_case_exit:


================================================
FILE: tests/arm64/configs/arch-actors.yaml
================================================
file: !include arch.yaml

actors:
  - actor2:
      - mode: "host"


================================================
FILE: tests/arm64/configs/arch-faults.yaml
================================================
file: !include common.yaml
file: !include base-and-simd-categories.yaml

fuzzer: architectural
enable_priming: false
inputs_per_class: 1
logging_modes:
  - info
  - dbg_violation
  # - dbg_dump_htraces
  # - dbg_dump_ctraces

program_size: 300
avg_mem_accesses: 150
max_bb_per_function: 3
min_bb_per_function: 3

faults_allowlist:
  - opcode-undefined


================================================
FILE: tests/arm64/configs/arch.yaml
================================================
file: !include common.yaml
file: !include base-and-simd-categories.yaml

fuzzer: architectural
enable_priming: false
inputs_per_class: 1
logging_modes:
  - info
  - dbg_violation
  # - dbg_dump_htraces
  # - dbg_dump_ctraces

program_size: 300
avg_mem_accesses: 150
max_bb_per_function: 3
min_bb_per_function: 3


================================================
FILE: tests/arm64/configs/archdiff.yaml
================================================
file: !include common.yaml
file: !include base-and-simd-categories.yaml

fuzzer: archdiff
enable_priming: false
inputs_per_class: 1
logging_modes:
 - info
#  - dbg_violation

program_size: 100
avg_mem_accesses: 50
max_bb_per_function: 3
min_bb_per_function: 3


================================================
FILE: tests/arm64/configs/base-and-simd-categories.yaml
================================================
instruction_categories:
  - general-arithmetic
  - general-barrier
  - general-bitwise
  - general-uncond_branch
  - general-cond_branch
  - general-comparison
  - general-condsel
  - general-dataxfer
  - general-misc


================================================
FILE: tests/arm64/configs/common.yaml
================================================
data_generator_seed: 1234567
program_generator_seed: 1234567

# Acceptance tests do not require a large sample size
executor_sample_sizes:
  - 10

# No logging
logging_modes:
  -
  # - dbg_model
  # - dbg_dump_htraces
  # - dbg_dump_ctraces


================================================
FILE: tests/arm64/configs/ct-cond.yaml
================================================
file: !include common.yaml

contract_observation_clause: ct
contract_execution_clause:
  - cond


================================================
FILE: tests/arm64/configs/ct-seq.yaml
================================================
file: !include common.yaml

contract_observation_clause: ct
contract_execution_clause:
  - seq

================================================
FILE: tests/arm64/configs/exceptions.yaml
================================================
file: !include common.yaml
file: !include ct-seq.yaml

faults_allowlist:
  - debug-register
  - breakpoint
  - opcode-undefined


================================================
FILE: tests/arm64/configs/fault-handler.yaml
================================================
file: !include common.yaml
file: !include ct-seq.yaml

actors:
  - main:
    - data_properties:
      - present: false


executor_mode: F+R
logging_modes:
  - dbg_dump_htraces


================================================
FILE: tests/arm64/min_arm64.json
================================================
[
  {"name": "csel", "category": "general-condsel", "is_control_flow": false,
    "operands": [
      {"dest": true, "src": false, "comment": "64-bit general-purpose destination register (field \"rd\")", "type_": "REG", "width": 64, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31"]},
      {"dest": false, "src": true, "comment": "64-bit general-purpose source register (field \"rn\")", "type_": "REG", "width": 64, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31"]},
      {"dest": false, "src": true, "comment": "64-bit general-purpose source register (field \"rm\")", "type_": "REG", "width": 64, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31"]},
      {"dest": false, "src": false, "comment": "standard condition (field \"cond\")", "type_": "COND", "values": [], "width": 0}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "general-dataxfer", "is_control_flow": false,
    "operands": [
      {"dest": true, "src": false, "comment": "64-bit general-purpose destination register (field \"rd\")", "type_": "REG", "width": 64, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31"]},
      {"dest": false, "src": true, "comment": "64-bit general-purpose source register (field \"rn\")", "type_": "REG", "width": 64, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31"]}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "general-dataxfer", "is_control_flow": false,
    "operands": [
      {"dest": true, "src": false, "comment": "64-bit general-purpose register to be transferred (field \"rt\")", "type_": "REG", "width": 64, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31"]},
      {"dest": false, "src": true, "comment": "signed immediate byte offset [-256-255] (field \"imm9\")", "type_": "IMM", "values": ["[-256-255]"], "width": 0}
    ],
    "implicit_operands": []
  },
  {"name": "ldr", "category": "general-dataxfer", "is_control_flow": false,
    "operands": [
      {"dest": true, "src": false, "comment": "64-bit general-purpose register to be transferred (field \"rt\")", "type_": "REG", "width": 64, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31"]},
      {"dest": true, "src": true, "comment": "64-bit general-purpose base register or sp (field \"rn\")", "type_": "MEM", "width": 64},
      {"dest": false, "src": true, "comment": "signed immediate byte offset [-256-255] (field \"imm9\")", "type_": "IMM", "values": ["[-256-255]"], "width": 0}
    ],
    "implicit_operands": []
  },
  {"name": "ldr", "category": "general-dataxfer", "is_control_flow": false,
    "operands": [
      {"dest": true, "src": false, "comment": "64-bit general-purpose register to be transferred (field \"rt\")", "type_": "REG", "width": 64, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31"]},
      {"dest": false, "src": true, "comment": "64-bit general-purpose base register or sp (field \"rn\")", "type_": "MEM", "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "str", "category": "general-dataxfer", "is_control_flow": false,
    "operands": [
      {"dest": false, "src": true, "comment": "32-bit general-purpose register to be transferred (field \"rt\")", "type_": "REG", "width": 32, "values": ["w0", "w1", "w2", "w3", "w4", "w5", "w6", "w7", "w8", "w9", "w10", "w11", "w12", "w13", "w14", "w15", "w16", "w17", "w18", "w19", "w20", "w21", "w22", "w23", "w24", "w25", "w26", "w27", "w28", "w29", "w30", "w31", "w8", "w9", "w10", "w11", "w12", "w13", "w14", "w15", "w16", "w17", "w18", "w19", "w20", "w21", "w22", "w23", "w24", "w25", "w26", "w27", "w28", "w29", "w30", "w31"]},
      {"dest": true, "src": false, "comment": "64-bit general-purpose base register or sp (field \"rn\")", "type_": "MEM", "width": 64},
      {"dest": false, "src": true, "comment": "signed immediate byte offset [-256-255] (field \"imm9\")", "type_": "IMM", "values": ["[-256-255]"], "width": 0}
    ],
    "implicit_operands": []
  },
  {"name": "str", "category": "general-dataxfer", "is_control_flow": false,
    "operands": [
      {"dest": false, "src": true, "comment": "64-bit general-purpose register to be transferred (field \"rt\")", "type_": "REG", "width": 64, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31"]},
      {"dest": true, "src": false, "comment": "64-bit general-purpose base register or sp (field \"rn\")", "type_": "MEM", "width": 64},
      {"dest": false, "src": true, "comment": "signed immediate byte offset [-256-255] (field \"imm9\")", "type_": "IMM", "values": ["[-256-255]"], "width": 0}
    ],
    "implicit_operands": []
  },
  {"name": "str", "category": "general-dataxfer", "is_control_flow": false,
    "operands": [
      {"dest": false, "src": true, "comment": "32-bit general-purpose register to be transferred (field \"rt\")", "type_": "REG", "width": 32, "values": ["w0", "w1", "w2", "w3", "w4", "w5", "w6", "w7", "w8", "w9", "w10", "w11", "w12", "w13", "w14", "w15", "w16", "w17", "w18", "w19", "w20", "w21", "w22", "w23", "w24", "w25", "w26", "w27", "w28", "w29", "w30", "w31", "w8", "w9", "w10", "w11", "w12", "w13", "w14", "w15", "w16", "w17", "w18", "w19", "w20", "w21", "w22", "w23", "w24", "w25", "w26", "w27", "w28", "w29", "w30", "w31"]},
      {"dest": true, "src": false, "comment": "64-bit general-purpose base register or sp (field \"rn\")", "type_": "MEM", "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "str", "category": "general-dataxfer", "is_control_flow": false,
    "operands": [
      {"dest": false, "src": true, "comment": "64-bit general-purpose register to be transferred (field \"rt\")", "type_": "REG", "width": 64, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31"]},
      {"dest": true, "src": false, "comment": "64-bit general-purpose base register or sp (field \"rn\")", "type_": "MEM", "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "sub", "category": "general-arithmetic", "is_control_flow": false,
    "operands": [
      {"dest": true, "src": false, "comment": "64-bit destination general-purpose register or sp (field \"rd\")", "type_": "REG", "width": 64, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31", "sp"]},
      {"dest": false, "src": true, "comment": "64-bit source general-purpose register or sp (field \"rn\")", "type_": "REG", "width": 64, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31", "sp"]},
      {"dest": false, "src": true, "comment": "unsigned immediate [0-4095] (field \"imm12\")", "type_": "IMM", "values": ["[0-4095]"], "width": 0}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "width": 0, "src": false, "dest": false, "values": ["w", "", "", "w", "w", "", "", "", "w"]}
    ]
  },
  {"name": "add", "category": "general-arithmetic", "is_control_flow": false,
    "operands": [
      {"dest": true, "src": false, "comment": "32-bit destination general-purpose register or wsp (field \"rd\")", "type_": "REG", "width": 32, "values": ["w0", "w1", "w2", "w3", "w4", "w5", "w6", "w7", "w8", "w9", "w10", "w11", "w12", "w13", "w14", "w15", "w16", "w17", "w18", "w19", "w20", "w21", "w22", "w23", "w24", "w25", "w26", "w27", "w28", "w29", "w30", "w31", "sp"]},
      {"dest": false, "src": true, "comment": "32-bit source general-purpose register or wsp (field \"rn\")", "type_": "REG", "width": 32, "values": ["w0", "w1", "w2", "w3", "w4", "w5", "w6", "w7", "w8", "w9", "w10", "w11", "w12", "w13", "w14", "w15", "w16", "w17", "w18", "w19", "w20", "w21", "w22", "w23", "w24", "w25", "w26", "w27", "w28", "w29", "w30", "w31", "sp"]},
      {"dest": false, "src": true, "comment": "unsigned immediate [0-4095] (field \"imm12\")", "type_": "IMM", "values": ["[0-4095]"], "width": 0}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "width": 0, "src": false, "dest": false, "values": ["w", "", "", "w", "w", "", "", "", "w"]}
    ]
  },
  {"name": "add", "category": "general-arithmetic", "is_control_flow": false,
    "operands": [
      {"dest": true, "src": false, "comment": "64-bit destination general-purpose register or sp (field \"rd\")", "type_": "REG", "width": 64, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31", "sp"]},
      {"dest": false, "src": true, "comment": "64-bit source general-purpose register or sp (field \"rn\")", "type_": "REG", "width": 64, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31", "sp"]},
      {"dest": false, "src": true, "comment": "unsigned immediate [0-4095] (field \"imm12\")", "type_": "IMM", "values": ["[0-4095]"], "width": 0}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "width": 0, "src": false, "dest": false, "values": ["w", "", "", "w", "w", "", "", "", "w"]}
    ]
  },
  {"name": "add", "category": "general-arithmetic", "is_control_flow": false,
    "operands": [
      {"dest": true, "src": false, "comment": "32-bit general-purpose destination register (field \"rd\")", "type_": "REG", "width": 32, "values": ["w0", "w1", "w2", "w3", "w4", "w5", "w6", "w7", "w8", "w9", "w10", "w11", "w12", "w13", "w14", "w15", "w16", "w17", "w18", "w19", "w20", "w21", "w22", "w23", "w24", "w25", "w26", "w27", "w28", "w29", "w30", "w31"]},
      {"dest": false, "src": true, "comment": "32-bit general-purpose source register (field \"rn\")", "type_": "REG", "width": 32, "values": ["w0", "w1", "w2", "w3", "w4", "w5", "w6", "w7", "w8", "w9", "w10", "w11", "w12", "w13", "w14", "w15", "w16", "w17", "w18", "w19", "w20", "w21", "w22", "w23", "w24", "w25", "w26", "w27", "w28", "w29", "w30", "w31"]},
      {"dest": false, "src": true, "comment": "32-bit general-purpose source register (field \"rm\")", "type_": "REG", "width": 32, "values": ["w0", "w1", "w2", "w3", "w4", "w5", "w6", "w7", "w8", "w9", "w10", "w11", "w12", "w13", "w14", "w15", "w16", "w17", "w18", "w19", "w20", "w21", "w22", "w23", "w24", "w25", "w26", "w27", "w28", "w29", "w30", "w31"]}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "width": 0, "src": false, "dest": false, "values": ["w", "", "", "w", "w", "", "", "", "w"]}
    ]
  },
  {"name": "add", "category": "general-arithmetic", "is_control_flow": false,
    "operands": [
      {"dest": true, "src": false, "comment": "64-bit general-purpose destination register (field \"rd\")", "type_": "REG", "width": 64, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31"]},
      {"dest": false, "src": true, "comment": "64-bit general-purpose source register (field \"rn\")", "type_": "REG", "width": 64, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31"]},
      {"dest": false, "src": true, "comment": "64-bit general-purpose source register (field \"rm\")", "type_": "REG", "width": 64, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31"]}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "width": 0, "src": false, "dest": false, "values": ["w", "", "", "w", "w", "", "", "", "w"]}
    ]
  },
  {"name": "adc", "category": "general-arithmetic", "is_control_flow": false,
    "operands": [
      {"dest": true, "src": false, "comment": "32-bit general-purpose destination register (field \"rd\")", "type_": "REG", "width": 32, "values": ["w0", "w1", "w2", "w3", "w4", "w5", "w6", "w7", "w8", "w9", "w10", "w11", "w12", "w13", "w14", "w15", "w16", "w17", "w18", "w19", "w20", "w21", "w22", "w23", "w24", "w25", "w26", "w27", "w28", "w29", "w30", "w31"]},
      {"dest": false, "src": true, "comment": "32-bit general-purpose source register (field \"rn\")", "type_": "REG", "width": 32, "values": ["w0", "w1", "w2", "w3", "w4", "w5", "w6", "w7", "w8", "w9", "w10", "w11", "w12", "w13", "w14", "w15", "w16", "w17", "w18", "w19", "w20", "w21", "w22", "w23", "w24", "w25", "w26", "w27", "w28", "w29", "w30", "w31"]},
      {"dest": false, "src": true, "comment": "32-bit general-purpose source register (field \"rm\")", "type_": "REG", "width": 32, "values": ["w0", "w1", "w2", "w3", "w4", "w5", "w6", "w7", "w8", "w9", "w10", "w11", "w12", "w13", "w14", "w15", "w16", "w17", "w18", "w19", "w20", "w21", "w22", "w23", "w24", "w25", "w26", "w27", "w28", "w29", "w30", "w31"]}
    ],
    "implicit_operands": []
  },
  {"name": "adc", "category": "general-arithmetic", "is_control_flow": false,
    "operands": [
      {"dest": true, "src": false, "comment": "64-bit general-purpose destination register (field \"rd\")", "type_": "REG", "width": 64, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31"]},
      {"dest": false, "src": true, "comment": "64-bit general-purpose source register (field \"rn\")", "type_": "REG", "width": 64, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31"]},
      {"dest": false, "src": true, "comment": "64-bit general-purpose source register (field \"rm\")", "type_": "REG", "width": 64, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31"]}
    ],
    "implicit_operands": []
  },
  {"name": "sdiv", "category": "general-arithmetic", "is_control_flow": false,
    "operands": [
      {"dest": true, "src": false, "comment": "rd", "type_": "REG", "width": 32, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31"]},
      {"dest": false, "src": true, "comment": "rn", "type_": "REG", "width": 32, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31"]},
      {"dest": false, "src": true, "comment": "rm", "type_": "REG", "width": 32, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31"]}
    ],
    "implicit_operands": []
  },
  {"name": "sdiv", "category": "general-arithmetic", "is_control_flow": false,
    "operands": [
      {"dest": true, "src": false, "comment": "rd", "type_": "REG", "width": 64, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31"]},
      {"dest": false, "src": true, "comment": "rn", "type_": "REG", "width": 64, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31"]},
      {"dest": false, "src": true, "comment": "rm", "type_": "REG", "width": 64, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31"]}
    ],
    "implicit_operands": []
  },
  {"name": "udiv", "category": "general-arithmetic", "is_control_flow": false,
    "operands": [
      {"dest": true, "src": false, "comment": "rd", "type_": "REG", "width": 32, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31"]},
      {"dest": false, "src": true, "comment": "rn", "type_": "REG", "width": 32, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31"]},
      {"dest": false, "src": true, "comment": "rm", "type_": "REG", "width": 32, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31"]}
    ],
    "implicit_operands": []
  },
  {"name": "udiv", "category": "general-arithmetic", "is_control_flow": false,
    "operands": [
      {"dest": true, "src": false, "comment": "rd", "type_": "REG", "width": 64, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31"]},
      {"dest": false, "src": true, "comment": "rn", "type_": "REG", "width": 64, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31"]},
      {"dest": false, "src": true, "comment": "rm", "type_": "REG", "width": 64, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31"]}
    ],
    "implicit_operands": []
  },
  {"name": "and", "category": "general-bitwise", "is_control_flow": false,
    "operands": [
      {"dest": true, "src": false, "comment": "32-bit general-purpose destination register (field \"rd\")", "type_": "REG", "width": 32, "values": ["w0", "w1", "w2", "w3", "w4", "w5", "w6", "w7", "w8", "w9", "w10", "w11", "w12", "w13", "w14", "w15", "w16", "w17", "w18", "w19", "w20", "w21", "w22", "w23", "w24", "w25", "w26", "w27", "w28", "w29", "w30", "w31"]},
      {"dest": false, "src": true, "comment": "32-bit general-purpose source register (field \"rn\")", "type_": "REG", "width": 32, "values": ["w0", "w1", "w2", "w3", "w4", "w5", "w6", "w7", "w8", "w9", "w10", "w11", "w12", "w13", "w14", "w15", "w16", "w17", "w18", "w19", "w20", "w21", "w22", "w23", "w24", "w25", "w26", "w27", "w28", "w29", "w30", "w31"]},
      {"dest": false, "src": true, "comment": "32-bit general-purpose source register (field \"rm\")", "type_": "REG", "width": 32, "values": ["w0", "w1", "w2", "w3", "w4", "w5", "w6", "w7", "w8", "w9", "w10", "w11", "w12", "w13", "w14", "w15", "w16", "w17", "w18", "w19", "w20", "w21", "w22", "w23", "w24", "w25", "w26", "w27", "w28", "w29", "w30", "w31"]}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "width": 0, "src": false, "dest": false, "values": ["w", "", "", "w", "w", "", "", "", "w"]}
    ]
  },
  {"name": "and", "category": "general-bitwise", "is_control_flow": false,
    "operands": [
      {"dest": true, "src": false, "comment": "64-bit general-purpose destination register (field \"rd\")", "type_": "REG", "width": 64, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31"]},
      {"dest": false, "src": true, "comment": "64-bit general-purpose source register (field \"rn\")", "type_": "REG", "width": 64, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31"]},
      {"dest": false, "src": true, "comment": "64-bit general-purpose source register (field \"rm\")", "type_": "REG", "width": 64, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31"]}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "width": 0, "src": false, "dest": false, "values": ["w", "", "", "w", "w", "", "", "", "w"]}
    ]
  },
  {"name": "and", "category": "general-bitwise", "is_control_flow": false,
    "operands": [
      {"dest": true, "src": false, "comment": "32-bit destination general-purpose register or wsp (field \"rd\")", "type_": "REG", "width": 32, "values": ["w0", "w1", "w2", "w3", "w4", "w5", "w6", "w7", "w8", "w9", "w10", "w11", "w12", "w13", "w14", "w15", "w16", "w17", "w18", "w19", "w20", "w21", "w22", "w23", "w24", "w25", "w26", "w27", "w28", "w29", "w30", "w31", "sp"]},
      {"dest": false, "src": true, "comment": "32-bit general-purpose source register (field \"rn\")", "type_": "REG", "width": 32, "values": ["w0", "w1", "w2", "w3", "w4", "w5", "w6", "w7", "w8", "w9", "w10", "w11", "w12", "w13", "w14", "w15", "w16", "w17", "w18", "w19", "w20", "w21", "w22", "w23", "w24", "w25", "w26", "w27", "w28", "w29", "w30", "w31"]},
      {"dest": false, "src": true, "comment": "bitmask immediate (field \"imms:immr\")", "type_": "IMM", "values": ["bitmask"], "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "width": 0, "src": false, "dest": false, "values": ["w", "", "", "w", "w", "", "", "", "w"]}
    ]
  },
  {"name": "and", "category": "general-bitwise", "is_control_flow": false,
    "operands": [
      {"dest": true, "src": false, "comment": "64-bit destination general-purpose register or sp (field \"rd\")", "type_": "REG", "width": 64, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31", "sp"]},
      {"dest": false, "src": true, "comment": "64-bit general-purpose source register (field \"rn\")", "type_": "REG", "width": 64, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31"]},
      {"dest": false, "src": true, "comment": "bitmask immediate (field \"n:imms:immr\")", "type_": "IMM", "values": ["bitmask"], "width": 64}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "width": 0, "src": false, "dest": false, "values": ["w", "", "", "w", "w", "", "", "", "w"]}
    ]
  },
  {"name": "eor", "category": "general-bitwise", "is_control_flow": false,
    "operands": [
      {"dest": true, "src": false, "comment": "32-bit destination general-purpose register or wsp (field \"rd\")", "type_": "REG", "width": 32, "values": ["w0", "w1", "w2", "w3", "w4", "w5", "w6", "w7", "w8", "w9", "w10", "w11", "w12", "w13", "w14", "w15", "w16", "w17", "w18", "w19", "w20", "w21", "w22", "w23", "w24", "w25", "w26", "w27", "w28", "w29", "w30", "w31", "sp"]},
      {"dest": false, "src": true, "comment": "32-bit general-purpose source register (field \"rn\")", "type_": "REG", "width": 32, "values": ["w0", "w1", "w2", "w3", "w4", "w5", "w6", "w7", "w8", "w9", "w10", "w11", "w12", "w13", "w14", "w15", "w16", "w17", "w18", "w19", "w20", "w21", "w22", "w23", "w24", "w25", "w26", "w27", "w28", "w29", "w30", "w31"]},
      {"dest": false, "src": true, "comment": "bitmask immediate (field \"imms:immr\")", "type_": "IMM", "values": ["bitmask"], "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "width": 0, "src": false, "dest": false, "values": ["w", "", "", "w", "w", "", "", "", "w"]}
    ]
  },
  {"name": "eor", "category": "general-bitwise", "is_control_flow": false,
    "operands": [
      {"dest": true, "src": false, "comment": "64-bit destination general-purpose register or sp (field \"rd\")", "type_": "REG", "width": 64, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31", "sp"]},
      {"dest": false, "src": true, "comment": "64-bit general-purpose source register (field \"rn\")", "type_": "REG", "width": 64, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31"]},
      {"dest": false, "src": true, "comment": "bitmask immediate (field \"n:imms:immr\")", "type_": "IMM", "values": ["bitmask"], "width": 64}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "width": 0, "src": false, "dest": false, "values": ["w", "", "", "w", "w", "", "", "", "w"]}
    ]
  },
  {"name": "eor", "category": "general-bitwise", "is_control_flow": false,
    "operands": [
      {"dest": true, "src": false, "comment": "32-bit general-purpose destination register (field \"rd\")", "type_": "REG", "width": 32, "values": ["w0", "w1", "w2", "w3", "w4", "w5", "w6", "w7", "w8", "w9", "w10", "w11", "w12", "w13", "w14", "w15", "w16", "w17", "w18", "w19", "w20", "w21", "w22", "w23", "w24", "w25", "w26", "w27", "w28", "w29", "w30", "w31"]},
      {"dest": false, "src": true, "comment": "32-bit general-purpose source register (field \"rn\")", "type_": "REG", "width": 32, "values": ["w0", "w1", "w2", "w3", "w4", "w5", "w6", "w7", "w8", "w9", "w10", "w11", "w12", "w13", "w14", "w15", "w16", "w17", "w18", "w19", "w20", "w21", "w22", "w23", "w24", "w25", "w26", "w27", "w28", "w29", "w30", "w31"]},
      {"dest": false, "src": true, "comment": "32-bit general-purpose source register (field \"rm\")", "type_": "REG", "width": 32, "values": ["w0", "w1", "w2", "w3", "w4", "w5", "w6", "w7", "w8", "w9", "w10", "w11", "w12", "w13", "w14", "w15", "w16", "w17", "w18", "w19", "w20", "w21", "w22", "w23", "w24", "w25", "w26", "w27", "w28", "w29", "w30", "w31"]}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "width": 0, "src": false, "dest": false, "values": ["w", "", "", "w", "w", "", "", "", "w"]}
    ]
  },
  {"name": "eor", "category": "general-bitwise", "is_control_flow": false,
    "operands": [
      {"dest": true, "src": false, "comment": "64-bit general-purpose destination register (field \"rd\")", "type_": "REG", "width": 64, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31"]},
      {"dest": false, "src": true, "comment": "64-bit general-purpose source register (field \"rn\")", "type_": "REG", "width": 64, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31"]},
      {"dest": false, "src": true, "comment": "64-bit general-purpose source register (field \"rm\")", "type_": "REG", "width": 64, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31"]}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "width": 0, "src": false, "dest": false, "values": ["w", "", "", "w", "w", "", "", "", "w"]}
    ]
  },
  {"name": "cmp", "category": "general-comparison", "is_control_flow": false,
    "operands": [
      {"dest": false, "src": true, "comment": "64-bit general-purpose destination register (field \"rd\")", "type_": "REG", "width": 64, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31"]},
      {"dest": false, "src": true, "comment": "64-bit general-purpose source register (field \"rn\")", "type_": "REG", "width": 64, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31"]}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "width": 0, "src": false, "dest": true, "values": ["w", "", "", "w", "w", "", "", "", "w"]}
    ]
  },
  {"name": "cmp", "category": "general-comparison", "is_control_flow": false,
    "operands": [
      {"dest": false, "src": true, "comment": "64-bit general-purpose destination register (field \"rd\")", "type_": "REG", "width": 64, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31"]},
      {"dest": false, "src": true, "type_": "IMM", "values": ["[0-4095]"], "width": 0}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "width": 0, "src": false, "dest": true, "values": ["w", "", "", "w", "w", "", "", "", "w"]}
    ]
  },
  {"name": "dsb", "category": "general-barrier", "is_control_flow": false,
    "operands": [
      {"dest": false, "src": false, "comment": "", "type_": "IMM", "values": ["sy"], "width": 1}
    ],
    "implicit_operands": []
  },
  {"name": "isb", "category": "general-barrier", "is_control_flow": false,
    "operands": [],
    "implicit_operands": []
  },
  {"name": "nop", "category": "general-misc", "is_control_flow": false,
    "operands": [],
    "implicit_operands": []
  },
  {"name": "ldrh", "category": "general-dataxfer", "is_control_flow": false,
    "operands": [
      {"dest": true, "src": false, "comment": "32-bit general-purpose register to be transferred (field \"rt\")", "type_": "REG", "width": 32, "values": ["w0", "w1", "w2", "w3", "w4", "w5", "w6", "w7", "w8", "w9", "w10", "w11", "w12", "w13", "w14", "w15", "w16", "w17", "w18", "w19", "w20", "w21", "w22", "w23", "w24", "w25", "w26", "w27", "w28", "w29", "w30", "w31"]},
      {"dest": true, "src": true, "comment": "64-bit general-purpose base register or sp (field \"rn\")", "type_": "MEM", "width": 64},
      {"dest": false, "src": true, "comment": "signed immediate byte offset [-256-255] (field \"imm9\")", "type_": "IMM", "values": ["[-256-255]"], "width": 0}
    ],
    "implicit_operands": []
  },
  {"name": "b", "category": "general-uncond_branch", "is_control_flow": true,
    "operands": [
      {"dest": false, "src": true, "comment": "label to be branched to (field imm19)", "type_": "LABEL", "values": [], "width": 0}
    ],
    "implicit_operands": [
      {"values": ["pc"], "type_": "REG", "width": 64, "src": true, "dest": false}
    ]
  },
  {"name": "b.", "category": "general-cond_branch", "is_control_flow": true,
    "operands": [
      {"dest": false, "src": false, "comment": "standard condition (field \"cond\")", "type_": "COND", "values": [], "width": 0},
      {"dest": false, "src": true, "comment": "label to be conditionally branched to (field imm19)", "type_": "LABEL", "values": [], "width": 0}
    ],
    "implicit_operands": [
      {"values": ["pc"], "type_": "REG", "width": 64, "src": true, "dest": false}
    ]
  },
  {"name": "br", "category": "general-indirect_branch", "is_control_flow": true,
    "operands": [
      {"dest": false, "src": true, "comment": "rn", "type_": "REG", "width": 64, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31"]}
    ],
    "implicit_operands": []
  },
  {"name": "bl", "category": "general-call", "is_control_flow": true,
    "operands": [
      {"dest": false, "src": true, "comment": "addr_pcrel26", "type_": "LABEL", "width": 0, "values": []}
    ],
    "implicit_operands": [
      {"dest": false, "src": true, "type_": "REG", "width": 64, "values": ["pc"]},
      {"dest": true, "src": false, "type_": "REG", "width": 64, "values": ["x30"]}
    ]
  },
  {"name": "blr", "category": "general-call", "is_control_flow": true,
    "operands": [
      {"dest": false, "src": true, "comment": "rn", "type_": "REG", "width": 64, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31"]}
    ],
    "implicit_operands": []
  },
  {"name": "mrs", "category": "system-dataxfer", "is_control_flow": false,
    "operands": [
      {"dest": true, "src": false, "comment": "64-bit general-purpose destination register (field \"rd\")", "type_": "REG", "width": 64, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31"]},
      {"dest": false, "src": true, "comment": "64-bit general-purpose source register (field \"rn\")", "type_": "REG", "width": 64, "values": ["nzcv"]}
    ],
    "implicit_operands": []
  },
  {"name": "mrs", "category": "system-dataxfer", "is_control_flow": false,
    "operands": [
      {"dest": true, "src": false, "comment": "64-bit general-purpose destination register (field \"rd\")", "type_": "REG", "width": 64, "values": ["x0", "x1", "x2", "x3", "x4", "x5", "x6", "x7", "x8", "x9", "x10", "x11", "x12", "x13", "x14", "x15", "x16", "x17", "x18", "x19", "x20", "x21", "x22", "x23", "x24", "x25", "x26", "x27", "x28", "x29", "x30", "x31"]},
      {"dest": false, "src": true, "type_": "REG", "width": 64, "values": ["pmevcntr0_el0", "pmevcntr1_el0", "pmevcntr2_el0", "pmevcntr3_el0"]}
    ],
    "implicit_operands": []
  },
  {"name": "brk", "category": "system-exception", "is_control_flow": false,
    "operands": [
      {"dest": false, "src": true, "type_": "IMM", "values": ["[0-65535]"], "width": 0}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "width": 0, "src": false, "dest": false, "values": ["w", "", "", "w", "w", "", "", "", "w"]}
    ]
  },
  {"name": "udf", "category": "system-exception", "is_control_flow": false,
    "operands": [
      {"dest": false, "src": true, "type_": "IMM", "values": ["[0-65535]"], "width": 0}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "width": 0, "src": false, "dest": false, "values": ["", "", "", "", "", "", "", "", ""]}
    ]
  }
]


================================================
FILE: tests/arm64/model_common.py
================================================
"""
File: Collection of helper classes for arm64 model tests.

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from __future__ import annotations
from typing import List, Generator

import os
import tempfile
from pathlib import Path

from rvzr.tc_components.test_case_code import TestCaseProgram
from rvzr.tc_components.test_case_data import InputData
from rvzr.isa_spec import InstructionSet
from rvzr.elf_parser import ELFParser
from rvzr.arch.arm64.target_desc import ARM64TargetDesc
from rvzr.arch.arm64.asm_parser import ARM64AsmParser
from rvzr.arch.arm64.generator import ARM64Generator
from rvzr.config import CONF

# location of this file; InstList.to_test_case loads min_arm64.json from test_dir
test_path = Path(__file__).resolve()
test_dir = test_path.parent

# preamble prepended to the assembly text built by InstList.to_test_case
ASM_HEADER = """
.section .data.main
"""

# base addresses for calculating expected contract traces
# NOTE(review): PC0 has the same value as the starting offset hard-coded in
# InstList.set_offsets (0x8); keep the two in sync
PC0 = 0x8
MEM_BASE = 0x1000000
CODE_BASE = 0x8000
MAIN_OFFSET = 0x1000
FAULTY_OFFSET = 0x2000

# values that get_default_input() writes into the 'main' area, the first GPRs,
# and the 'faulty' area, respectively
MEM_DEFAULT_VALUE = 1
REG_DEFAULT_VALUE = 2
MEM_FAULTY_DEFAULT_VALUE = 3
# NOTE(review): not used in this file; presumably the initial stack pointer expected
# by the tests that import it - confirm against the callers
RSP_DEFAULT_VALUE = FAULTY_OFFSET - 8


class Inst:
    """
    One line of test-case assembly plus the metadata the model tests attach to it.

    Attributes:
        text: assembly text of the line
        size: amount by which this line advances the pc offset (see InstList.set_offsets)
        mem_address: NOTE(review): presumably the memory address the instruction is
            expected to access - confirm against the tests that use it
        mem_value: NOTE(review): presumably the value expected at mem_address - confirm
        pc_offset: offset of the line within the test case; 0 until an InstList
            computes it
    """
    text: str
    size: int
    mem_address: int
    mem_value: int
    pc_offset: int

    def __init__(self, text: str, size: int, mem_address: int, mem_value: int):
        # placeholder; the real offset is assigned by InstList.set_offsets()
        self.pc_offset = 0
        self.text, self.size = text, size
        self.mem_address, self.mem_value = mem_address, mem_value


class InstList:
    """
    Ordered list of instructions that form one test case.

    On construction, a `.macro.measurement_end:` entry is appended and every entry
    receives its `pc_offset`. The list can be iterated, indexed, and converted into
    a parsed TestCaseProgram.
    """
    instructions: List[Inst]

    def __init__(self, instructions: List[Inst]):
        """
        :param instructions: instructions of the test case, in program order; the list
               itself is left untouched, but the `pc_offset` of its elements is updated
        """
        # work on a copy so that the caller's list does not silently grow
        # (e.g., when the same list is used to build several InstList objects)
        instructions = list(instructions)

        # measurement_end macro is inserted automatically at the end
        instructions.append(Inst(".macro.measurement_end:", 0, 0, 0))

        # set the pc_offset for each instruction
        self.set_offsets(instructions)
        self.instructions = instructions

    def __iter__(self) -> Generator[Inst, None, None]:
        yield from self.instructions

    def __getitem__(self, index: int) -> Inst:
        return self.instructions[index]

    @staticmethod
    def set_offsets(instructions: List[Inst]) -> None:
        """
        Set the pc_offset for each instruction in a list.

        The first instruction is placed at offset 0x8 (same value as the module-level
        PC0); each following one is placed right after its predecessor.
        """
        pc = 0x8
        for inst in instructions:
            inst.pc_offset = pc
            pc += inst.size

    def to_test_case(self) -> TestCaseProgram:
        """
        Assemble and parse the instructions into a test case.

        The assembly text is written to a temporary file, which is removed again
        even if parsing fails.

        :return: the parsed test case program
        """
        min_arm64_path = test_dir / "min_arm64.json"

        asm_str = ASM_HEADER
        asm_str += "\n".join(x.text for x in self.instructions)
        asm_str += "\n.test_case_exit:\n"

        instruction_set = InstructionSet(min_arm64_path.absolute().as_posix())
        target_desc = ARM64TargetDesc()
        elf_parser = ELFParser(target_desc)
        asm_parser = ARM64AsmParser(instruction_set, target_desc)
        generator = ARM64Generator(CONF.program_generator_seed, instruction_set, target_desc,
                                   asm_parser, elf_parser)

        # delete=False: the parser re-opens the file by name, so it must outlive the handle
        asm_file = tempfile.NamedTemporaryFile("w", encoding="utf-8", delete=False)
        try:
            with asm_file:
                asm_file.write(asm_str)
            tc: TestCaseProgram = asm_parser.parse_file(asm_file.name, generator, elf_parser)
        finally:
            os.unlink(asm_file.name)
        return tc


def get_default_input() -> InputData:
    """
    Create an input with the default values used by the model tests.

    In entry 0, the first two elements of 'main' are set to MEM_DEFAULT_VALUE, the
    first two elements of 'faulty' to MEM_FAULTY_DEFAULT_VALUE, and the first seven
    elements of 'gpr' to REG_DEFAULT_VALUE.
    """
    input_ = InputData()
    area_defaults = (
        ('main', MEM_DEFAULT_VALUE),
        ('faulty', MEM_FAULTY_DEFAULT_VALUE),
    )
    for area, value in area_defaults:
        for idx in (0, 1):
            input_[0][area][idx] = value
    for reg_id in range(7):
        input_[0]['gpr'][reg_id] = REG_DEFAULT_VALUE
    return input_


================================================
FILE: tests/arm64/unit_generators.py
================================================
"""
Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
# pylint: disable=missing-function-docstring
# pylint: disable=missing-class-docstring

import unittest
import tempfile
import subprocess
import os
from pathlib import Path
from copy import deepcopy

from rvzr.arch.arm64.generator import ARM64Generator, _ARM64Printer
from rvzr.arch.arm64.target_desc import ARM64TargetDesc
from rvzr.elf_parser import ELFParser
from rvzr.factory import get_program_generator, get_asm_parser
from rvzr.isa_spec import InstructionSet
from rvzr.tc_components.actor import ActorMode
from rvzr.tc_components.test_case_code import TestCaseProgram
from rvzr.tc_components.test_case_binary import SymbolTableEntry
from rvzr.code_generator import assemble
from rvzr.config import CONF
from rvzr.logs import update_logging_after_config_change

# NOTE(review): module-level write to the shared CONF object; presumably this makes
# the factory helpers used below return the arm64 implementations - confirm
CONF.instruction_set = "arm64"
# location of this file; min_arm64.json and the asm/ fixtures are resolved against test_dir
test_path = Path(__file__).resolve()
test_dir = test_path.parent

# test case whose only content is a raw instruction word; test_arm64_asm_parsing_opcode
# expects the parser to represent it as an instruction named "opcode"
# NOTE(review): 0xd503201f looks like the A64 encoding of `nop` - confirm
ASM_OPCODE = """
.section .data.main
.long 0xd503201f
.test_case_exit:
"""


class ARM64GeneratorTest(unittest.TestCase):
    """ Tests of the arm64 program generator and of the arm64 assembly parser. """

    @classmethod
    def setUpClass(cls) -> None:
        # run the tests with all logging modes disabled
        CONF.logging_modes = []
        update_logging_after_config_change()

    @staticmethod
    def _remove_if_exists(path: str) -> None:
        """ Delete a file, tolerating the case where it is already gone. """
        if os.path.exists(path):
            os.unlink(path)

    def _add_guest_actor(self) -> None:
        """
        Add a kernel-mode guest actor named `guest_1` to the configuration.

        The previous actor configuration is restored via addCleanup, so it is put
        back even when an assertion in the calling test fails.
        """
        # pylint: disable=protected-access
        prev_actors = deepcopy(CONF.get_actors_conf())
        self.addCleanup(setattr, CONF, "_actors", prev_actors)

        CONF.get_actors_conf()["guest_1"] = deepcopy(CONF._actor_default)
        CONF.get_actors_conf()["guest_1"]["name"] = "guest_1"
        CONF.get_actors_conf()["guest_1"]["mode"] = "guest"
        CONF.get_actors_conf()["guest_1"]["privilege_level"] = "kernel"

    @staticmethod
    def load_tc(asm_str: str) -> TestCaseProgram:
        """
        Parse an assembly string into a test case.

        The string is written to a temporary file, which is removed again even if
        parsing fails.
        """
        instruction_set = InstructionSet((test_dir / "min_arm64.json").absolute().as_posix())
        generator = get_program_generator(CONF.program_generator_seed, instruction_set)
        asm_parser = get_asm_parser(instruction_set)
        elf_parser = ELFParser(ARM64TargetDesc())

        # delete=False: the parser re-opens the file by name, so it must outlive the handle
        asm_file = tempfile.NamedTemporaryFile("w", encoding="utf-8", delete=False)
        try:
            with asm_file:
                asm_file.write(asm_str)
            tc: TestCaseProgram = asm_parser.parse_file(asm_file.name, generator, elf_parser)
        finally:
            os.unlink(asm_file.name)
        return tc

    def test_arm64_configuration(self) -> None:
        CONF.generator = "random"
        instruction_set = InstructionSet((test_dir / "min_arm64.json").absolute().as_posix(),
                                         CONF.instruction_categories)
        gen = get_program_generator(CONF.program_generator_seed, instruction_set)
        self.assertEqual(gen.__class__, ARM64Generator)

    def test_arm64_all_instructions(self) -> None:
        # pylint: disable=protected-access
        # Note: This function tests internals of the generator, which is why we
        # have to disable the protected-access warning.

        # only the names of the files are needed; close the handles right away
        with tempfile.NamedTemporaryFile("w", delete=False) as asm_file, \
                tempfile.NamedTemporaryFile("w", delete=False) as obj_file:
            asm_name, obj_name = asm_file.name, obj_file.name

        try:
            instruction_set = InstructionSet(
                (test_dir / "min_arm64.json").absolute().as_posix())
            generator = get_program_generator(CONF.program_generator_seed, instruction_set)
            function_generator = generator._function_generator
            tc = TestCaseProgram(asm_name)
            tc.assign_obj(obj_name)

            func = function_generator.generate_empty(".function_0",
                                                     tc.find_section(name="main"))
            tc.find_section(name="main").append(func)
            printer = _ARM64Printer(ARM64TargetDesc())

            # try generating instruction strings
            for bb in func:
                for instruction_spec in instruction_set.non_control_flow_specs:
                    # fill up with random operand, following the spec
                    inst = generator.generate_instruction(instruction_spec)
                    bb.insert_after(bb.get_last(), inst)

                for instr in bb:
                    instr_str = printer._instruction_to_str(instr)
                    self.assertTrue(instr_str, f'Instruction {instr} was not generated.')

            # apply generator passes
            for p in generator._passes:
                p.run_on_test_case(tc)

            # write the instructions to the asm file
            generator._printer.print(tc)

            # check if the generated instructions are valid
            try:
                assemble(tc)
            except subprocess.CalledProcessError:
                self.fail("Generated invalid instruction(s)")
        finally:
            # the object file may be missing if the assembler failed, hence the guarded removal
            self._remove_if_exists(obj_name)
            self._remove_if_exists(asm_name)

    def test_arm64_asm_parsing_basic(self) -> None:
        instruction_set = InstructionSet((test_dir / "min_arm64.json").absolute().as_posix())
        generator = get_program_generator(CONF.program_generator_seed, instruction_set)
        asm_parser = get_asm_parser(instruction_set)
        elf_parser = ELFParser(ARM64TargetDesc())

        asm_name = (test_dir / "asm/asm_basic.asm").absolute().as_posix()
        tc: TestCaseProgram = asm_parser.parse_file(asm_name, generator, elf_parser)
        section = tc[0]
        functions = list(section)

        self.assertEqual(len(functions), 2)

        main = functions[0]
        self.assertEqual(main.name, ".function_0")

        self.assertEqual(len(main), 3)

        bb0 = main[1]
        bb1 = main[2]
        exit_ = main.get_exit_bb()

        self.assertEqual(bb0.successors[0], bb1)
        self.assertEqual(bb1.successors[0], exit_)

        self.assertEqual(functions[1].name, ".function_end")

    def test_arm64_asm_parsing_opcode(self) -> None:

        tc = self.load_tc(ASM_OPCODE)
        functions = list(tc[0])

        main_iter = iter(functions[0])
        bb0 = next(main_iter)
        insts = list(bb0)
        self.assertEqual(insts[0].name, "macro")
        self.assertEqual(insts[1].name, "opcode")

    def test_arm64_asm_parsing_section(self) -> None:
        self._add_guest_actor()

        instruction_set = InstructionSet((test_dir / "min_arm64.json").absolute().as_posix())
        generator = get_program_generator(CONF.program_generator_seed, instruction_set)
        asm_parser = get_asm_parser(instruction_set)
        elf_parser = ELFParser(ARM64TargetDesc())
        name = (test_dir / "asm/asm_multiactor.asm").absolute().as_posix()
        tc: TestCaseProgram = asm_parser.parse_file(name, generator, elf_parser)

        self.assertEqual(tc.n_actors(), 2)
        self.assertEqual(tc.find_actor(name="main").mode, ActorMode.HOST)
        self.assertEqual(tc.find_actor(name="main").get_id(), 0)
        self.assertEqual(tc.find_actor(name="guest_1").mode, ActorMode.GUEST)
        self.assertEqual(tc.find_actor(name="guest_1").get_id(), 1)

        self.assertEqual(len(tc), 2)

        sec1 = tc[0]
        self.assertEqual(len(sec1), 3)
        self.assertEqual(sec1.owner.get_id(), 0)
        self.assertTrue(sec1.owner.is_main)

        f1 = sec1[0]
        self.assertEqual(f1.name, ".function_0")
        self.assertEqual(len(f1[0]), 3)

        f2 = sec1[1]
        self.assertEqual(f2.name, ".function_2")
        self.assertEqual(len(f2[0]), 1)

        sec2 = tc[1]
        self.assertEqual(len(sec2), 1)
        self.assertEqual(sec2.owner.get_id(), 1)
        self.assertFalse(sec2.owner.is_main)

        f1 = sec2[0]
        self.assertEqual(f1.name, ".function_1")
        self.assertEqual(len(f1[0]), 1)

    def test_arm64_asm_parsing_symbols(self) -> None:
        self._add_guest_actor()

        instruction_set = InstructionSet((test_dir / "min_arm64.json").absolute().as_posix())

        generator = get_program_generator(CONF.program_generator_seed, instruction_set)
        asm_parser = get_asm_parser(instruction_set)
        elf_parser = ELFParser(ARM64TargetDesc())
        name = (test_dir / "asm/asm_symbol.asm").absolute().as_posix()
        tc: TestCaseProgram = asm_parser.parse_file(name, generator, elf_parser)
        obj = tc.get_obj()
        symbol_table = obj.symbol_table()

        self.assertEqual(symbol_table[0], SymbolTableEntry(0, 0, 0, 0))  # function_0
        self.assertEqual(symbol_table[1], SymbolTableEntry(0, 0, 1, 0))  # measurement_start
        self.assertEqual(symbol_table[2], SymbolTableEntry(0, 0x10, 2, 0))  # measurement_end
        self.assertEqual(symbol_table[3], SymbolTableEntry(0, 0x20, 0, 1))  # function_1
        self.assertEqual(symbol_table[4], SymbolTableEntry(1, 0, 0, 2))  # function_2


================================================
FILE: tests/arm64/unit_isa_loader.py
================================================
"""
Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
import unittest
from pathlib import Path

from rvzr.isa_spec import InstructionSet
from rvzr.config import CONF

# location of this file; min_arm64.json is resolved against test_dir
test_path = Path(__file__).resolve()
test_dir = test_path.parent
# NOTE(review): module-level write to the shared CONF object; presumably selects the
# arm64 backend for everything imported after this point - confirm
CONF.instruction_set = "arm64"


class ARM64ISALoaderTest(unittest.TestCase):
    """ Tests of loading the arm64 instruction set specification from JSON. """

    def test_loading(self) -> None:
        """ `mov` must be present after loading only the general-dataxfer category. """
        spec_path = (test_dir / "min_arm64.json").absolute().as_posix()
        categories = ["general-dataxfer"]
        loaded = InstructionSet(spec_path, categories)
        self.assertIn("mov", [spec.name for spec in loaded.instructions])


================================================
FILE: tests/kernel_module.bats
================================================
#!/usr/bin/env bats

# number of zero bytes that make up the data of one input
# (see load_input and the dd invocations in the noise tests)
INPUT_SIZE=$((4096 * 3))

# 16 bytes written between the input header and the input data
# NOTE(review): the meaning of the individual fields is defined by the executor's
# input format, which is not visible in this file
INPUT_META='\x00\x03\x00\x00\x00\x00\x00\x00''\x00\x00\x00\x00\x00\x00\x00\x00'

setup() {
    # absolute path of the directory that contains this test file
    DIR="$(cd "$(dirname "$BATS_TEST_FILENAME")" &>/dev/null && pwd)"
    # third field of lscpu's "Vendor" line and second field of its "Architecture" line
    VENDOR="$(lscpu | awk '/Vendor/{print $3}')"
    ARCH="$(lscpu | awk '/Architecture/{print $2}')"
}

function x86_only() {
    # skip the calling test unless setup() detected an x86_64 machine
    [ "$ARCH" == "x86_64" ] || skip "x86-only test"
}

# Print a 32-bit value as four printf-style byte escapes (\xNN), least significant
# byte first. The output is meant to be embedded into a printf format string.
hex2bin32() {
    local value=$1
    local shift_by
    for shift_by in 0 8 16 24; do
        printf '\\x%02x' $(((value >> shift_by) & 255))
    done
}

# Create an input file and, optionally, load it into the executor.
#
# Arguments:
#   $1 - "true" to only create the file; "false" to also write it to
#        /sys/rvzr_executor/inputs and delete it afterwards
#   $2 - value stored as a little-endian 32-bit field in the header
#   $3 - path of the file to create
function load_input() {
    local create_only=$1
    local nruns=$2
    local dest_file=$3
    local header="\x01\x00\x00\x00\x00\x00\x00\x00$(hex2bin32 "$nruns")\x00\x00\x00\x00"

    # header and INPUT_META hold \xNN escapes, so they are deliberately used as printf formats
    printf "$header" >"$dest_file"
    printf "$INPUT_META" >>"$dest_file"
    # pad with INPUT_SIZE zero bytes
    dd if=/dev/zero bs="$INPUT_SIZE" count=1 status=none >>"$dest_file"

    if [ "$create_only" = false ]; then
        cat "$dest_file" >/sys/rvzr_executor/inputs
        rm "$dest_file"
    fi
}

# Convert an assembly file into a test case binary and, optionally, load it into
# the executor.
#
# Arguments:
#   $1 - "true" to only create the binary; "false" to also write it to
#        /sys/rvzr_executor/test_case and delete it afterwards
#   $2 - path of the assembly file
#   $3 - path of the binary to create
function load_test_case() {
    local create_only=$1
    local asm_file=$2
    local dest_file=$3
    local target="arm64"

    # everything that is not x86_64 is treated as arm64
    if [ "$ARCH" == "x86_64" ]; then
        target="x86"
    fi
    "${DIR}/scripts/create_rcbf_file.py" "$asm_file" "$dest_file" "$target"

    if [ "$create_only" = false ]; then
        cat "$dest_file" >/sys/rvzr_executor/test_case
        rm "$dest_file"
    fi
}

# Put the executor into the configuration the tracing tests start from:
# debug GPR mode off, SSBP patch on, prefetcher off.
function set_default_config() {
    local sysfs=/sys/rvzr_executor
    printf '0\n' >"$sysfs/enable_dbg_gpr_mode"
    printf '1\n' >"$sysfs/enable_ssbp_patch"
    printf '0\n' >"$sysfs/enable_prefetcher"
}

@test "Executor: Loading a test case" {
    # build a minimal test case binary without loading it
    printf "nop\n" >tmp.asm
    load_test_case true tmp.asm tmp.bin
    # the assembly source is not needed anymore; do not leave it in the working directory
    rm -f tmp.asm

    # writing the test case to the executor must succeed
    run bash -c 'cat tmp.bin > /sys/rvzr_executor/test_case'
    [ "$status" -eq 0 ]
    rm tmp.bin

    # writing an input to the executor must succeed
    load_input true 1 input.bin
    run bash -c 'cat input.bin > /sys/rvzr_executor/inputs'
    [ "$status" -eq 0 ]
    rm input.bin

    # reading the inputs file back is expected to yield 1
    run cat /sys/rvzr_executor/inputs
    [ "$status" -eq 0 ]
    echo "Output: $output"
    [[ "$output" -eq "1" ]]
}

@test "Executor: Tracing" {
    # reading the trace while pinned to CPU 0 must succeed
    local trace=/sys/rvzr_executor/trace
    run taskset -c 0 cat "$trace"
    [[ "$status" -eq 0 ]]
}

@test "Executor: Printing base addresses" {
    # neither the data base nor the code base may be reported as "0"
    local attr
    for attr in print_data_base print_code_base; do
        run cat "/sys/rvzr_executor/$attr"
        echo "Output: $output"
        [[ "$output" != "0" ]]
    done
}

@test "Executor: Controlling warmups" {
    # a value written to the warmups file must be readable back
    local knob=/sys/rvzr_executor/warmups
    echo "50" >"$knob"
    run cat "$knob"
    [[ "$output" -eq "50" ]]
}

@test "Executor: Controlling patches" {
    tmpasm=$(mktemp /tmp/revizor-test.XXXXXX.asm)
    tmpbin=$(mktemp /tmp/revizor-test.XXXXXX.o)
    tmpinput=$(mktemp /tmp/revizor-test.XXXXXX.bin)
    echo "nop" >"$tmpasm"
    load_test_case false "$tmpasm" "$tmpbin"
    load_input false 1 "$tmpinput"
    # tmpbin and tmpinput are removed by the loaders; remove the assembly file as well
    rm -f "$tmpasm"

    # toggle each knob on and off; tracing must keep working after every change
    local attr value
    for attr in enable_ssbp_patch enable_prefetcher; do
        for value in 1 0; do
            run bash -c "echo \"$value\" > /sys/rvzr_executor/$attr"
            [ "$status" -eq 0 ]
            run taskset -c 0 cat /sys/rvzr_executor/trace
            [ "$status" -eq 0 ]
        done
    done
}

@test "Executor: Hardware tracing with GPR" {
    set_default_config
    echo "1" >/sys/rvzr_executor/enable_dbg_gpr_mode

    tmpasm=$(mktemp /tmp/revizor-test.XXXXXX.asm)
    tmpbin=$(mktemp /tmp/revizor-test.XXXXXX.o)
    tmpinput=$(mktemp /tmp/revizor-test.XXXXXX.bin)

    # load the constants 1..6 into six registers
    if [ "$ARCH" == "x86_64" ]; then
        echo "mov \$1, %rax; mov \$2, %rbx; mov \$3, %rcx; mov \$4, %rdx; mov \$5, %rsi; mov \$6, %rdi;" >"$tmpasm"
    else
        echo "mov x0, 1; mov x1, 2; mov x2, 3; mov x3, 4; mov x4, 5; mov x5, 6;" >"$tmpasm"
    fi

    load_test_case false "$tmpasm" "$tmpbin"
    load_input false 1 "$tmpinput"
    # tmpbin and tmpinput are removed by the loaders; remove the assembly file as well
    rm -f "$tmpasm"

    # with debug GPR mode enabled, the trace is expected to contain the register values
    run taskset -c 0 cat /sys/rvzr_executor/trace
    echo "Output: $output"
    [[ "$output" == *"1,2,3,4,5,6"* ]]
}

@test "Executor: Hardware tracing with P+P" {
    x86_only
    set_default_config
    echo "P+P" >/sys/rvzr_executor/measurement_mode

    tmpasm=$(mktemp /tmp/revizor-test.XXXXXX.asm)
    tmpbin=$(mktemp /tmp/revizor-test.XXXXXX.o)
    tmpinput=$(mktemp /tmp/revizor-test.XXXXXX.bin)

    # first run: a test case consisting of a single nop
    echo "nop" >"$tmpasm"
    load_test_case false "$tmpasm" "$tmpbin"
    load_input false 1 "$tmpinput"

    run taskset -c 0 cat /sys/rvzr_executor/trace
    echo "Output: $output"
    [[ "$output" == *"9223372036854775808,"* ]]

    # second run: a load from offset 512 relative to %r14
    echo "movq %r14, %rax; add \$512, %rax; movq (%rax), %rax" >"$tmpasm"
    load_test_case false "$tmpasm" "$tmpbin"
    load_input false 1 "$tmpinput"
    # tmpbin and tmpinput are removed by the loaders; remove the assembly file as well
    rm -f "$tmpasm"

    run taskset -c 0 cat /sys/rvzr_executor/trace
    echo "Output: $output"
    [[ "$output" == *"9259400833873739776,"* ]]
}

@test "Executor: Hardware tracing with F+R" {
    x86_only
    set_default_config
    echo "F+R" >/sys/rvzr_executor/measurement_mode

    tmpasm=$(mktemp /tmp/revizor-test.XXXXXX.asm)
    tmpbin=$(mktemp /tmp/revizor-test.XXXXXX.o)
    tmpinput=$(mktemp /tmp/revizor-test.XXXXXX.bin)

    # first run: a test case consisting of a single nop
    echo "nop" >"$tmpasm"
    load_test_case false "$tmpasm" "$tmpbin"
    load_input false 1 "$tmpinput"

    run taskset -c 0 cat /sys/rvzr_executor/trace
    echo "Output: $output"
    [[ "$output" == *"9223372036854775808,"* ]]

    # second run: a load from offset 512 relative to %r14
    echo "movq %r14, %rax; add \$512, %rax; movq (%rax), %rax" >"$tmpasm"
    load_test_case false "$tmpasm" "$tmpbin"
    load_input false 1 "$tmpinput"
    # tmpbin and tmpinput are removed by the loaders; remove the assembly file as well
    rm -f "$tmpasm"

    run taskset -c 0 cat /sys/rvzr_executor/trace
    echo "Output: $output"
    [[ "$output" == *"9259400833873739776,"* ]]
}

@test "Executor: Hardware tracing with E+R" {
    x86_only
    set_default_config
    echo "E+R" >/sys/rvzr_executor/measurement_mode

    tmpasm=$(mktemp /tmp/revizor-test.XXXXXX.asm)
    tmpbin=$(mktemp /tmp/revizor-test.XXXXXX.o)
    tmpinput=$(mktemp /tmp/revizor-test.XXXXXX.bin)

    # first run: a test case consisting of a single nop
    echo "nop" >"$tmpasm"
    load_test_case false "$tmpasm" "$tmpbin"
    load_input false 1 "$tmpinput"

    run taskset -c 0 cat /sys/rvzr_executor/trace
    echo "Output: $output"
    [[ "$output" == *"9223372036854775808,"* ]]

    # second run: a load from offset 512 relative to %r14
    echo "movq %r14, %rax; add \$512, %rax; movq (%rax), %rax" >"$tmpasm"
    load_test_case false "$tmpasm" "$tmpbin"
    load_input false 1 "$tmpinput"
    # tmpbin and tmpinput are removed by the loaders; remove the assembly file as well
    rm -f "$tmpasm"

    run taskset -c 0 cat /sys/rvzr_executor/trace
    echo "Output: $output"
    [[ "$output" == *"9259400833873739776,"* ]]
}

# Checks that, for each measurement mode, at least `threshold` of the trace lines
# collected for one test case start with the same value.
@test "Executor: Noise Level" {
    x86_only
    set_default_config

    # execute one dummy run to set Executor into the default config and to load the test case
    # nruns: value stored in the input header and number of INPUT_SIZE-sized blocks written
    # threshold: minimum number of occurrences of the most frequent first trace field
    nruns=1000
    threshold=900

    tmpasm=$(mktemp /tmp/revizor-test.XXXXXX.asm)
    tmpbin=$(mktemp /tmp/revizor-test.XXXXXX.o)
    tmpinput=$(mktemp /tmp/revizor-test.XXXXXX.bin)
    tmpresult=$(mktemp /tmp/revizor-test.XXXXXX.txt)

    # create the test case binary without loading it; it is loaded once per mode below
    echo "movq (%r14), %rax" >$tmpasm
    load_test_case true "$tmpasm" "$tmpbin"

    # write the inputs in three steps: header, metadata, and nruns blocks of zeroes
    printf "\x01\x00\x00\x00\x00\x00\x00\x00$(hex2bin32 $nruns)\x00\x00\x00\x00" >/sys/rvzr_executor/inputs
    printf $INPUT_META >>/sys/rvzr_executor/inputs
    dd if=/dev/zero of="$tmpinput" bs=$INPUT_SIZE count=$nruns status=none
    cat $tmpinput >/sys/rvzr_executor/inputs

    run cat /sys/rvzr_executor/inputs
    [[ "$output" -eq "1" ]]

    for mode in "P+P" "F+R" "E+R"; do
        # echo $mode
        echo $mode >/sys/rvzr_executor/measurement_mode
        cat "$tmpbin" >/sys/rvzr_executor/test_case

        echo "" >$tmpresult

        # keep reading the trace until the output contains "done"
        # START=$(date +%s.%N)
        while true; do
            run taskset -c 0 cat /sys/rvzr_executor/trace
            [ "$status" -eq 0 ]
            echo "$output" >>$tmpresult
            if [[ "$output" == *"done"* ]]; then
                break
            fi
        done
        # END=$(date +%s.%N)
        # echo "$END - $START" | bc

        # take the first comma-separated field of every line that contains a comma,
        # count how often each value occurs, and keep the highest count
        # cat $tmpresult | awk -F, '/,/{print $1}' | sort | uniq -c | sort -r -b -n
        run bash -c "cat $tmpresult | awk -F, '/,/{print \$1}' | sort | uniq -c | sort -r -b -n | awk '//{print \$1}' | head -n1"
        echo "$mode: $output"
        [ $output -ge $threshold ]
    done
    # NOTE(review): the cleanup below is not reached when one of the checks above fails
    rm $tmpasm
    rm "$tmpbin"
    rm "$tmpinput"
    rm "$tmpresult"
}

# Checks that, in P+P mode, at least `threshold` of the trace lines collected for a
# test case containing a store start with the same value.
@test "Executor: Noisy stores" {
    x86_only
    set_default_config

    # execute one dummy run to set Executor into the default config and to load the test case
    # nruns: value stored in the input header and number of INPUT_SIZE-sized blocks written
    # threshold: minimum number of occurrences of the most frequent first trace field
    nruns=1000
    threshold=900

    tmpasm=$(mktemp /tmp/revizor-test.XXXXXX.asm)
    tmpbin=$(mktemp /tmp/revizor-test.XXXXXX.o)
    tmpinput=$(mktemp /tmp/revizor-test.XXXXXX.bin)
    tmpresult=$(mktemp /tmp/revizor-test.XXXXXX.txt)

    # create the test case binary (a store to offset 512 relative to %r14) without loading it
    echo "movq %r14, %rax; add \$512, %rax; movq \$128, (%rax)" >$tmpasm
    load_test_case true $tmpasm $tmpbin

    # write the inputs in three steps: header, metadata, and nruns blocks of zeroes
    printf "\x01\x00\x00\x00\x00\x00\x00\x00$(hex2bin32 $nruns)\x00\x00\x00\x00" >/sys/rvzr_executor/inputs
    printf $INPUT_META >>/sys/rvzr_executor/inputs
    dd if=/dev/zero of="$tmpinput" bs=$INPUT_SIZE count=$nruns status=none
    cat $tmpinput >/sys/rvzr_executor/inputs

    mode="P+P"
    echo $mode >/sys/rvzr_executor/measurement_mode
    cat $tmpbin >/sys/rvzr_executor/test_case

    run cat /sys/rvzr_executor/inputs
    [[ "$output" -eq "1" ]]

    echo "" >$tmpresult

    # keep reading the trace until the output contains "done"
    while true; do
        run taskset -c 0 cat /sys/rvzr_executor/trace
        [ "$status" -eq 0 ]
        echo "$output" >>$tmpresult
        if [[ "$output" == *"done"* ]]; then
            break
        fi
    done

    # take the first comma-separated field of every line that contains a comma,
    # count how often each value occurs, and keep the highest count
    # NOTE(review): unlike the "Noise Level" test, the counts are sorted without -b -n
    run bash -c "cat $tmpresult | awk -F, '/,/{print \$1}' | sort | uniq -c | sort -r | awk '//{print \$1}' | head -n1"
    echo "$mode: $output"
    [ $output -ge $threshold ]

    # NOTE(review): the cleanup below is not reached when one of the checks above fails
    rm $tmpasm
    rm "$tmpbin"
    rm "$tmpinput"
    rm "$tmpresult"
}


================================================
FILE: tests/pre-release.sh
================================================
#!/usr/bin/env bash
# FILE: tests/pre-release.sh
#       Run all available demos to ensure that there are no regressions in the detection of
#       the known vulnerabilities on the CPU under test

# stop on command failures, failed pipeline stages, and unset variables;
# refuse to overwrite existing files with '>'
set -o errexit -o pipefail -o noclobber -o nounset
# terminate the script on SIGINT
trap exit INT

# absolute path of this script and of its directory
SCRIPT=$(realpath $0)
SCRIPT_DIR=$(dirname $SCRIPT)

# escape sequences used to color the output
red='\033[0;31m'
green='\033[0;32m'
yellow='\033[0;33m'
reset='\033[0m'

# command-line options; filled in by read_args
verbose=0
work_dir=""
# root of the revizor checkout; can be overridden via the environment,
# defaults to the parent of the directory that contains this script
revizor_dir=${revizor_dir:-"$SCRIPT_DIR/.."}

# ==================================================================================================
# Command-line argument parsing
# ==================================================================================================
# Print the usage message to stdout
function print_help() {
    cat <<EOF
Usage: $0 [-v] -w <work_dir>

Options:
  -v, --verbose        Enable verbose output
  -w, --workdir        Working directory for temporary files
EOF
}

# Parse the command line and initialize the global settings.
#
# Sets: verbose, work_dir, revizor, instructions, conf_dir
# Exits with a non-zero code if getopt is unavailable, the arguments are invalid,
# the work directory is not given, or a required revizor file is missing.
function read_args() {
    # check for availability of getopt; `getopt --test` is expected to exit with code 4
    local getopt_status=0
    getopt --test >/dev/null || getopt_status=$?
    if [[ $getopt_status -ne 4 ]]; then
        echo 'ERROR: getopt is not available'
        exit 1
    fi

    # List arguments
    LONGOPTS=workdir:,verbose
    OPTIONS=w:v

    # Parse output
    PARSED=$(getopt --options=$OPTIONS --longoptions=$LONGOPTS --name "$0" -- "$@") || exit 2
    eval set -- "$PARSED"

    while true; do
        case "$1" in
        -v | --verbose)
            # was `verbose=0`, which made the flag a no-op
            verbose=1
            ;;
        -w | --workdir)
            work_dir=$2
            shift
            ;;
        --)
            shift
            break
            ;;
        esac
        shift
    done

    # check usage
    if [ -z "$work_dir" ]; then
        print_help
        exit 1
    fi

    # make sure that the directories and required files exist
    if [ ! -d "$work_dir" ]; then
        # not fatal: prep_files_for_run (re)creates the work directory before every run
        echo "ERROR: Could not find '$work_dir'"
    fi
    if [ ! -f "$revizor_dir/revizor.py" ]; then
        echo "ERROR: Could not find '$revizor_dir/revizor.py'"
        exit 1
    fi
    if [ ! -f "$revizor_dir/base.json" ]; then
        echo "ERROR: Could not find '$revizor_dir/base.json'"
        exit 1
    fi

    # Globals
    work_dir=$(realpath "$work_dir")
    revizor="$revizor_dir/revizor.py"
    instructions="$revizor_dir/base.json"
    conf_dir="$revizor_dir/demo/"

}

# ==================================================================================================
# Patching and manipulation of configuration files
# ==================================================================================================

# Patches that turn a repro config into a verification config.
# The array maps the name of a demo to the YAML snippet that make_verification_conf
# appends to the demo's configuration file.
declare -A verif_patches
verif_patches["detect-v1"]="contract_execution_clause:\n  - cond"
verif_patches["detect-v1-store"]="contract_observation_clause: ct"
verif_patches["detect-v4"]="x86_executor_enable_ssbp_patch: true"

function make_verification_conf() {
    # create a version of the reproduce file that should NOT trigger a violation if
    # the violation has an expected root cause. E.g., for Spectre V1, we change the contract
    # execution clause to COND instead of SEQ, which means that violations caused by conditional
    # branches should no longer be reported by the fuzzer (i.e., become non-reproducible).
    #
    # Arguments:
    #   $1 - name of the demo (key into verif_patches)
    #   $2 - path of the repro configuration
    #   $3 - path of the verification configuration to create
    # Returns: 0 if a patch was applied; 1 if no patch exists for the demo
    #          (the verification file is then an unpatched copy of the repro file)

    local name=$1
    local repro_conf=$2
    local verif_conf=$3

    cp "$repro_conf" "$verif_conf"
    if [[ ! -v verif_patches[$name] ]]; then
        printf "${yellow}NO VERIFICATION PATCH AVAILABLE${reset}\n"
        return 1
    fi
    local patch=${verif_patches[$name]}
    # -e: the patches use \n to encode multi-line YAML
    echo -e "$patch" >>"$verif_conf"
    return 0
}

# Append a `logging_modes` setting that contains only `info` to a configuration file.
#
# Arguments:
#   $1 - path of the configuration file
function disable_stat_logging() {
    local config=$1

    # disable statistics logging to avoid polluting the output
    printf 'logging_modes:\n  - info\n' >>"$config"
}


# Append an empty `logging_modes` setting to a configuration file.
#
# Arguments:
#   $1 - path of the configuration file
function disable_all_logging() {
    local config=$1

    # disable all logging to avoid polluting the output
    echo "logging_modes: []" >>"$config"
}

# ==================================================================================================
# Functions
# ==================================================================================================
function prep_files_for_run() {
    # Prepare a clean working directory for the demo named $1.
    #
    # Sets the following globals for the caller:
    #   org_config - the demo's original configuration file
    #   config     - patched copy of the configuration inside $work_dir
    #   log        - path of the log file for this demo
    # Exits the script with status 1 if no configuration file exists for the demo.
    local name=$1
    local candidate

    # start from an empty working directory
    rm -rf $work_dir &>/dev/null || true
    mkdir -p $work_dir

    # plain demos are stored as <name>.yaml; templated demos as <name>/config.yaml
    for candidate in "$conf_dir/${name}.yaml" "$conf_dir/$name/config.yaml"; do
        org_config="$candidate"
        if [ -f "$org_config" ]; then
            break
        fi
    done
    if [ ! -f "$org_config" ]; then
        echo "ERROR: Could not find '$org_config'"
        exit 1
    fi

    # work on a patched copy so that the original config stays untouched
    config="$work_dir/conf.yaml"
    cp $org_config $config
    disable_stat_logging $config

    # make sure that the log file does not exist yet
    log="$work_dir/${name}-log.txt"
    rm $log &>/dev/null || true
}

function check_results() {
    # Inspect the outcome of one experiment stage and print a one-line verdict.
    #
    # Arguments: $1 - log file of the stage
    #            $2 - exit code of the stage
    #            $3 - exit code that the stage is expected to produce
    # Returns:   0 if the log is free of error markers and the exit code matches; 1 otherwise
    local log=$1
    local exit_code=$2
    local expected=$3

    # verdict labels
    fail="${red}FAIL${reset}"
    error="${red}ERROR${reset}"
    ok="${green}PASSED${reset}"

    # any of these markers in the log means that the tool itself failed
    if grep -E "ERROR|Error|Errno" $log &>/dev/null; then
        printf "$error\n"
        return 1
    fi

    # an unexpected exit code means that the stage did not produce the expected outcome
    if [ $exit_code -ne $expected ]; then
        printf "$fail [exit code %s != %s]\n" "$exit_code" "$expected"
        return 1
    fi

    # report the duration taken from the log's "Duration" line
    duration=$(awk '/Duration/{print $2}' $log)
    printf "$ok [%s sec]\n" "$duration"
    return 0
}


function run() {
    # Run the detect -> reproduce -> verify pipeline for one demo.
    #
    # Arguments:
    #   $1 - demo name; selects the config (see prep_files_for_run) and the verification patch
    #   $2 - optional, default 0; non-zero selects `tfuzz` with $conf_dir/$name/template.asm
    #
    # Each stage is judged by check_results; when a stage fails, the function returns 0
    # without running the later stages. Sets the globals vdir, repro_conf and verif_conf.
    local name=$1
    local templated=${2:-0}

    prep_files_for_run $name

    # Print the header
    echo ""
    printf "${yellow}============================= $name =============================${reset}\n"

    # run the test
    printf "${green}+ Detect ...  ${reset}\n"
    set +e
    if [ $verbose -eq 1 ]; then set -x; fi
    if [ $templated -eq 0 ]; then
        python ${revizor} fuzz -s $instructions -c $config -I $conf_dir -i $NUM_INPUTS -n $NUM_PROGS --timeout $TIMEOUT -w "$work_dir" 2>&1 | tee "$log"
        # take the status of python, not of tee ($? reflects tee unless pipefail is enabled)
        exit_code=${PIPESTATUS[0]}
    else
        template="$conf_dir/$name/template.asm"
        python ${revizor} tfuzz -s $instructions -t $template -c $config -I $conf_dir -i $NUM_INPUTS -n $NUM_PROGS --timeout $TIMEOUT -w "$work_dir" 2>&1 | tee "$log"
        exit_code=${PIPESTATUS[0]}
    fi
    if [ $verbose -eq 1 ]; then set +x; fi
    check_results $log $exit_code 1
    if [ $? -ne 0 ]; then return 0; fi
    set -e

    # locate the violation directory; the glob is expanded here so that $vdir is a real path
    # (if nothing matches, the pattern stays literal and the check below reports it)
    local vdir_matches=("$work_dir"/violation*)
    vdir="${vdir_matches[0]}"
    if [ ! -d "$vdir" ]; then
        echo "ERROR: Could not find a violation directory: '$work_dir/violation*'"
        exit 1
    fi

    # reproduce the violations
    printf "${green}+ Reproduce ...  ${reset}\n"
    repro_conf="$vdir/reproduce.yaml"
    disable_all_logging $repro_conf
    set +e
    if [ $verbose -eq 1 ]; then set -x; fi
    python ${revizor} reproduce -s $instructions -c $repro_conf -I $conf_dir -t $vdir/program.asm -i $(ls $vdir/input*.bin) 2>&1 | tee "$log"
    exit_code=${PIPESTATUS[0]}
    if [ $verbose -eq 1 ]; then set +x; fi
    check_results $log $exit_code 1
    if [ $? -ne 0 ]; then return 0; fi
    set -e

    # verify that the violation has the expected root cause:
    # with the verification patch applied, the violation must no longer reproduce (exit code 0)
    printf "${green}+ Verify ...  ${reset}\n"
    verif_conf="$work_dir/verif.yaml"
    set +e
    make_verification_conf $name $repro_conf $verif_conf
    if [ $? -ne 0 ]; then return 0; fi
    if [ $verbose -eq 1 ]; then set -x; fi
    python ${revizor} reproduce -s $instructions -c $verif_conf -I $conf_dir -t $vdir/program.asm -i $(ls $vdir/input*.bin) 2>&1 | tee "$log"
    exit_code=${PIPESTATUS[0]}
    if [ $verbose -eq 1 ]; then set +x; fi
    check_results $log $exit_code 0
    if [ $? -ne 0 ]; then return 0; fi
    set -e
}

# ==================================================================================================
# Test configuration
# number of inputs per test case (passed to the fuzzer as -i)
NUM_INPUTS=25
NUM_PROGS=1000000000 # some large number that is never reached before the timeout
TIMEOUT=$((10 * 60 * 60))         # per-demo fuzzing timeout (--timeout), in seconds: 10 hours

# NOTE(review): read_args is defined outside this section; presumably it parses the
# command-line options of this script
read_args "$@"

# Measurements
printf "Starting at $(date '+%H:%M:%S on %d.%m.%Y')\n"

# demos that run regardless of the CPU model
run "detect-v1"
run "detect-v1-store"
run "detect-v4"

# demos that run only when /proc/cpuinfo mentions 'E-2288G'
if grep -q 'E-2288G' /proc/cpuinfo; then
    run "detect-mds"
    run "detect-foreshadow"
    run "detect-zdi"
fi

# templated demos (second argument 1) that run only when /proc/cpuinfo mentions 'AMD'
if grep -q 'AMD' /proc/cpuinfo; then
    run "tsa-sq" 1
    run "tsa-l1d" 1
fi

# these two are slow to detect, thus run them last
run "detect-sco"
run "detect-v1-var"


================================================
FILE: tests/quick-test.sh
================================================
#!/usr/bin/env bash

function assert_violation() {
    # Run the given command line and require that it reports a violation, i.e. that it exits
    # with status 1 and prints the "=== Violations detected ===" banner to stdout.
    # On failure, print diagnostics and exit the script with status 1.
    local cmd="$*"
    log=$(mktemp)

    bash -c "$cmd" > $log
    status=$?
    output=$(cat $log)
    # the captured output is all we need; do not leave the temporary file behind
    rm -f "$log"

    if [[ "$status" -eq 1 && "$output" = *"=== Violations detected ==="* ]]; then
        echo "Detection: OK"
    else
        echo "Detection: FAIL"
        echo "Command: $cmd"
        echo "Exit code: $status"
        echo "Output: '$output'"
        exit 1
    fi
}

function assert_no_violation() {
    # Run the given command line and require that it reports no violation, i.e. that it exits
    # with status 0 and does not print the "=== Violations detected ===" banner to stdout.
    # On failure, print diagnostics and exit the script with status 1.
    local cmd="$*"

    log=$(mktemp)

    bash -c "$cmd" > $log
    status=$?
    output=$(cat $log)
    # the captured output is all we need; do not leave the temporary file behind
    rm -f "$log"

    if [[ "$status" -eq 0 && "$output" != *"=== Violations detected ==="* ]]; then
        echo "Filtering: OK"
    else
        echo "Filtering: FAIL"
        echo "Command: $cmd"
        echo "Exit code: $status"
        echo "Output: '$output'"
        exit 1
    fi
}

# directory that contains this script; the test inputs are addressed relative to it
SCRIPT_DIR=$(dirname $(realpath $0))

# Fuzz the Spectre V1 test program with the ct-seq config: a violation must be detected.
# NOTE: ./revizor.py is resolved relative to the current working directory, not SCRIPT_DIR.
cmd="./revizor.py fuzz -s $SCRIPT_DIR/../base.json --save-violations f -I $SCRIPT_DIR/x86_tests/configs -t $SCRIPT_DIR/x86_tests/asm/spectre_v1.asm -c $SCRIPT_DIR/x86_tests/configs/ct-seq.yaml -i 20"
assert_violation "$cmd"

# Same program with the ct-cond config: no violation must be reported.
cmd="./revizor.py fuzz -s $SCRIPT_DIR/../base.json --save-violations f -I $SCRIPT_DIR/x86_tests/configs -t $SCRIPT_DIR/x86_tests/asm/spectre_v1.asm -c $SCRIPT_DIR/x86_tests/configs/ct-cond.yaml -i 20"
assert_no_violation "$cmd"


================================================
FILE: tests/runtests.sh
================================================
#!/usr/bin/env bash

# Names of the testing stages accepted by the --stage option (validated in parse_args).
# Each name is also the name of the function that implements the stage (see run_one_stage).
AVAILABLE_STAGES=("type_check" "code_style_check" "core_unit_tests" "package_install_test"
    "km_tests" "arch_unit_tests" "acceptance_tests")

function parse_args() {
    # Parse the command-line arguments of the script into global variables:
    #   STRICT           - true if --strict was given
    #   IGNORE_ERRORS    - true if --ignore-errors was given
    #   SKIP_KM_TESTS    - true if --skip-km-tests was given
    #   STAGE            - argument of --stage <name>; empty if the option is absent
    #   POSITIONAL_ARGS  - all arguments that are not options
    # Exits with status 1 on an unknown option, on a missing --stage argument, or when the
    # requested stage is not listed in AVAILABLE_STAGES.
    POSITIONAL_ARGS=()
    IGNORE_ERRORS=false
    STRICT=false
    SKIP_KM_TESTS=false
    STAGE=""

    while [[ $# -gt 0 ]]; do
        case $1 in
        --strict)
            STRICT=true
            shift
            ;;
        --ignore-errors)
            IGNORE_ERRORS=true
            shift
            ;;
        --skip-km-tests)
            SKIP_KM_TESTS=true
            shift
            ;;
        --stage)
            if [ -z "$2" ]; then
                echo "Error: --stage requires an argument"
                exit 1
            fi
            STAGE="$2"
            shift 2
            ;;
        -* | --*)
            echo "Unknown option $1"
            exit 1
            ;;
        *)
            # positional argument: it must be consumed here, otherwise the loop never ends
            POSITIONAL_ARGS+=("$1")
            shift
            ;;
        esac
    done

    # the stage name must match one of the available stages exactly
    if [[ -n "$STAGE" && ! " ${AVAILABLE_STAGES[@]} " =~ " ${STAGE} " ]]; then
        echo "Invalid stage: $STAGE"
        echo "Available stages: ${AVAILABLE_STAGES[*]}"
        exit 1
    fi

}

# ==================================================================================================
# Testing Stages
# ==================================================================================================
function type_check() {
    # Type-check the package sources listed in $ALL_PY with mypy (strict mode).
    # When $1 is "true", additionally type-check the unit tests.
    local enable_strict=$1
    local -a common_opts=(--no-warn-unused-ignores --untyped-calls-exclude=elftools)
    local target

    echo ""
    echo "===== MyPy ====="
    cd $SCRIPT_DIR/.. || exit
    MYPYPATH=rvzr/ python3 -m mypy --strict $ALL_PY "${common_opts[@]}"
    cd - >/dev/null || exit

    if [ "$enable_strict" != true ]; then
        return
    fi

    echo ""
    cd $SCRIPT_DIR/.. || exit
    echo "===== STRICT CHECK: MyPy (Unit Tests) ====="
    # each pattern is expanded by the shell when $target is used unquoted below
    for target in "tests/unit_*.py" "tests/x86_tests/unit_*.py" "tests/arm64/unit_*.py"; do
        MYPYPATH=rvzr/ python3 -m mypy --strict $target "${common_opts[@]}"
    done
    cd - >/dev/null || exit

}

function code_style_check() {
    # Check the code style of the repository:
    #   - flake8 on the whole repository (always)
    #   - pylint on the sources in $ALL_PY (only when $1 is "true")
    #   - clang-tidy on the DynamoRIO model sources (only when a build directory exists and
    #     a libstdc++-*-dev package is installed)
    local enable_strict=$1

    echo ""
    echo "===== Code Style Checking with flake8 ====="
    cd $SCRIPT_DIR/.. || exit
    python3 -m flake8 --max-line-length 100 --ignore E402,W503 . --count --show-source --statistics
    cd - >/dev/null || exit

    if [ "$enable_strict" = true ]; then
        echo ""
        cd $SCRIPT_DIR/.. || exit
        echo "===== STRICT CHECK: PyLint ====="
        python3 -m pylint --rcfile=.pylintrc $ALL_PY
        cd - >/dev/null || exit
    fi

    echo ""
    echo "===== [DR] Code Style & Linting with clang-tidy ====="
    cd $SCRIPT_DIR/../rvzr/model_dynamorio || exit

    # clang-tidy is pointed at the build directories (-p), so at least one of them must exist
    if [ -d "adapter/build" ] || [ -d "backend/build" ]; then
        # this test requires that libstdc++-*-dev is installed on the system;
        # collect the version suffixes of the installed libstdc++-*-dev packages
        versions=($(dpkg -l | grep libstdc++- | grep dev | awk '{print $2}' | sed 's/libstdc++-//;s/-dev//'))
        if [ ${#versions[@]} -eq 0 ]; then
            echo "[DR] No libstdc++-*-dev package found; skipping clang-tidy check"
            # restore the working directory before the early return
            cd - >/dev/null || exit
            return
        fi

        if [ -d "adapter/build" ]; then
            # NOTE(review): this searches the whole model_dynamorio directory ('.') for C files,
            # whereas the backend check below is restricted to 'backend' - confirm it is intended
            find . -name "*.c" -or -name "*.h" | grep -v "CMakeFiles" | xargs clang-tidy --quiet -p adapter/build/ --config-file=adapter/.clang-tidy
        fi
        if [ -d "backend/build" ]; then
            find backend -name "*.cpp" -or -name "*.hpp" | grep -v "CMakeFiles" | xargs clang-tidy --quiet --use-color -p backend/build --config-file=backend/.clang-tidy
        fi
    else
        echo "[DR] No build directory for DR backend found; skipping clang-tidy check"
    fi

    cd - >/dev/null || exit
}

function core_unit_tests() {
    # Run the architecture-independent unit tests, one module per unittest invocation,
    # with a separator line printed between consecutive modules.
    local suite
    local separator=""

    echo ""
    echo "===== Core Unit Tests ====="
    cd $SCRIPT_DIR/.. || exit
    # each entry is "<module> [unittest options]"; it is split into words when used unquoted
    for suite in \
        "tests.unit_fuzzer -v" \
        "tests.unit_analyser -v" \
        "tests.unit_docs -v" \
        "tests.unit_isa_loader" \
        "tests.unit_stats" \
        "tests.unit_tc_components" \
        "tests.unit_traces"; do
        if [ -n "$separator" ]; then
            echo "$separator"
        fi
        python3 -m unittest $suite
        separator="-------------"
    done
    cd - >/dev/null || exit
}

function package_install_test() {
    # Build the package, install the resulting wheel, and check that the installed CLI
    # entry point starts and prints its usage message.
    # The stage is skipped when there is no internet connection.
    # Exits the script with status 1 if the usage message is not printed.
    echo ""
    echo "===== Package installation ====="

    # skip if no internet connection
    if ! ping -c 1 8.8.8.8 &>/dev/null; then
        echo "No internet connection, skipping package installation test"
        return
    fi

    # rebuild and reinstall the package from the repository root
    cd $SCRIPT_DIR/.. || exit
    python3 -m pip uninstall revizor-fuzzer -y
    python3 -m build
    python3 -m pip install dist/*.whl
    cd - >/dev/null || exit

    cd $SCRIPT_DIR/ || exit
    # The command may exit with a non-zero status; only its output matters here.
    # `|| true` tolerates that without toggling errexit, so a run started with
    # --ignore-errors does not get errexit switched on as a side effect.
    out=$(python3 -c "import rvzr; rvzr.cli.main()" 2>&1) || true
    if [[ "$out" != *"usage: "* ]]; then
        echo "> ERROR: Package installation test failed"
        exit 1
    else
        echo "> Package installation test passed"
    fi
    cd - >/dev/null || exit
}

function km_tests() {
    # Run the kernel module test suite (kernel_module.bats) unless SKIP_KM_TESTS is true.
    if [ "$SKIP_KM_TESTS" = true ]; then
        return
    fi

    echo ""
    echo "===== Executor kernel module ====="
    cd $SCRIPT_DIR || exit
    ./kernel_module.bats
    cd - >/dev/null || exit
}

function arch_unit_tests() {
    # Run the architecture-specific unit tests: the x86 suites when $ARCH is "x86_64",
    # the arm64 suites for any other value of $ARCH.
    #
    # Note: we intentionally do not use the 'discover' option because it causes cross-contamination
    # of config options between unit tests

    if [ "$ARCH" == "x86_64" ]; then
        echo ""
        echo "===== x86 unit tests ====="
        cd $SCRIPT_DIR/.. || exit
        python3 -m unittest tests.x86_tests.unit_isa_loader -v
        echo "-------------"
        python3 -m unittest tests.x86_tests.unit_generators -v
        echo "-------------"
        python3 -m unittest tests.x86_tests.unit_model -v
        echo "-------------"
        python3 -m unittest tests.x86_tests.unit_taint_tracker -v
        echo "-------------"
        python3 -m unittest tests.x86_tests.unit_dr_decoder -v
        echo "-------------"
        cd - >/dev/null || exit
        # exit
    else
        echo ""
        echo "===== arm64 unit tests ====="
        # change the directory exactly once, so that `cd -` below returns to the caller's
        # directory (a second `cd` would overwrite OLDPWD)
        cd $SCRIPT_DIR/.. || exit
        python3 -m unittest tests.arm64.unit_isa_loader -v
        echo "-------------"
        python3 -m unittest tests.arm64.unit_generators -v
        echo "-------------"
        # the arm64 model and taint tracker suites are currently disabled:
        # python3 -m unittest tests.arm64.unit_model -v
        # echo "-------------"
        # python3 -m unittest tests.arm64.unit_taint_tracker -v
        # echo "-------------"
        cd - >/dev/null || exit
        # exit
    fi
}

function acceptance_tests() {
    # Run the acceptance test suite (acceptance.bats) unless SKIP_KM_TESTS is true.
    if [ "$SKIP_KM_TESTS" = true ]; then
        return
    fi

    echo ""
    echo "===== Acceptance tests ====="
    cd $SCRIPT_DIR || exit
    ./acceptance.bats
    cd - >/dev/null || exit
}

# ==================================================================================================
# Runners
# ==================================================================================================
function run_one_stage() {
    # Run the single testing stage named $1. Every stage is implemented by a function of the
    # same name; the two checking stages additionally receive the $STRICT flag.
    # Exits the script with status 1 if the stage name is unknown.
    local stage=$1

    case $stage in
    type_check | code_style_check)
        "$stage" $STRICT
        ;;
    core_unit_tests | package_install_test | km_tests | arch_unit_tests | acceptance_tests)
        "$stage"
        ;;
    *)
        echo "Unknown stage: $stage"
        exit 1
        ;;
    esac
}

function main() {
    # Entry point: parse the arguments, detect the environment, and run either the single
    # stage requested with --stage or all stages in their default order.
    # Errors abort the run (errexit) unless --ignore-errors was given.
    parse_args "$@"

    if [ "$IGNORE_ERRORS" != "true" ]; then
        set -e
    fi

    if [ "$STRICT" = true ]; then
        echo "Including optional tests"
    fi

    VENDOR="$(lscpu | grep Vendor | awk '{print $3}')"
    ARCH="$(lscpu | grep Architecture | awk '{print $2}')"

    SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" &>/dev/null && pwd)"
    # Collect the sources relative to the repository root: the stages `cd` there before they
    # use $ALL_PY, so the list must not depend on the directory the script was started from.
    ALL_PY=$(cd "$SCRIPT_DIR/.." >/dev/null && find rvzr/ -name "*.py" | grep -v "config" | grep -v "fuzzer")

    # if STAGE is set, run only that stage
    if [[ -n "$STAGE" ]]; then
        run_one_stage "$STAGE"
        exit 0
    fi

    type_check $STRICT
    code_style_check $STRICT
    package_install_test
    core_unit_tests
    km_tests
    arch_unit_tests
    acceptance_tests
}

main "$@"


================================================
FILE: tests/scripts/create_rcbf_file.py
================================================
#!/usr/bin/env python3
"""
File: create_rcbf_file.py
      Creates an RCBF test case file from an assembly source file.
      On details of the RCBF file format, see docs/devel/binary-formats.md

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""

import sys
import os
import subprocess


def write_actor_metadata(f, entry):
    """Write one actor metadata record to the binary stream `f`.

    `entry` is indexed 0..5 and holds, in order: id, mode, pl, data permissions,
    data ept properties, code permissions. Every field is written as an 8-byte
    little-endian unsigned integer.
    """
    for position in range(6):
        f.write(entry[position].to_bytes(8, byteorder='little'))


def write_st_entry(f, entry):
    """Write one symbol table entry to the binary stream `f`.

    `entry` is indexed 0..3 and holds, in order: owner, offset, id, args.
    Every field is written as an 8-byte little-endian unsigned integer.
    """
    for position in range(4):
        f.write(entry[position].to_bytes(8, byteorder='little'))


def write_metadata_entry(f, entry):
    """Write one section metadata entry to the binary stream `f`.

    `entry` is indexed 0..2 and holds, in order: owner, size, reserved.
    Every field is written as an 8-byte little-endian unsigned integer.
    """
    for position in range(3):
        f.write(entry[position].to_bytes(8, byteorder='little'))


def write_nop(f, arch: str):
    """Write the macro placeholder bytes for `arch` to the binary stream `f`.

    The placeholder is 8 bytes for 'x86' and 12 bytes for 'arm64', matching
    get_macro_placeholder_size(). Nothing is written for any other architecture.
    """
    placeholders = {
        'x86': b'\x0f\x1f\x84\x00\xff\x00\x00\x00',
        'arm64': b'\x1f\x20\x03\xd5\x1f\x20\x03\xd5\x1f\x20\x03\xd5',
    }
    placeholder = placeholders.get(arch)
    if placeholder is not None:
        f.write(placeholder)


def get_macro_placeholder_size(arch: str):
    """Return the size in bytes of a macro placeholder: 8 for 'x86', 12 otherwise."""
    return 8 if arch == 'x86' else 12


def main(asm_file: str, obj_file: str, arch: str):
    """Assemble `asm_file` and wrap the resulting code into an RCBF file `obj_file`.

    The generated test case has a single actor and three symbols: the main function and
    the MACRO_MEASUREMENT_START / MACRO_MEASUREMENT_END macros, whose placeholders are
    emitted right before and right after the assembled code.

    The intermediate binary is written next to the source as `<asm_file>.o`.

    :param asm_file: path to the assembly source file
    :param obj_file: path of the RCBF file to create
    :param arch: target architecture, 'x86' or 'arm64'; selects the placeholder encoding
    :return: 0 on success
    :raises subprocess.CalledProcessError: if `as`, `strip` or `objcopy` exits with an error
    """
    n_actors = 1
    n_symbols = 3

    # compile the assembly file; check=True stops on a failed step, so that we never package
    # a missing or stale binary
    tmpbin = asm_file + '.o'
    subprocess.run(['as', asm_file, '-o', tmpbin], check=True)
    subprocess.run(['strip', '--remove-section=.note.gnu.property', tmpbin], check=True)
    subprocess.run(['objcopy', tmpbin, '-O', 'binary', tmpbin], check=True)
    main_size = os.path.getsize(tmpbin)

    # create the test case file
    with open(obj_file, 'wb') as f:
        # write the test case header
        f.write((n_actors).to_bytes(8, byteorder='little'))
        f.write((n_symbols).to_bytes(8, byteorder='little'))

        # write actor metadata
        write_actor_metadata(f, (0, 0, 0, 0x8000000000000063, 0, 0))

        # write the symbol table; main_size grows as the placeholders are accounted for
        # - symbol 1: main
        write_st_entry(f, (0, 0, 0, 0))
        # - symbol 2: MACRO_MEASUREMENT_START (at offset 0, before the assembled code)
        write_st_entry(f, (0, 0, 1, 0))
        main_size += get_macro_placeholder_size(arch)
        # - symbol 3: MACRO_MEASUREMENT_END (right after the start placeholder and the code)
        write_st_entry(f, (0, main_size, 2, 0))
        main_size += get_macro_placeholder_size(arch)

        # write the section metadata
        write_metadata_entry(f, (0, main_size, 0))

        # write the code
        write_nop(f, arch)  # nop - MACRO_MEASUREMENT_START
        with open(tmpbin, 'rb') as bin_file:
            code = bin_file.read()
            f.write(code)
        write_nop(f, arch)  # nop - MACRO_MEASUREMENT_END

    return 0


if __name__ == '__main__':
    # command line: <asm_file> <dest_file> <x86|arm64>
    if len(sys.argv) != 4:
        print("Usage: %s <asm_file> <dest_file> <x86|arm64>" % sys.argv[0])
        sys.exit(1)

    _asm_path, _dest_path, _arch_name = sys.argv[1:4]
    if _arch_name not in ('x86', 'arm64'):
        print("Invalid architecture: %s" % _arch_name)
        sys.exit(1)

    sys.exit(main(_asm_path, _dest_path, _arch_name))


================================================
FILE: tests/scripts/create_rdbf_file.py
================================================
#!/usr/bin/env python3
"""
File: create_rdbf_file.py
      Creates an RDBF test case file from an assembly source file.
      On details of the RDBF file format, see docs/devel/binary-formats.md

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
import sys


def main(dest_file: str, n_inputs: int, n_actors: int):
    """Create an RDBF file in which every data section is filled with zeros.

    Layout of the file: a header (number of actors, number of inputs), one metadata entry
    (section size, reserved) per actor and input, and then one data section per actor and
    input. All integers are 8-byte little-endian values.

    :param dest_file: path of the file to create
    :param n_inputs: number of inputs
    :param n_actors: number of actors
    :return: 0
    """
    area_size = 4096
    # every section consists of main_area, faulty_area, and reg_init_region
    section_size = 3 * area_size

    with open(dest_file, 'wb') as out:
        # header
        out.write(n_actors.to_bytes(8, byteorder='little'))
        out.write(n_inputs.to_bytes(8, byteorder='little'))

        n_sections = n_actors * n_inputs

        # metadata: section size followed by a reserved field
        metadata_entry = section_size.to_bytes(8, byteorder='little') \
            + (0).to_bytes(8, byteorder='little')
        for _ in range(n_sections):
            out.write(metadata_entry)

        # data sections
        zeroed_section = bytes(section_size)
        for _ in range(n_sections):
            out.write(zeroed_section)

    return 0


if __name__ == '__main__':
    # command line: <dest_file> <n_inputs> <n_actors>
    if len(sys.argv) != 4:
        print(f"Usage: {sys.argv[0]} <dest_file> <n_inputs> <n_actors>")
        sys.exit(1)

    # both counts must be integers
    try:
        n_inputs = int(sys.argv[2])
    except ValueError:
        print(f"Invalid number of inputs: {sys.argv[2]}")
        sys.exit(1)

    try:
        n_actors = int(sys.argv[3])
    except ValueError:
        print(f"Invalid number of actors: {sys.argv[3]}")
        sys.exit(1)

    exit_status = main(sys.argv[1], n_inputs, n_actors)
    sys.exit(exit_status)


================================================
FILE: tests/unit_analyser.py
================================================
"""
Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""

import unittest
from typing import List

import numpy as np
import numpy.typing as npt

from rvzr.analyser import MergedBitmapAnalyser, SetAnalyser, ChiSquaredAnalyser
from rvzr.tc_components.test_case_data import InputData
from rvzr.tc_components.test_case_code import TestCaseProgram
from rvzr.traces import CTrace, HTrace, RawHTraceSample, CTraceEntry
from rvzr.config import CONF


def _htrace_from_trace(trace_list: List[int]) -> HTrace:
    """Build an HTrace with one sample per value of `trace_list`.

    The value is stored in the first field of the sample; the other five fields are zero.
    """
    n_samples = len(trace_list)
    samples: npt.NDArray[np.void] = np.ndarray(n_samples, dtype=RawHTraceSample)
    for position, value in enumerate(trace_list):
        samples[position] = (value, 0, 0, 0, 0, 0)
    return HTrace(samples)


def _ctrace_from_int(trace: int) -> CTrace:
    """Build a contract trace with a single "val" entry that holds `trace`."""
    entry = CTraceEntry("val", trace)
    return CTrace([entry])


class AnalyserTest(unittest.TestCase):
    """
    Tests of the analysers on four inputs that form two contract classes (ctraces 1, 1, 2, 2).
    In every test, only the first class has differing hardware traces, so exactly one
    violation is expected and it must carry the ctrace of the first class.
    """

    def test_merged_bitmap_analyser(self) -> None:
        analyser = MergedBitmapAnalyser()
        inputs = [InputData()] * 4
        program = TestCaseProgram("")

        # two identical samples per input
        htraces = [
            _htrace_from_trace([bitmap] * 2) for bitmap in (0b1101, 0b1011, 0b1000, 0b1000)
        ]
        ctraces = [_ctrace_from_int(class_id) for class_id in (1, 1, 2, 2)]

        violations = analyser.filter_violations(ctraces, htraces, program, inputs)
        self.assertEqual(len(violations), 1)
        self.assertEqual(violations[0].ctrace, ctraces[0])

    def test_set_analyser(self) -> None:
        analyser = SetAnalyser()
        inputs = [InputData()] * 4
        program = TestCaseProgram("")

        htraces = [
            _htrace_from_trace(samples)
            for samples in ([1, 2, 2, 1], [1, 3, 3, 1], [1, 1, 1, 1], [1, 1, 1, 1])
        ]
        ctraces = [_ctrace_from_int(class_id) for class_id in (1, 1, 2, 2)]

        violations = analyser.filter_violations(ctraces, htraces, program, inputs)
        self.assertEqual(len(violations), 1)
        self.assertEqual(violations[0].ctrace, ctraces[0])

    def test_chi2_analyser(self) -> None:
        analyser = ChiSquaredAnalyser()
        inputs = [InputData()] * 4
        program = TestCaseProgram("")

        # all-ones samples vs. samples that are all twos except for the first two
        n_samples = CONF.executor_sample_sizes[0]
        all_ones = [1] * n_samples
        mostly_twos = [2] * n_samples
        mostly_twos[0] = 1
        mostly_twos[1] = 1
        htraces = [_htrace_from_trace(all_ones)]
        htraces += [_htrace_from_trace(mostly_twos) for _ in range(3)]

        ctraces = [_ctrace_from_int(class_id) for class_id in (1, 1, 2, 2)]

        violations = analyser.filter_violations(ctraces, htraces, program, inputs)
        self.assertEqual(len(violations), 1)
        self.assertEqual(violations[0].ctrace, ctraces[0])


================================================
FILE: tests/unit_docs.py
================================================
"""
Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from typing import Dict, List, Union

import unittest
import inspect
import pathlib
from rvzr.config import CONF

# directory of this test file and the documentation directory next to it
FILE_DIR = pathlib.Path(__file__).parent.resolve()
DOC_DIR = FILE_DIR.parent / "docs"

# Markers that parse_config_options_from_docs looks for in the lines of the config reference:
# - header that starts the actor section; options found in it get the "actor_" prefix
ACTOR_SECTION_HEADER = "## <a name=\"actor\"></a> Actor Configuration"
# - line that announces the list of available values of an option
AVAILABLE_OPTIONS_HEADER = '=== "Available Options"'
# - marker that precedes the backtick-quoted default value of an option
DEFAULT_VALUE_PREFIX = ":material-water:"
# - marker of an option whose default value is auto-detected
AUTODETECTED_PREFIX = ":octicons-cpu-24:"


def _is_option_name(line: str) -> bool:
    # format: #### `option_name`
    return line.startswith("#### `") and "`" in line[6:]


def parse_config_options_from_docs(doc_lines: List[str]) -> Dict[str, List[Union[str, List[str]]]]:
    """
    Extract the documented default and the documented alternatives of every config option.

    A line is interpreted by the first rule that applies:
    option heading; default value (only while the current option has no default yet);
    "Available Options" header; list of available options.

    :param doc_lines: Lines from the config.md file
    :return: Dictionary mapping option names to [default_value, [available_options]];
             options from the actor section are prefixed with "actor_"
    """
    parsed: Dict[str, List[Union[str, List[str]]]] = {}
    current: str = ""
    inside_actor_section: bool = False
    expecting_options: bool = False

    for line in doc_lines:
        # Track whether we are inside the actor section
        if ACTOR_SECTION_HEADER in line:
            inside_actor_section = True
        elif line.startswith("## "):
            inside_actor_section = False

        # Rule 1: heading with the option name
        if _is_option_name(line):
            closing_tick = line.index("`", 6)
            bare_name = line[6:closing_tick]
            current = f"actor_{bare_name}" if inside_actor_section else bare_name
            parsed[current] = ["", []]
            expecting_options = False
            continue

        # Rule 2: default value (e.g., :material-water: `value`);
        # while the default is unknown, no other rule is tried for the line
        if current and parsed[current][0] == "":
            if DEFAULT_VALUE_PREFIX in line and "`" in line:
                # pair every backtick-quoted chunk with the text that precedes it
                chunks = line.split("`")
                for preceding, quoted in zip(chunks[0::2], chunks[1::2]):
                    if DEFAULT_VALUE_PREFIX in preceding:
                        parsed[current][0] = quoted
                        break
            elif AUTODETECTED_PREFIX in line:
                parsed[current][0] = "(auto-detected)"
            continue

        # Rule 3: start of the Available Options section
        if AVAILABLE_OPTIONS_HEADER in line:
            expecting_options = True
            continue

        # Rule 4: available options (e.g., `opt1` | `opt2` | `opt3`)
        if expecting_options and current and "`" in line and "|" in line:
            stripped_line = line.strip()
            if stripped_line.startswith("`"):
                candidates = [chunk.strip() for chunk in stripped_line.split("|")]
                parsed[current][1] = [
                    candidate.strip("`")
                    for candidate in candidates
                    if candidate.startswith("`") and candidate.endswith("`")
                ]
            expecting_options = False

    return parsed


class DocumentationTest(unittest.TestCase):
    """
    Checks that the configuration reference (docs/ref/config.md) is in sync with CONF.
    """
    longMessage = False

    def test_conf_docs(self) -> None:
        # Every public config option must be mentioned in the documentation.

        with open(DOC_DIR / "ref/config.md", "r") as doc_file:
            doc_text = doc_file.read()

        # public, non-callable members of CONF are the config options
        members = inspect.getmembers(CONF, lambda x: not inspect.isroutine(x))
        option_names = [name for name, _ in members if not name.startswith("_")]

        for option in option_names:
            self.assertTrue(option in doc_text, msg=f"{option} not found in documentation")

    def test_conf_options_docs(self) -> None:
        # The documented defaults and the documented possible values must match CONF.

        with open(DOC_DIR / "ref/config.md", "r") as doc_file:
            doc_lines = doc_file.readlines()

        # option name -> [documented default, documented possible values]
        doc_options = parse_config_options_from_docs(doc_lines)

        # public, non-callable members of CONF are the config options
        members = inspect.getmembers(CONF, lambda x: not inspect.isroutine(x))
        options = [member for member in members if not member[0].startswith("_")]
        alternatives = CONF._option_values  # pylint: disable=protected-access

        for name, default_ in options:
            doc_default, doc_values = doc_options[name][0], doc_options[name][1]
            assert isinstance(doc_default, str)

            # defaults documented in parentheses (e.g., auto-detected ones) are not compared
            if not doc_default.startswith("("):
                self.assertEqual(
                    str(default_),
                    doc_default,
                    msg=f"Default for `{name}` is incorrect: {default_} != {doc_default}")

            # possible values are compared only if the documentation lists them
            if doc_values:
                self.assertSetEqual(
                    set(alternatives[name]),
                    set(doc_values),
                    msg=f"Options for `{name}` are incorrect: {alternatives[name]} != {doc_values}")


================================================
FILE: tests/unit_fuzzer.py
================================================
"""
File: Unit tests for rvzr/fuzzer.py

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
# pylint: disable=missing-function-docstring,missing-class-docstring,protected-access
# pylint: disable=too-many-instance-attributes,too-many-public-methods

from __future__ import annotations

import unittest
from unittest.mock import MagicMock, patch
from typing import List, Any, Iterator
from contextlib import contextmanager
import numpy as np

from rvzr.fuzzer import Fuzzer, _RoundManager, _RoundState
from rvzr.tc_components.test_case_code import TestCaseProgram
from rvzr.tc_components.test_case_data import InputData
from rvzr.traces import CTrace, HTrace, CTraceEntry, RawHTraceSample, TraceBundle, Violation, \
    ArrayOfSamples
from rvzr.config import CONF
from rvzr.logs import update_logging_after_config_change


def _mk_ctrace(value: int) -> CTrace:
    """Build a contract trace that consists of a single "val" entry holding `value`"""
    entry = CTraceEntry("val", value)
    return CTrace([entry])


def _mk_htrace(trace_value: int, sample_size: int = 100) -> HTrace:
    """Build a "cache" hardware trace of `sample_size` identical samples.

    Each sample holds `trace_value` in its first field; the other five fields are zero.
    """
    sample = (trace_value, 0, 0, 0, 0, 0)
    samples: ArrayOfSamples = np.ndarray(sample_size, dtype=RawHTraceSample)
    for position in range(sample_size):
        samples[position] = sample
    return HTrace(samples, "cache")


def _mk_violation(n_inputs: int = 2) -> Violation:
    """Build a violation for the program "test.asm" with `n_inputs` fresh inputs.

    All measurements share the same contract trace, while every input gets its own
    hardware trace. The hardware classes of the violation are set to the trivial ones.
    """
    inputs = [InputData() for _ in range(n_inputs)]

    measurements: List[TraceBundle] = []
    for input_id, input_ in enumerate(inputs):
        bundle = TraceBundle(
            input_id=input_id,
            input_=input_,
            ctrace=_mk_ctrace(1),  # identical for all inputs
            htrace=_mk_htrace(0x100 + input_id),  # unique for every input
        )
        measurements.append(bundle)

    violation = Violation(measurements, inputs, TestCaseProgram("test.asm"))
    violation.set_trivial_hw_classes()
    return violation


@contextmanager
def _temp_conf_override(**kwargs: Any) -> Iterator[None]:
    """Context manager to temporarily override CONF settings.

    Every keyword argument that names an existing CONF attribute is set to the given value
    for the duration of the `with` block; keywords that CONF does not have are ignored.
    On exit, the original values are restored and the logging setup is refreshed.

    The overrides are applied inside the `try`, so that an exception raised while applying
    them does not leave the earlier overrides in place.
    """
    original_values = {}
    try:
        for key, value in kwargs.items():
            if hasattr(CONF, key):
                # remember the original before overriding, so that it is always restored
                original_values[key] = getattr(CONF, key)
                setattr(CONF, key, value)
        yield
    finally:
        for key, value in original_values.items():
            setattr(CONF, key, value)
        update_logging_after_config_change()


class _MockSetup:
    """Container of canned traces plus a helper that wires them into the fuzzer mocks"""

    def __init__(self, inputs: List[InputData]) -> None:
        self.inputs = inputs
        # the input sequence repeated twice
        self.boosted_inputs = inputs * 2
        # four identical contract traces ...
        self.ctraces = [_mk_ctrace(1) for _ in range(4)]
        # ... and two pairs of hardware traces
        self.htraces = [_mk_htrace(value) for value in (0x100, 0x100, 0x200, 0x200)]

    def configure_mocks(
        self,
        data_gen: MagicMock,
        model: MagicMock,
        executor: MagicMock,
        analyser: MagicMock,
        violations: List[Violation] | None = None
    ) -> None:
        """Set the return values of the mocks for a typical fuzzing round.

        The analyser mock returns `violations`, or an empty list if none are given.
        """
        if violations is None:
            violations = []

        data_gen.generate_boosted.return_value = self.boosted_inputs
        model.trace_test_case_with_taints.return_value = (self.ctraces[:2], [None, None])
        model.trace_test_case.return_value = self.ctraces
        executor.trace_test_case.return_value = self.htraces
        analyser.filter_violations.return_value = violations


class FuzzerRoundTest(unittest.TestCase):
    """
    Tests for the fuzzing_round method and its multi-stage violation detection.

    Every fuzzer component (model, executor, analyser, generators, parsers) is replaced
    with a MagicMock, so the tests exercise only the control flow of a fuzzing round.
    """

    def setUp(self) -> None:
        """Force a known CONF state and build a Fuzzer wired to mocked components"""
        conf_overrides = {
            "logging_modes": [],
            "executor_sample_sizes": [100, 200, 500],
            "inputs_per_class": 2,
            "enable_fast_path_model": True,
            "enable_priming": True,
            "model_min_nesting": 1,
            "model_max_nesting": 3,
        }
        # Snapshot every option that is about to be overridden (including the nesting
        # bounds), so that tearDown restores all of them and nothing leaks into other tests
        self.orig_conf = {name: getattr(CONF, name) for name in conf_overrides}
        for name, value in conf_overrides.items():
            setattr(CONF, name, value)
        update_logging_after_config_change()

        # Create test data
        self.test_case = TestCaseProgram("test.asm")
        self.inputs = [InputData(), InputData()]

        # Mock components
        self.mock_model = MagicMock()
        self.mock_model.is_speculative = True

        self.mock_executor = MagicMock()
        self.mock_arch_model = MagicMock()
        self.mock_arch_executor = MagicMock()

        self.mock_analyser = MagicMock()
        self.mock_code_gen = MagicMock()
        self.mock_data_gen = MagicMock()
        self.mock_elf_parser = MagicMock()
        self.mock_asm_parser = MagicMock()

        # Create a minimal fuzzer with mocked components
        # Using __new__ bypasses __init__, so no factory is called
        self.fuzzer = Fuzzer.__new__(Fuzzer)
        self.fuzzer.model = self.mock_model
        self.fuzzer.executor = self.mock_executor
        self.fuzzer.arch_model = self.mock_arch_model
        self.fuzzer.arch_executor = self.mock_arch_executor
        self.fuzzer.analyser = self.mock_analyser
        self.fuzzer.code_gen = self.mock_code_gen
        self.fuzzer.data_gen = self.mock_data_gen
        self.fuzzer.elf_parser = self.mock_elf_parser
        self.fuzzer.asm_parser = self.mock_asm_parser
        self.fuzzer.log = MagicMock()
        self.fuzzer._work_dir = "/tmp/test"

    def tearDown(self) -> None:
        """Restore every CONF option that setUp has overridden"""
        for name, value in self.orig_conf.items():
            setattr(CONF, name, value)
        update_logging_after_config_change()

    @staticmethod
    def _mk_arch_htraces() -> List[HTrace]:
        """Build four register-type htraces that all hold the values 1..6"""
        samples: ArrayOfSamples = np.ndarray(1, dtype=RawHTraceSample)
        samples[0] = (1, 2, 3, 4, 5, 6)
        return [HTrace(samples, "reg") for _ in range(4)]

    @staticmethod
    def _mk_arch_ctraces(values: List[int]) -> List[CTrace]:
        """Build four identical ctraces with one "val" entry per element of `values`"""
        return [CTrace([CTraceEntry("val", v) for v in values]) for _ in range(4)]

    def test_fuzzing_round_no_violation_fast_path(self) -> None:
        # Test fuzzing_round when no violations are found in the fast path

        boosted_inputs = self.inputs * 2  # inputs_per_class=2
        ctraces = [_mk_ctrace(1), _mk_ctrace(1), _mk_ctrace(2), _mk_ctrace(2)]
        htraces = [_mk_htrace(0x100), _mk_htrace(0x100), _mk_htrace(0x200), _mk_htrace(0x200)]

        self.mock_data_gen.generate_boosted.return_value = boosted_inputs
        self.mock_model.trace_test_case_with_taints.return_value = (ctraces[:2], [None, None])
        self.mock_model.trace_test_case.return_value = ctraces
        self.mock_executor.trace_test_case.return_value = htraces
        self.mock_analyser.filter_violations.return_value = []

        result = self.fuzzer.fuzzing_round(self.test_case, self.inputs, [])
        self.assertIsNone(result)

    def test_fuzzing_round_violation_detected_survives_all_stages(self) -> None:
        # Test fuzzing_round when a genuine violation survives all false positive filters

        with _temp_conf_override(enable_priming=False):
            # Setup: return violations through all stages
            violation = _mk_violation(4)
            mock_setup = _MockSetup(self.inputs)
            mock_setup.configure_mocks(
                self.mock_data_gen, self.mock_model, self.mock_executor,
                self.mock_analyser, [violation]
            )

            # Architectural mismatch check should pass (no mismatch): the executor and
            # the model report the same six register values
            self.mock_arch_executor.trace_test_case.return_value = self._mk_arch_htraces()
            self.mock_arch_model.trace_test_case.return_value = \
                self._mk_arch_ctraces([1, 2, 3, 4, 5, 6])

            # Execute
            result = self.fuzzer.fuzzing_round(self.test_case, self.inputs, [])

            # Verify: violation should survive all stages
            self.assertIsNotNone(result)
            self.assertEqual(result, violation)

    def test_fuzzing_round_fp_filtered_by_nesting(self) -> None:
        # Test that false positives due to insufficient nesting are filtered out
        violation = _mk_violation(4)
        mock_setup = _MockSetup(self.inputs)
        mock_setup.configure_mocks(
            self.mock_data_gen, self.mock_model, self.mock_executor, self.mock_analyser
        )

        # First call (fast path) returns violation, second call (nesting) returns no violation
        self.mock_analyser.filter_violations.side_effect = [[violation], []]

        # Execute
        result = self.fuzzer.fuzzing_round(self.test_case, self.inputs, [])

        # Verify: violation should be filtered out after nesting stage
        self.assertIsNone(result)

    def test_fuzzing_round_fp_filtered_by_taint_mistake(self) -> None:
        # Test that false positives due to taint tracking errors are filtered out
        boosted_inputs = self.inputs * 2
        ctraces_fast = [_mk_ctrace(1), _mk_ctrace(1), _mk_ctrace(1), _mk_ctrace(1)]
        ctraces_full = [_mk_ctrace(1), _mk_ctrace(2), _mk_ctrace(1), _mk_ctrace(2)]
        htraces = [_mk_htrace(0x100), _mk_htrace(0x100), _mk_htrace(0x200), _mk_htrace(0x200)]

        violation = _mk_violation(4)

        self.mock_data_gen.generate_boosted.return_value = boosted_inputs
        self.mock_model.trace_test_case_with_taints.return_value = (ctraces_fast[:2], [None, None])

        # Return different ctraces when called with full tracing (taint_mistake stage)
        self.mock_model.trace_test_case.side_effect = [ctraces_fast, ctraces_fast, ctraces_full]
        self.mock_executor.trace_test_case.return_value = htraces

        # Violation appears with fast ctraces, disappears with full ctraces
        self.mock_analyser.filter_violations.side_effect = [[violation], [violation], []]

        # Execute
        result = self.fuzzer.fuzzing_round(self.test_case, self.inputs, [])

        # Verify: violation should be filtered out after taint_mistake stage
        self.assertIsNone(result)

    def test_fuzzing_round_fp_filtered_by_priming(self) -> None:
        # Test that false positives due to cross-talk between inputs are filtered by priming
        violation = _mk_violation(4)
        mock_setup = _MockSetup(self.inputs)
        mock_setup.configure_mocks(
            self.mock_data_gen, self.mock_model, self.mock_executor,
            self.mock_analyser, [violation]
        )

        # Priming check: traces are NOT equivalent (false positive)
        self.mock_analyser.htraces_are_equivalent.return_value = False

        # Execute
        result = self.fuzzer.fuzzing_round(self.test_case, self.inputs, [])

        # Verify: violation should be filtered out by priming
        self.assertIsNone(result)

    def test_fuzzing_round_noise_stage_extends_htraces(self) -> None:
        # Test the round with a single executor sample size: there is no larger sample
        # size to extend the htraces to, so the noise stage is expected to be skipped
        with _temp_conf_override(executor_sample_sizes=[100]):
            boosted_inputs = self.inputs * 2
            ctraces = [_mk_ctrace(1), _mk_ctrace(1), _mk_ctrace(2), _mk_ctrace(2)]
            htraces = [
                _mk_htrace(0x100, 100),
                _mk_htrace(0x100, 100),
                _mk_htrace(0x200, 100),
                _mk_htrace(0x200, 100)
            ]

            self.mock_data_gen.generate_boosted.return_value = boosted_inputs
            self.mock_model.trace_test_case_with_taints.return_value = (ctraces[:2], [None, None])
            self.mock_model.trace_test_case.return_value = ctraces
            self.mock_executor.trace_test_case.return_value = htraces
            self.mock_analyser.filter_violations.return_value = []

            # Execute
            result = self.fuzzer.fuzzing_round(self.test_case, self.inputs, [])

            # Verify: no violation, noise stage was skipped
            self.assertIsNone(result)
            # Only fast path should execute
            self.assertEqual(self.mock_executor.trace_test_case.call_count, 1)

    def test_fuzzing_round_architectural_mismatch_detected(self) -> None:
        # Test detection of architectural mismatches between model and executor

        # An empty work dir disables file writing on an architectural mismatch.
        # No need to restore it afterwards: setUp builds a fresh fuzzer for every test
        self.fuzzer._work_dir = ""

        # Priming is temporarily disabled to simplify the test
        with _temp_conf_override(enable_priming=False):
            violation = _mk_violation(4)
            mock_setup = _MockSetup(self.inputs)
            mock_setup.configure_mocks(
                self.mock_data_gen, self.mock_model, self.mock_executor,
                self.mock_analyser, [violation]
            )

            # Architectural mismatch: the hardware reports register values 1..6,
            # while the model reports 999 as the first value
            self.mock_arch_executor.trace_test_case.return_value = self._mk_arch_htraces()
            self.mock_arch_model.trace_test_case.return_value = \
                self._mk_arch_ctraces([999, 2, 3, 4, 5, 6])

            # Execute - suppress warning by mocking the report method
            with patch.object(self.fuzzer, '_report_bug_arch'):
                result = self.fuzzer.fuzzing_round(self.test_case, self.inputs, [])

            # Verify: architectural mismatch should filter the violation
            self.assertIsNone(result)

    def test_fuzzing_round_executor_error_handled(self) -> None:
        # Test that IOErrors from executor are handled gracefully
        mock_setup = _MockSetup(self.inputs)
        self.mock_data_gen.generate_boosted.return_value = mock_setup.boosted_inputs
        self.mock_model.trace_test_case_with_taints.return_value = (
            mock_setup.ctraces[:2], [None, None]
        )
        self.mock_model.trace_test_case.return_value = mock_setup.ctraces

        # Executor raises IOError
        self.mock_executor.trace_test_case.side_effect = IOError("Trace collection failed")

        # Execute
        result = self.fuzzer.fuzzing_round(self.test_case, self.inputs, [])

        # Verify: should handle error and return None
        self.assertIsNone(result)

    def test_fuzzing_round_with_ignore_list(self) -> None:
        # Test that a round started with a non-empty ignore list completes normally
        mock_setup = _MockSetup(self.inputs)
        mock_setup.configure_mocks(
            self.mock_data_gen, self.mock_model, self.mock_executor, self.mock_analyser
        )

        # Execute with ignore list
        ignore_list = [0, 1]
        result = self.fuzzer.fuzzing_round(self.test_case, self.inputs, ignore_list)

        # Verify
        self.assertIsNone(result)

    def test_fuzzing_round_empty_inputs(self) -> None:
        # Test fuzzing_round with empty input list
        empty_inputs: List[InputData] = []

        # With empty inputs, no violations should be checked
        self.mock_data_gen.generate_boosted.return_value = []
        self.mock_model.trace_test_case_with_taints.return_value = ([], [])
        self.mock_model.trace_test_case.return_value = []
        self.mock_executor.trace_test_case.return_value = []

        # Execute
        result = self.fuzzer.fuzzing_round(self.test_case, empty_inputs, [])

        # Verify: should complete without errors
        self.assertIsNone(result)
        # filter_violations should not be called with empty inputs
        self.mock_analyser.filter_violations.assert_not_called()

    def test_round_state_configuration(self) -> None:
        # Test _RoundState initialization with different model types

        # Test with speculative model
        state_spec = _RoundState(is_speculative=True)
        self.assertEqual(state_spec.model_nesting, CONF.model_min_nesting)
        self.assertEqual(state_spec.max_nesting, CONF.model_max_nesting)
        self.assertTrue(state_spec.enable_priming)
        self.assertTrue(state_spec.enable_fast_contract_tracing)

        # Test with non-speculative model
        state_non_spec = _RoundState(is_speculative=False)
        self.assertEqual(state_non_spec.model_nesting, 1)
        self.assertEqual(state_non_spec.max_nesting, 1)

    def test_round_manager_stage_execution_order(self) -> None:
        # Test that round manager executes stages in the correct order
        mock_setup = _MockSetup(self.inputs)
        mock_setup.configure_mocks(
            self.mock_data_gen, self.mock_model, self.mock_executor, self.mock_analyser
        )

        # Create round manager
        round_mgr = _RoundManager(self.fuzzer, self.test_case, self.inputs)

        # Execute stages
        round_mgr.execute_stage("fast")
        self.assertFalse(round_mgr.conf.is_initial)
        self.assertFalse(round_mgr.conf.record_stats)

        round_mgr.execute_stage("nesting")
        self.assertTrue(round_mgr.conf.reuse_boosts)
        self.assertTrue(round_mgr.conf.update_ignore_list)

        round_mgr.execute_stage("taint_mistake")
        self.assertTrue(round_mgr.conf.reuse_ctraces)

        round_mgr.finalize()


class FuzzerStartTest(unittest.TestCase):
    """Tests for start(), the top-level fuzzing loop of the Fuzzer"""

    def setUp(self) -> None:
        """Silence logging and build a Fuzzer whose components are all mocks"""
        self.orig_logging = CONF.logging_modes
        CONF.logging_modes = []
        update_logging_after_config_change()

        # Fixtures handed out by the mocked generators
        self.test_case = TestCaseProgram("test.asm")
        self.inputs = [InputData(), InputData()]

        # __new__ is used to bypass __init__ and the factory
        fuzzer = Fuzzer.__new__(Fuzzer)
        fuzzer.log = MagicMock()
        fuzzer.code_gen = MagicMock()
        fuzzer.data_gen = MagicMock()
        fuzzer.model = MagicMock()
        fuzzer.executor = MagicMock()
        fuzzer.analyser = MagicMock()
        fuzzer._work_dir = "/tmp/test"
        fuzzer._input_paths = []
        fuzzer._existing_test_case = ""

        # The generators always return the fixtures created above
        fuzzer.code_gen.create_test_case.return_value = self.test_case
        fuzzer.data_gen.generate.return_value = self.inputs
        self.fuzzer = fuzzer

    def tearDown(self) -> None:
        """Bring back the logging modes saved in setUp"""
        CONF.logging_modes = self.orig_logging
        update_logging_after_config_change()

    def _start(self, num_test_cases: int, nonstop: bool) -> bool:
        """Call start() with the arguments shared by all tests in this class"""
        return self.fuzzer.start(
            num_test_cases=num_test_cases,
            num_inputs=2,
            timeout=0,
            nonstop=nonstop,
            save_violations=False,
            type_="random")

    def test_start_no_violations_found(self) -> None:
        # start() reports False when no round ever returns a violation
        with patch.object(self.fuzzer, 'fuzzing_round', return_value=None):
            found = self._start(5, nonstop=False)

        self.assertFalse(found)

    def test_start_violation_found_stop(self) -> None:
        # With nonstop=False, start() reports True once a round returns a violation
        violation = _mk_violation()

        # The violation shows up on the second round
        rounds = [None, violation]
        with patch.object(self.fuzzer, 'fuzzing_round', side_effect=rounds):
            found = self._start(5, nonstop=False)

        self.assertTrue(found)

    def test_start_violation_found_nonstop(self) -> None:
        # With nonstop=True, start() keeps going after a violation and still reports True
        violation = _mk_violation()

        # One outcome per test case; violations on the first and the third round
        rounds = [violation, None, violation, None]
        with patch.object(self.fuzzer, 'fuzzing_round', side_effect=rounds):
            found = self._start(4, nonstop=True)

        self.assertTrue(found)


# Allow running this test module directly as a script
if __name__ == '__main__':
    unittest.main()


================================================
FILE: tests/unit_isa_loader.py
================================================
"""
Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
import unittest

import os
import tempfile

from rvzr.isa_spec import InstructionSet
from rvzr.instruction_spec import OT, InstructionSpec

# ISA spec fixture with two distinct instructions:
# - "test": control-flow instruction with a MEM and a REG operand plus implicit FLAGS
# - "test2": non-control-flow instruction with a single MEM operand
basic = """
[
{"name": "test", "category": "CATEGORY", "is_control_flow": true,
  "operands": [
    {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
    {"type_": "REG", "values": ["ax"], "src": true, "dest": false, "width": 16}
  ],
  "implicit_operands": [
    {"type_": "FLAGS", "values": ["w", "r", "undef", "w", "w", "", "", "", "w"],
     "src": false, "dest": false, "width": 0}
  ]
},
{"name": "test2", "category": "CATEGORY", "is_control_flow": false,
  "operands": [
    {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16}
  ],
  "implicit_operands": []
}
]
"""

# ISA spec fixture that contains the same instruction definition twice;
# used to check that identical entries are deduplicated by the loader
duplicate = """
[
{"name": "test", "category": "CATEGORY", "is_control_flow": false,
  "operands": [
    {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16}
  ],
  "implicit_operands": []
},
{"name": "test", "category": "CATEGORY", "is_control_flow": false,
  "operands": [
    {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16}
  ],
  "implicit_operands": []
}
]
"""


class InstructionSetParserTest(unittest.TestCase):
    """Tests for loading a JSON ISA specification into an InstructionSet"""

    def _load_spec(self, json_text: str) -> InstructionSet:
        """
        Write `json_text` into a temporary file and load it as an InstructionSet.

        The file is written through a single handle that is closed before the loader
        opens it, and its removal is registered as a test cleanup, so the file is
        deleted even when loading or a later assertion fails.

        :param json_text: contents of the ISA specification file
        :return: the instruction set loaded from the file
        """
        with tempfile.NamedTemporaryFile("w", delete=False) as spec_file:
            # Register the cleanup first so that a failed write does not leak the file
            self.addCleanup(os.unlink, spec_file.name)
            spec_file.write(json_text)
        return InstructionSet(spec_file.name)

    def test_parsing(self) -> None:
        # Load the two-instruction fixture and check every field of the first instruction
        instruction_set = self._load_spec(basic)

        spec: InstructionSpec = instruction_set.instructions[0]
        self.assertEqual(spec.name, "test")
        self.assertEqual(spec.category, "CATEGORY")
        self.assertEqual(spec.has_mem_operand, True)
        self.assertEqual(spec.has_write, True)
        self.assertEqual(spec.is_control_flow, True)

        # Explicit operands: a read-write MEM followed by a read-only REG
        self.assertEqual(len(spec.operands), 2)
        op1 = spec.operands[0]
        self.assertEqual(op1.type, OT.MEM)
        self.assertEqual(op1.width, 16)
        self.assertEqual(op1.src, True)
        self.assertEqual(op1.dest, True)

        op2 = spec.operands[1]
        self.assertEqual(op2.type, OT.REG)
        self.assertEqual(op2.values, ("ax",))
        self.assertEqual(op2.src, True)
        self.assertEqual(op2.dest, False)

        # Implicit operands: a single FLAGS operand
        self.assertEqual(len(spec.implicit_operands), 1)
        flags = spec.implicit_operands[0]
        self.assertEqual(flags.type, OT.FLAGS)
        self.assertEqual(flags.values, ('w', 'r', 'undef', 'w', 'w', '', '', '', 'w'))

    def test_dedup_identical(self) -> None:
        # Two identical definitions in the file must end up as a single instruction
        instruction_set = self._load_spec(duplicate)

        self.assertEqual(len(instruction_set.instructions), 1, "No deduplication")


================================================
FILE: tests/unit_stats.py
================================================
"""
File: Unit tests for stats.py

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
# pylint: disable=missing-function-docstring  # no need in tests
# pylint: disable=missing-class-docstring  # no need in tests

import unittest

from rvzr.stats import FuzzingStats


class StatsTest(unittest.TestCase):

    def test_borg(self) -> None:
        # A value written through one instance must be readable through another one
        writer = FuzzingStats()
        writer.test_cases = 1
        reader = FuzzingStats()
        self.assertEqual(reader.test_cases, 1)

    def test_str(self) -> None:
        # Set the counters one by one and check that each shows up in the string form
        stats = FuzzingStats()
        steps = (
            ("test_cases", 1, "Test Cases: 1"),
            ("num_inputs", 2, "Inputs per test case: 2.0"),
            ("violations", 3, "Violations: 3"),
        )
        for counter, value, expected_fragment in steps:
            setattr(stats, counter, value)
            self.assertIn(expected_fragment, str(stats))

    def test_get_brief(self) -> None:
        stats = FuzzingStats()

        # With no test cases the brief summary is empty
        stats.test_cases = 0
        self.assertEqual(stats.get_brief(), "")

        # Populate every counter that is assigned in this test with a distinct value
        counters = {
            "test_cases": 1,
            "eff_classes": 2,
            "single_entry_classes": 3,
            "analysed_test_cases": 4,
            "num_inputs": 5,
            "executor_reruns": 6,
            "spec_filter": 7,
            "observ_filter": 8,
            "fast_path": 9,
            "fp_nesting": 10,
            "fp_taint_mistakes": 11,
            "fp_early_priming": 12,
            "fp_large_sample": 13,
            "fp_priming": 14,
            "violations": 15,
        }
        for counter, value in counters.items():
            setattr(stats, counter, value)

        self.assertEqual(
            stats.get_brief(),
            "Cls:0/1,In:5,R:1,SF:7,OF:8,Fst:9,CN:10,CT:11,P1:12,CS:13,P2:14,V:15")

        # Only the class summary changes when no test case has been analysed
        stats.analysed_test_cases = 0
        self.assertEqual(
            stats.get_brief(),
            "Cls:0/0,In:5,R:1,SF:7,OF:8,Fst:9,CN:10,CT:11,P1:12,CS:13,P2:14,V:15")


================================================
FILE: tests/unit_tc_components.py
================================================
"""
File: Selection of unit tests for the data container classes

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
# pylint: disable=missing-function-docstring  # no need in tests
# pylint: disable=missing-class-docstring  # no need in tests

import os
import random
import unittest
from unittest.mock import MagicMock

import tempfile
import numpy as np

from rvzr.tc_components.actor import Actor, ActorMode, ActorPL
from rvzr.tc_components.test_case_code import CodeSection, TestCaseProgram, BasicBlock, Function
from rvzr.tc_components.test_case_binary import TestCaseBinary, SymbolTableEntry
from rvzr.tc_components.test_case_data import InputData, _ACTOR_DATA_SIZE
from rvzr.instruction_spec import InstructionSpec, OperandSpec, OT
from rvzr.tc_components.instruction import Instruction, Operand, \
    copy_op_with_flow_modification, copy_op_with_value_modification, copy_inst_with_modification, \
    RegisterOp, MemoryOp, ImmediateOp, LabelOp, AgenOp, CondOp, \
    FlagsOp
from rvzr.config import ActorConf


def _get_dummy_actor_dict() -> ActorConf:
    """
    Build a fresh actor configuration for a non-observer host/kernel actor
    named 'test_actor', with non-randomized, user-accessible data pages
    and empty blocklists.
    """
    page_properties = {'randomized': False, 'user': True}
    return {
        'mode': 'host',
        'privilege_level': 'kernel',
        'name': 'test_actor',
        # Each property entry gets its own copy so that tests can modify one independently
        'data_properties': dict(page_properties),
        'data_ept_properties': dict(page_properties),
        'observer': False,
        "instruction_blocklist": set(),
        "fault_blocklist": set(),
    }


def _get_mock_target_desc() -> MagicMock:
    mock_td = MagicMock()
    mock_td.pte_bits = {'user': (0, False)}
    mock_td.vm_pte_bits = {'user': (0, False)}
    mock_td.page_property_to_pte_bit_name = {
        "user": ("user", False),
    }
    mock_td.page_property_to_vm_pte_bit_name = {
        "user": ("user", False),
    }
    return mock_td


class ActorTest(unittest.TestCase):

    def test_dict_constructor(self) -> None:
        target_desc = _get_mock_target_desc()

        # Host/kernel actor
        actor_dict = _get_dummy_actor_dict()
        actor = Actor.from_dict(actor_dict, target_desc)
        self.assertEqual(actor.mode, ActorMode.HOST)
        self.assertEqual(actor.privilege_level, ActorPL.KERNEL)
        self.assertEqual(actor.name, 'test_actor')
        self.assertFalse(actor.observer)

        # Guest/user actor
        actor_dict['mode'] = 'guest'
        actor_dict['privilege_level'] = 'user'
        actor = Actor.from_dict(actor_dict, target_desc)
        self.assertEqual(actor.mode, ActorMode.GUEST)
        self.assertEqual(actor.privilege_level, ActorPL.USER)

        # Each invalid field is checked on an otherwise valid configuration, so that
        # the expected error can only be caused by the field under test
        bad_pl_dict = _get_dummy_actor_dict()
        bad_pl_dict['privilege_level'] = 'invalid_pl'
        with self.assertRaises(ValueError):
            _ = Actor.from_dict(bad_pl_dict, target_desc)

        bad_mode_dict = _get_dummy_actor_dict()
        bad_mode_dict['mode'] = 'invalid_mode'
        with self.assertRaises(ValueError):
            _ = Actor.from_dict(bad_mode_dict, target_desc)

    def test_create_main(self) -> None:
        # The main actor is a host/kernel actor named "main"
        main_actor = Actor.create_main()

        self.assertEqual(main_actor.mode, ActorMode.HOST)
        self.assertEqual(main_actor.privilege_level, ActorPL.KERNEL)
        self.assertEqual(main_actor.name, "main")

    def test_get_id(self) -> None:
        actor = Actor.from_dict(_get_dummy_actor_dict(), _get_mock_target_desc())
        section = CodeSection(actor)

        # Before ELF data is assigned to the section, get_id must fail an assertion
        with self.assertRaises(AssertionError):
            actor.get_id()

        # After the assignment, get_id returns the ID given to the section
        section.assign_elf_data(offset=0, size=0, id_=42)
        self.assertEqual(actor.get_id(), 42)

    def test_is_main(self) -> None:
        actor_dict = _get_dummy_actor_dict()
        target_desc = _get_mock_target_desc()

        # Only an actor named 'main' is the main actor
        actor_dict['name'] = 'main'
        main_actor = Actor.from_dict(actor_dict, target_desc)
        self.assertTrue(main_actor.is_main)

        actor_dict['name'] = 'non_main_actor'
        non_main_actor = Actor.from_dict(actor_dict, target_desc)
        self.assertFalse(non_main_actor.is_main)

    def test_pte_constructor(self) -> None:
        actor_dict = _get_dummy_actor_dict()
        target_desc = _get_mock_target_desc()

        # Non-randomized properties with 'user' unset
        actor_dict['data_properties'] = {'randomized': False, 'user': False}
        actor_dict['data_ept_properties'] = {'randomized': False, 'user': False}
        actor = Actor.from_dict(actor_dict, target_desc)
        self.assertEqual(actor.data_properties, 0)
        self.assertEqual(actor.data_ept_properties, 0)

        # Randomized properties: the expected values below are tied to this seed.
        # The global RNG state is put back afterwards so that seeding here
        # does not influence tests that run later
        actor_dict['data_properties'] = {'randomized': True, 'user': True}
        actor_dict['data_ept_properties'] = {'randomized': True, 'user': True}
        self.addCleanup(random.setstate, random.getstate())
        random.seed(52)

        actor = Actor.from_dict(actor_dict, target_desc)
        self.assertEqual(actor.data_properties, 1)
        self.assertEqual(actor.data_ept_properties, 0)


class InstructionSpecTest(unittest.TestCase):

    def test_OT_str(self) -> None:
        # Every operand type is printed as its own name
        expected_names = (
            (OT.REG, "REG"),
            (OT.MEM, "MEM"),
            (OT.IMM, "IMM"),
            (OT.LABEL, "LABEL"),
            (OT.AGEN, "AGEN"),
            (OT.FLAGS, "FLAGS"),
            (OT.COND, "COND"),
        )
        for operand_type, name in expected_names:
            self.assertEqual(str(operand_type), name)

    def test_operand_str(self) -> None:
        # The values are printed as a comma-separated list in parentheses
        with_values = OperandSpec(values=['rax', 'rbx'], type_=OT.REG, src=True, dest=False)
        self.assertEqual(str(with_values), "(rax, rbx)")

        # No values -> empty parentheses
        without_values = OperandSpec(values=[], type_=OT.REG, src=True, dest=False)
        self.assertEqual(str(without_values), "()")

    def test_instruction_spec_str(self) -> None:
        # The instruction name is followed by the string form of each operand
        spec = InstructionSpec(name='MOV', category='MOV')
        spec.operands.append(
            OperandSpec(values=['rax', 'rbx'], type_=OT.REG, src=True, dest=False))

        self.assertEqual(str(spec), "MOV (rax, rbx) ")

    def test_instruction_spec_hash(self) -> None:
        # The hash of a spec must equal the hash of its string form
        spec = InstructionSpec(name='MOV', category='MOV')
        spec.operands.append(
            OperandSpec(values=['rax', 'rbx'], type_=OT.REG, src=True, dest=False))

        self.assertEqual(hash(spec), hash(str(spec)))


class OperandTest(unittest.TestCase):

    def test_operand_from_spec(self) -> None:
        all_types = [OT.REG, OT.MEM, OT.IMM, OT.LABEL, OT.AGEN, OT.FLAGS, OT.COND]
        for type_ in all_types:
            # FLAGS is the odd one out: its spec holds nine per-flag values, the operand
            # built from it is expected to have the value "flags", and it is not a source
            is_flags = type_ == OT.FLAGS
            spec_values = [""] * 9 if is_flags else ["val"]
            expected_value = "flags" if is_flags else "val"
            is_src = not is_flags

            spec = OperandSpec(values=spec_values, type_=type_, src=is_src, dest=False, width=8)
            operand = Operand.from_fixed_spec(spec)

            self.assertEqual(operand.value, expected_value)
            self.assertEqual(operand.src, is_src)
            self.assertFalse(operand.dest)

    def test_flag_print(self) -> None:
        # Nine empty flag values still print the full list of flag names
        no_flags_used = FlagsOp(("",) * 9)
        self.assertEqual(str(no_flags_used), "FLAGS: CF|PF|AF|ZF|SF|TF|IF|DF|OF")

    def test_flag_accessors(self) -> None:
        # Flag order: ("CF", "PF", "AF", "ZF", "SF", "TF", "IF", "DF", "OF")
        flags = FlagsOp(("w", "r", "r/w", "r/cw", "undef", "", "", "", ""))

        expected_by_type = (
            ("read", ["PF", "AF", "ZF"]),
            ("write", ["CF", "AF", "ZF"]),
            ("overwrite", ["CF"]),
            ("undef", ["SF"]),
        )
        for access_type, flag_names in expected_by_type:
            self.assertEqual(flags.get_flags_by_type(access_type), flag_names)

    def test_operand_copy_methods(self) -> None:
        reg_op = RegisterOp("rax", 64, True, False)
        mem_op = MemoryOp("0x0", 64, True, False)
        all_ops = (
            reg_op,
            mem_op,
            ImmediateOp("0x0", 64),
            LabelOp("label"),
            AgenOp("0x0", 64),
            CondOp("cond"),
        )
        flow_ops = (reg_op, mem_op)

        # Changing the value must keep the data-flow attributes
        for original in all_ops:
            copied = copy_op_with_value_modification(original, "new_val")  # type: ignore
            self.assertEqual(copied.value, "new_val")
            self.assertEqual(copied.src, original.src)
            self.assertEqual(copied.dest, original.dest)

        # Clearing `src` must keep everything else
        for original in flow_ops:
            copied = copy_op_with_flow_modification(original, src=False)  # type: ignore
            self.assertFalse(copied.src)
            self.assertEqual(copied.dest, original.dest)
            self.assertEqual(copied.value, original.value)
            self.assertEqual(copied.width, original.width)  # type: ignore

        # Setting `dest` must keep everything else
        for original in flow_ops:
            copied = copy_op_with_flow_modification(original, dest=True)  # type: ignore
            self.assertTrue(copied.dest)
            self.assertEqual(copied.src, original.src)
            self.assertEqual(copied.value, original.value)
            self.assertEqual(copied.width, original.width)  # type: ignore


class InstructionTest(unittest.TestCase):
    """ Unit tests for the Instruction class and for copy_inst_with_modification """

    def test_instruction_from_spec(self) -> None:
        # Build a spec that carries a single register operand
        spec = InstructionSpec(name='MOV', category='MOV')
        spec.operands.append(
            OperandSpec(values=['rax', 'rbx'], type_=OT.REG, src=True, dest=False))

        # Instantiate an instruction from the spec
        inst = Instruction.from_spec(spec)

        # Name and category match the spec; every boolean attribute is unset
        self.assertEqual(inst.name, 'MOV')
        self.assertEqual(inst.category, 'MOV')
        self.assertFalse(inst.is_control_flow)
        self.assertFalse(inst.is_instrumentation)
        self.assertFalse(inst.is_noremove)
        self.assertFalse(inst.is_from_template)

        # Operands are generated separately, so both operand lists are still empty
        self.assertEqual(len(inst.operands), 0)
        self.assertEqual(len(inst.implicit_operands), 0)

    def test_instruction_str(self) -> None:
        # An instruction with one explicit register operand
        inst = Instruction("MOV", "MOV")
        inst.operands.append(RegisterOp("rax", 64, True, False))

        # The string form is the name followed by the operand
        self.assertEqual(str(inst), "MOV rax")

    def test_instr_add_op(self) -> None:
        explicit_op = RegisterOp("rax", 64, True, False)
        implicit_op = RegisterOp("rbx", 64, True, False)
        inst = Instruction("MOV", "MOV")

        # By default, add_op stores the operand in the explicit list
        inst = inst.add_op(explicit_op)
        self.assertEqual(len(inst.operands), 1)
        self.assertEqual(inst.operands[0], explicit_op)

        # With implicit=True, the operand goes to the implicit list instead
        inst = inst.add_op(implicit_op, implicit=True)
        self.assertEqual(len(inst.implicit_operands), 1)
        self.assertEqual(inst.implicit_operands[0], implicit_op)

    def test_instr_properties(self) -> None:
        # Case 1: only a register operand, hence no memory access of any kind
        inst = Instruction("MOV", "MOV")
        inst.operands.append(RegisterOp("rax", 64, True, False))

        self.assertFalse(inst.has_mem_operand(include_implicit=True))
        self.assertFalse(inst.has_write(include_implicit=True))
        self.assertFalse(inst.has_read(include_implicit=True))

        # Cases 2-5: a single memory operand that is either read or written,
        # and that is attached either explicitly or implicitly
        scenarios = [
            ("explicit read", True, False, False),
            ("explicit write", False, True, False),
            ("implicit read", True, False, True),
            ("implicit write", False, True, True),
        ]
        for label, is_src, is_dest, is_implicit in scenarios:
            inst = Instruction("MOV", "MOV")
            mem_op = MemoryOp("0x0", 64, is_src, is_dest)
            if is_implicit:
                inst.implicit_operands.append(mem_op)
            else:
                inst.operands.append(mem_op)

            # An implicit operand is visible only when implicit operands are included
            self.assertEqual(
                bool(inst.has_mem_operand(include_implicit=False)), not is_implicit, label)
            self.assertTrue(inst.has_mem_operand(include_implicit=True), label)
            self.assertEqual(bool(inst.has_write(include_implicit=True)), is_dest, label)
            self.assertEqual(bool(inst.has_read(include_implicit=True)), is_src, label)

    def test_operand_accessors(self) -> None:
        # One operand of every kind; the memory operand is both a source and a destination
        reg_op = RegisterOp("rax", 64, True, False)
        mem_op = MemoryOp("0x0", 64, True, True)
        imm_op = ImmediateOp("0x0", 64)
        label_op = LabelOp("label")
        agen_op = AgenOp("0x0", 64)
        cond_op = CondOp("cond")
        flags_op = FlagsOp(("", "", "", "", "", "", "", "", ""))

        # Case 1: all operands are explicit
        inst = Instruction("MOV", "MOV")
        inst.operands.extend([reg_op, mem_op, imm_op, label_op, agen_op, cond_op, flags_op])

        self.assertEqual(
            inst.get_all_operands(),
            [reg_op, mem_op, imm_op, label_op, agen_op, cond_op, flags_op])
        self.assertEqual(
            inst.get_src_operands(),
            [reg_op, mem_op, imm_op, label_op, agen_op, cond_op])
        self.assertEqual(inst.get_dest_operands(), [mem_op])
        self.assertEqual(inst.get_mem_operands(), [mem_op])
        self.assertEqual(inst.get_flags_operand(), flags_op)
        self.assertEqual(inst.get_reg_operands(), [reg_op])
        self.assertEqual(inst.get_cond_operand(), cond_op)
        self.assertEqual(inst.get_label_operand(), label_op)
        self.assertEqual(inst.get_imm_operands(), [imm_op])

        # Case 2: all operands are implicit (no label and no condition this time);
        # the filtered accessors return them only when include_implicit=True
        inst = Instruction("MOV", "MOV")
        inst.implicit_operands.extend([reg_op, mem_op, imm_op, agen_op, flags_op])

        self.assertEqual(
            inst.get_all_operands(), [reg_op, mem_op, imm_op, agen_op, flags_op])
        self.assertEqual(inst.get_src_operands(), [])
        self.assertEqual(
            inst.get_src_operands(include_implicit=True),
            [reg_op, mem_op, imm_op, agen_op])
        self.assertEqual(inst.get_dest_operands(), [])
        self.assertEqual(inst.get_dest_operands(include_implicit=True), [mem_op])
        self.assertEqual(inst.get_mem_operands(), [])
        self.assertEqual(inst.get_mem_operands(include_implicit=True), [mem_op])
        self.assertEqual(inst.get_flags_operand(), flags_op)
        self.assertEqual(inst.get_reg_operands(), [])
        self.assertEqual(inst.get_reg_operands(include_implicit=True), [reg_op])
        self.assertEqual(inst.get_cond_operand(), None)
        self.assertEqual(inst.get_label_operand(), None)
        self.assertEqual(inst.get_imm_operands(), [])
        self.assertEqual(inst.get_imm_operands(include_implicit=True), [imm_op])

        # Case 3: an instruction without any operands
        inst = Instruction("MOV", "MOV")

        self.assertEqual(inst.get_all_operands(), [])
        self.assertEqual(inst.get_src_operands(True), [])
        self.assertEqual(inst.get_dest_operands(True), [])
        self.assertEqual(inst.get_mem_operands(True), [])
        self.assertEqual(inst.get_flags_operand(), None)
        self.assertEqual(inst.get_reg_operands(True), [])

    def test_copy_with_modification(self) -> None:
        # pylint: disable=protected-access

        # Source instruction: boolean attributes cleared, private metadata set to 1
        source = Instruction(
            "MOV", "MOV", is_control_flow=False, is_instrumentation=False, is_noremove=False)
        source.is_from_template = True
        source._section_id = 1
        source._section_offset = 1
        source._line_num = 1
        source._size = 1

        # A single explicit operand
        reg_op = RegisterOp("rax", 64, True, False)
        source.operands.append(reg_op)

        # Copy without overrides: every checked attribute equals the source's
        plain_copy = copy_inst_with_modification(source)
        self.assertEqual(plain_copy.name, "MOV")
        self.assertEqual(plain_copy.category, "MOV")
        self.assertFalse(plain_copy.is_control_flow)
        self.assertFalse(plain_copy.is_instrumentation)
        self.assertFalse(plain_copy.is_noremove)
        self.assertTrue(plain_copy.is_from_template)
        self.assertEqual(plain_copy._section_id, 1)
        self.assertEqual(plain_copy._section_offset, 1)
        self.assertEqual(plain_copy._line_num, 1)
        self.assertEqual(plain_copy._size, 1)
        self.assertEqual(plain_copy.operands, [reg_op])

        # Copy with overrides: the overridden attributes change, the rest is carried over
        modified_copy = copy_inst_with_modification(
            source,
            name="NOP",
            category="NOP",
            is_control_flow=True,
            is_instrumentation=True,
            is_noremove=True)
        self.assertEqual(modified_copy.name, "NOP")
        self.assertEqual(modified_copy.category, "NOP")
        self.assertTrue(modified_copy.is_control_flow)
        self.assertTrue(modified_copy.is_instrumentation)
        self.assertTrue(modified_copy.is_noremove)
        self.assertTrue(modified_copy.is_from_template)
        self.assertEqual(modified_copy._section_id, 1)
        self.assertEqual(modified_copy._section_offset, 1)
        self.assertEqual(modified_copy._line_num, 1)
        self.assertEqual(modified_copy._size, 1)
        self.assertEqual(modified_copy.operands, [reg_op])

    def test_line_num_interface(self) -> None:
        # pylint: disable=protected-access

        # Querying the line number before it is assigned trips an assertion
        inst = Instruction("MOV", "MOV")
        with self.assertRaises(AssertionError):
            inst.line_num()

        # Once the private field is set, the accessor returns it
        inst._line_num = 10
        self.assertEqual(inst.line_num(), 10)


class TestCaseBinaryTest(unittest.TestCase):
    """ Unit tests for the TestCaseBinary class """

    def test_get_macro_offset(self) -> None:
        # A binary object with an empty path, wrapping an empty program
        binary = TestCaseBinary("", TestCaseProgram(""))

        # Looking up a macro before ELF data is assigned trips an assertion
        with self.assertRaises(AssertionError):
            binary.get_macro_offset(1)

        # Symbol table with one entry per macro type: type 1 at offset 1, type 2 at offset 10
        symbols = [
            SymbolTableEntry(sid=0, offset=1, type_=1, arg=0),
            SymbolTableEntry(sid=0, offset=10, type_=2, arg=0),
        ]
        binary.assign_elf_data(symbols, MagicMock())

        # Known macro types resolve to the offset of the matching symbol
        self.assertEqual(binary.get_macro_offset(1), 1)
        self.assertEqual(binary.get_macro_offset(2), 10)

        # A macro type without a symbol yields -1
        self.assertEqual(binary.get_macro_offset(3), -1)


class TestCaseCodeTest(unittest.TestCase):
    """ Unit tests for the BasicBlock class """

    def test_basic_block_str(self) -> None:
        # The string form of a basic block is its name
        block = BasicBlock("bb1", MagicMock())
        self.assertEqual(str(block), "bb1")

    def test_basic_block_get_owner(self) -> None:
        # Ownership chain: actor -> code section -> function -> basic block
        main_actor = Actor.create_main()
        parent_func = Function("func1", CodeSection(main_actor))
        owned_bb = BasicBlock("bb1", parent_func)

        self.assertEqual(owned_bb.get_owner(), main_actor)

        # A basic block without a parent function cannot resolve its owner
        orphan_bb = BasicBlock("bb1", None)
        with self.assertRaises(AssertionError):
            orphan_bb.get_owner()


class InputDataTest(unittest.TestCase):
    """ Unit tests for the InputData class """

    def _make_temp_file(self, content: bytes = b"") -> str:
        """
        Create a closed temporary file holding `content`.

        The file is removed when the test finishes, whether it passes or fails.

        :param content: bytes written into the file (empty by default)
        :return: path to the created file
        """
        with tempfile.NamedTemporaryFile(delete=False) as f:
            f.write(content)
            path = f.name
        # Register the removal right away so that a failing assertion cannot leak the file
        self.addCleanup(os.unlink, path)
        return path

    def test_data_sizes(self) -> None:
        # Test data_size_per_actor
        self.assertEqual(InputData.data_size_per_actor(), _ACTOR_DATA_SIZE)

        # Test n_data_entries_per_actor: the data size divided into 8-byte entries
        self.assertEqual(InputData.n_data_entries_per_actor(), _ACTOR_DATA_SIZE // 8)

    def test_hash(self) -> None:
        # The hash of an input equals the hash of its byte representation
        input_data = InputData(1)
        self.assertEqual(hash(input_data), hash(input_data.tobytes()))

    def test_str(self) -> None:
        # Both `str` and `repr` print the seed
        input_data = InputData(1)
        input_data.seed = 42
        self.assertEqual(str(input_data), "42")
        self.assertEqual(repr(input_data), "42")

    def test_set_actor_data(self) -> None:
        input_data = InputData(1)

        # Data with an invalid shape is rejected
        data = np.zeros((1,), dtype=np.uint64)
        with self.assertRaises(AssertionError):
            input_data.set_actor_data(0, data)

        # Data with one uint64 per 8 bytes of an item is accepted
        data = np.full(input_data.itemsize // 8, 42, dtype=np.uint64)
        input_data.set_actor_data(0, data)
        self.assertEqual(input_data[0]["main"][0], 42)

    def test_save(self) -> None:
        # Fill the input of actor 0 with a recognizable value
        input_data = InputData(1)
        data = np.full(input_data.itemsize // 8, 42, dtype=np.uint64)
        input_data.set_actor_data(0, data)

        # Save the input data into a temporary file (removed automatically after the test)
        path = self._make_temp_file()
        input_data.save(path)

        # Check the contents of the binary file
        contents = np.fromfile(path, dtype=np.uint64)
        self.assertEqual(contents[0], 42)

    def test_load(self) -> None:
        input_data = InputData(1)

        # Prepare a temporary binary file (removed automatically after the test)
        data = np.full(input_data.itemsize // 8, 42, dtype=np.uint64)
        path = self._make_temp_file(data.tobytes())

        # Load the input data from the binary file
        input_data.load(path)
        self.assertEqual(input_data[0]["main"][0], 42)

    def test_linear_view(self) -> None:
        input_data = InputData(1)
        data = np.full(input_data.itemsize // 8, 42, dtype=np.uint64)
        input_data.set_actor_data(0, data)

        # Get the linear view of the input for the actor
        linear_view = input_data.linear_view(0)

        # The view is one-dimensional, with one entry per 8 bytes of an item
        self.assertEqual(linear_view.shape, (input_data.itemsize // 8,))

        # The view exposes the data that was set above
        self.assertEqual(linear_view[0], 42)


================================================
FILE: tests/unit_traces.py
================================================
"""
File: Collection of unit tests for rvzr/traces.py

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""

# Note: We relax the pylint rules in unit tests to allow for more introspection, and also
#       because test readability is less critical.
# pylint: disable=missing-function-docstring,missing-class-docstring,too-many-public-methods

from __future__ import annotations

import unittest
import unittest.mock
import xxhash
import numpy as np

from rvzr.traces import CTraceEntry, CTrace, HTrace, RawHTraceSample, HardwareEqClass, \
    TraceBundle, ContractEqClass, Violation
from rvzr.tc_components.test_case_data import InputData, InputID
from rvzr.tc_components.test_case_code import TestCaseProgram


class TestCTrace(unittest.TestCase):
    """ Unit tests for CTrace and related classes """

    def test_empty_constructor(self) -> None:
        # `empty_trace` returns a CTrace that is empty and equal to a trace with no entries
        empty = CTrace.empty_trace()
        self.assertIsInstance(empty, CTrace)
        self.assertTrue(empty.is_empty())
        self.assertEqual(empty, CTrace([]))

    def test_str(self) -> None:
        # `__str__`, case 1: by default, the trace prints as the xxh64 hash (seed 0)
        # of the stringified list of its values
        values = [0x0, 0x100]
        trace = CTrace([CTraceEntry("val", value) for value in values])
        expected_hash = xxhash.xxh64(str(values), seed=0).intdigest()
        self.assertEqual(str(trace), str(expected_hash))

        # `__str__`, case 2: after `set_printed_as_l1d(True)`, the trace prints as an L1D map
        trace.set_printed_as_l1d(True)
        expected_map = '^...^...........................................................'
        self.assertEqual(str(trace), expected_map)

    def test_full_str(self) -> None:
        # `full_str`: one entry of every type, all with the value 0
        trace = CTrace([
            CTraceEntry("mem", 0),
            CTraceEntry("pc", 0),
            CTraceEntry("ind", 0),
            CTraceEntry("val", 0),
            CTraceEntry("reg", 0),
        ])
        m_col, pc_col, val_col, reset_col = "m|", "p|", "v|", "r|"

        # 1. Explicit colors; the register name differs between x86 and ARM
        colored_variants = [
            "[mem: m|0x0r|, pc: p|0x0r|, indcall: p|0x0r|, val: v|0x0r|, rsi: 0x0r|]",
            "[mem: m|0x0r|, pc: p|0x0r|, indcall: p|0x0r|, val: v|0x0r|, x4: 0x0r|]",
        ]
        colored = trace.full_str(m_col, pc_col, val_col, reset_col)
        self.assertIn(colored, colored_variants)

        # 2. Default colors
        plain_variants = [
            "[mem: 0x0, pc: 0x0, indcall: 0x0, val: 0x0, rsi: 0x0]",
            "[mem: 0x0, pc: 0x0, indcall: 0x0, val: 0x0, x4: 0x0]",
        ]
        self.assertIn(trace.full_str(), plain_variants)

        # 3. Colors without the reset sequence are rejected
        with self.assertRaises(AssertionError):
            trace.full_str("m|", "p|", "v|")

    def test_default_methods(self) -> None:
        # Default methods: `__eq__`, `__lt__`, `__gt__`, `__len__`, `__hash__`
        entries = [CTraceEntry("val", i) for i in range(5)]
        base = CTrace(entries)
        twin = CTrace(entries)
        other = CTrace([CTraceEntry("val", 10)])

        # __eq__: equal entries compare equal; comparison with a non-trace is an error
        self.assertEqual(base, twin)
        self.assertNotEqual(base, other)
        with self.assertRaises(NotImplementedError):
            _ = base == "not a trace"

        # __lt__ and __gt__: equal traces are ordered neither way
        self.assertFalse(base < twin)
        self.assertFalse(base > twin)

        # __len__
        self.assertEqual(len(base), 5)

        # __hash__
        self.assertEqual(hash(base), hash(twin))
        self.assertNotEqual(hash(base), hash(other))

    def test_accessors(self) -> None:
        # Accessors: `get_untyped`, `get_typed`, `is_empty`
        entries = [CTraceEntry("val", i) for i in range(5)]
        trace = CTrace(entries)

        # get_untyped: the bare values, in order
        self.assertEqual(trace.get_untyped(), [0, 1, 2, 3, 4])

        # get_typed: the entries the trace was built from
        self.assertEqual(trace.get_typed(), entries)

        # is_empty
        self.assertFalse(trace.is_empty())
        self.assertTrue(CTrace.empty_trace().is_empty())


class TestHTrace(unittest.TestCase):
    """ Unit tests for HTrace and related classes """

    def test_empty_constructor(self) -> None:
        # `empty_trace` returns an HTrace that is empty and equal to a trace with no samples
        empty = HTrace.empty_trace()
        self.assertIsInstance(empty, HTrace)
        self.assertTrue(empty.is_empty())
        self.assertEqual(empty, HTrace(np.ndarray(0, dtype=RawHTraceSample)))

    def test_invalid_constructor(self) -> None:
        # `invalid_trace` returns an HTrace flagged as corrupted or ignored
        invalid = HTrace.invalid_trace()
        self.assertIsInstance(invalid, HTrace)
        self.assertTrue(invalid.is_corrupted_or_ignored())

    def test_printers(self) -> None:
        # `__str__`: the xxh64 hash (seed 0) of the stringified 'trace' column
        samples = np.array([(0x100, 0, 0, 0, 0, 0)], dtype=RawHTraceSample)
        expected_hash = xxhash.xxh64(str(samples['trace']), seed=0).intdigest()
        self.assertEqual(str(HTrace(samples)), str(expected_hash))

        # `full_str` of an empty trace is an empty string
        self.assertEqual(HTrace.empty_trace().full_str(), "")

        # `full_str` of a cache trace
        cache_samples = np.array([(0b10001, 0, 0, 0, 0, 0)], dtype=RawHTraceSample)
        cache_str = HTrace(cache_samples, "cache").full_str()
        self.assertEqual(
            cache_str,
            "...........................................................^...^ [1]\n")

        # `full_str` of a TSC trace
        tsc_samples = np.array([(256, 0, 0, 0, 0, 0)], dtype=RawHTraceSample)
        tsc_str = HTrace(tsc_samples, "tsc").full_str()
        self.assertEqual(tsc_str, "00000256 [1]\n")

        # `full_str` of an architectural trace; register names differ between x86 and ARM
        reg_samples = np.array([(0x1, 0x2, 0x3, 0x4, 0x5, 0x6)], dtype=RawHTraceSample)
        reg_str = HTrace(reg_samples, "reg").full_str()
        reg_variants = [
            "[rax: 0x1, rbx: 0x2, rcx: 0x3, rdx: 0x4, rsi: 0x5, rdi: 0x6]",
            "[x0: 0x1, x1: 0x2, x2: 0x3, x3: 0x4, x4: 0x5, x5: 0x6]",
        ]
        self.assertIn(reg_str, reg_variants)

    def test_pair_printers(self) -> None:
        # `full_pair_str` of two cache traces
        left = HTrace(np.array([(0b10001, 0, 0, 0, 0, 0)], dtype=RawHTraceSample), "cache")
        right = HTrace(np.array([(0b10010, 0, 0, 0, 0, 0)], dtype=RawHTraceSample), "cache")
        expected = (
            "...........................................................^...^"
            " | 1      | 0     |\n"
            "...........................................................^..^."
            " | 0      | 1     |\n"
        )
        self.assertEqual(left.full_pair_str(right), expected)

        # `full_pair_str` of two TSC traces
        left = HTrace(np.array([(256, 0, 0, 0, 0, 0)], dtype=RawHTraceSample), "tsc")
        right = HTrace(np.array([(512, 0, 0, 0, 0, 0)], dtype=RawHTraceSample), "tsc")
        expected = (
            "00000256 | 1      | 0      |\n"
            "00000512 | 0      | 1      |\n"
        )
        self.assertEqual(left.full_pair_str(right), expected)

        # `full_pair_str` of two architectural traces
        left = HTrace(np.array([(0x1, 0x2, 0x3, 0x4, 0x5, 0x6)], dtype=RawHTraceSample), "reg")
        right = HTrace(np.array([(0x7, 0x8, 0x9, 0xa, 0xb, 0xc)], dtype=RawHTraceSample), "reg")
        # FIXME: the assert below is not meaningful; it exists only to satisfy the coverage tool
        with self.assertRaises(NotImplementedError):
            left.full_pair_str(right)

    def test_default_methods(self) -> None:
        # Default methods: `__eq__`, `__len__`, `__hash__`
        base = HTrace(np.array([(0x100, 0, 0, 0, 0, 0)], dtype=RawHTraceSample), "cache")
        twin = HTrace(np.array([(0x100, 0, 0, 0, 0, 0)], dtype=RawHTraceSample), "cache")
        other = HTrace(np.array([(0x200, 0, 0, 0, 0, 0)], dtype=RawHTraceSample), "cache")

        # __eq__
        self.assertEqual(base, twin)
        self.assertNotEqual(base, other)

        # __len__: the number of samples
        self.assertEqual(len(base), 1)
        self.assertEqual(len(other), 1)
        self.assertEqual(len(HTrace.empty_trace()), 0)

        # __hash__
        self.assertEqual(hash(base), hash(twin))
        self.assertNotEqual(hash(base), hash(other))

    def test_merge(self) -> None:
        # `merge` concatenates the samples of both traces, receiver first
        first = HTrace(np.array([(0x100, 0, 0, 0, 0, 0)], dtype=RawHTraceSample), "cache")
        second = HTrace(np.array([(0x200, 0, 0, 0, 0, 0)], dtype=RawHTraceSample), "cache")
        merged = first.merge(second)

        self.assertEqual(len(merged), 2)
        self.assertEqual(merged.get_raw_traces().tolist(), [0x100, 0x200])

    def test_accessors(self) -> None:
        # Accessors: `get_raw_readings`, `get_raw_traces`, `sample_size`, `get_max_pfc`
        samples = np.array([(0x100, 1, 2, 3, 4, 5)], dtype=RawHTraceSample)
        trace = HTrace(samples)

        # get_raw_readings: the complete samples
        self.assertTrue(np.array_equal(trace.get_raw_readings(), samples))

        # get_raw_traces: only the 'trace' column of the samples
        self.assertTrue(np.array_equal(trace.get_raw_traces(), samples['trace']))

        # sample_size
        self.assertEqual(trace.sample_size(), 1)
        self.assertEqual(HTrace.empty_trace().sample_size(), 0)

        # get_max_pfc: the five values that follow the 'trace' column
        self.assertEqual(trace.get_max_pfc(), (1, 2, 3, 4, 5))


def _get_bundle_set() -> list[TraceBundle]:
    """
    Build the four-bundle fixture shared by the equivalence-class and violation tests.

    The first two bundles carry identical contract and hardware traces; the last two
    share a contract trace but differ in their hardware traces. Every bundle gets
    its own input ID and its own default-constructed InputData.

    :return: the four bundles, ordered by input ID
    """
    # (input ID, value of the only ctrace entry, first field of the only htrace sample)
    layout = [
        (1, 0, 0x100),
        (2, 0, 0x100),
        (3, 1, 0x200),
        (4, 1, 0x300),
    ]
    return [
        TraceBundle(
            input_id=InputID(input_id),
            input_=InputData(),
            ctrace=CTrace([CTraceEntry("val", ctrace_value)]),
            htrace=HTrace(
                np.array([(htrace_value, 0, 0, 0, 0, 0)], dtype=RawHTraceSample), "cache"))
        for input_id, ctrace_value, htrace_value in layout
    ]


class TestHardwareEqClass(unittest.TestCase):
    """ Unit tests for HardwareEqClass"""

    def test_hw_class_builder(self) -> None:
        # Test `build_hw_classes`
        # Create hardware equivalence classes
        trace_bundles = _get_bundle_set()
        hw_classes = HardwareEqClass.build_hw_classes(trace_bundles)

        # Test grouping: the first two bundles share a hardware trace, while each of
        # the remaining two has a trace of its own, so three classes are expected
        self.assertEqual(len(hw_classes), 3)
        self.assertEqual(hw_classes[0].htrace, trace_bundles[0].htrace)
        self.assertEqual(hw_classes[1].htrace, trace_bundles[2].htrace)
        self.assertEqual(hw_classes[2].htrace, trace_bundles[3].htrace)
        self.assertEqual(hw_classes[0].measurements, [trace_bundles[0], trace_bundles[1]])
        self.assertEqual(hw_classes[1].measurements, [trace_bundles[2]])
        self.assertEqual(hw_classes[2].measurements, [trace_bundles[3]])

    def test_default_methods(self) -> None:
        # Test default methods
        trace_bundles = _get_bundle_set()
        hw_classes = HardwareEqClass.build_hw_classes(trace_bundles)

        # __len__: the number of measurements in the class
        self.assertEqual(len(hw_classes[0]), 2)

        # __iter__: yields the measurements in their original order
        for i, bundle in enumerate(hw_classes[0]):
            self.assertEqual(bundle, trace_bundles[i])

        # __getitem__
        self.assertEqual(hw_classes[0][0], trace_bundles[0])

        # __eq__: distinct classes differ; comparison with another type is an error
        self.assertNotEqual(hw_classes[0], hw_classes[1])
        with self.assertRaises(NotImplementedError):
            _ = hw_classes[0] == "not a HardwareEqClass"


class TestContractEqClass(unittest.TestCase):
    """ Unit tests for ContractEqClass """

    def test_contract_class_builder(self) -> None:
        # `build_contract_classes` groups the bundles by their contract trace
        bundles = _get_bundle_set()
        classes = ContractEqClass.build_contract_classes(bundles)

        # The fixture has two distinct contract traces, each shared by two bundles
        self.assertEqual(len(classes), 2)

        first = classes[0]
        self.assertEqual(first.ctrace, bundles[0].ctrace)
        self.assertEqual(len(first), 2)
        self.assertEqual(first.measurements, bundles[:2])

        second = classes[1]
        self.assertEqual(second.ctrace, bundles[2].ctrace)
        self.assertEqual(second.measurements, bundles[2:])

    def test_accessors(self) -> None:
        # Accessors: `set_hw_classes`, `set_trivial_hw_classes`, `get_hw_classes`
        bundles = _get_bundle_set()
        target = ContractEqClass.build_contract_classes(bundles)[0]

        # get_hw_classes fails while no hardware classes are assigned
        with self.assertRaises(AssertionError):
            _ = target.get_hw_classes()

        # set_hw_classes stores the classes, and may be called only once
        hw_classes = HardwareEqClass.build_hw_classes(bundles)
        target.set_hw_classes(hw_classes)
        self.assertEqual(target.get_hw_classes(), hw_classes)
        with self.assertRaises(AssertionError):  # repeated setting forbidden
            target.set_hw_classes([])

        # set_trivial_hw_classes is rejected as well once the classes are set ...
        with self.assertRaises(AssertionError):
            target.set_trivial_hw_classes()

        # ... but succeeds on a freshly built contract class
        target = ContractEqClass.build_contract_classes(bundles)[0]
        target.set_trivial_hw_classes()
        trivial_class = target.get_hw_classes()[0]
        self.assertEqual(trivial_class.htrace, hw_classes[0].htrace)
        self.assertEqual(trivial_class, hw_classes[0])


class TestViolation(unittest.TestCase):
    """ Unit tests for Violation class """

    def test_constructors(self) -> None:
        """
        Check the three ways of creating a Violation: the plain constructor,
        `from_contract_eq_class`, and `pseudo_violation_from_inputs`.
        """
        # Shared fixtures: the tail of the bundle set, the inputs of those bundles,
        # and a mock standing in for the test case program
        measurements = _get_bundle_set()[2:]
        input_sequence = [m.input_ for m in measurements]
        test_case_code = unittest.mock.MagicMock(spec=TestCaseProgram)

        # __init__
        violation = Violation(measurements, input_sequence, test_case_code)
        violation.set_trivial_hw_classes()
        self.assertEqual(violation.input_sequence, input_sequence)
        self.assertEqual(violation.test_case_code, test_case_code)

        # from_contract_eq_class: must carry over the inputs, the program, and
        # the measurements of the contract class it was built from
        contract_class = ContractEqClass.build_contract_classes(measurements)[0]
        contract_class.set_trivial_hw_classes()
        violation_from_class = Violation.from_contract_eq_class(contract_class, input_sequence,
                                                                test_case_code)
        self.assertEqual(violation_from_class.input_sequence, input_sequence)
        self.assertEqual(violation_from_class.test_case_code, test_case_code)
        self.assertListEqual(violation_from_class.measurements, violation.measurements)

        # pseudo_violation_from_inputs: keeps the inputs and the program, while the
        # first measurement holds empty contract and hardware traces
        pseudo_violation = Violation.pseudo_violation_from_inputs(input_sequence, test_case_code)
        self.assertEqual(pseudo_violation.input_sequence, input_sequence)
        self.assertEqual(pseudo_violation.test_case_code, test_case_code)
        self.assertTrue(pseudo_violation.measurements[0].ctrace.is_empty())
        self.assertTrue(pseudo_violation.measurements[0].htrace.is_empty())


================================================
FILE: tests/x86_tests/__init__.py
================================================


================================================
FILE: tests/x86_tests/asm/actor_switch.asm
================================================
.intel_syntax noprefix
.section .data.main

.function_start:
    # delay on rbx
    lea rbx, qword ptr [rbx + rcx + 1]
    lea rbx, qword ptr [rbx + rcx + 1]
    lea rbx, qword ptr [rbx + rcx + 1]
    lea rbx, qword ptr [rbx + rcx + 1]
    lea rbx, qword ptr [rbx + rcx + 1]
    lea rbx, qword ptr [rbx + rcx + 1]
    lea rbx, qword ptr [rbx + rcx + 1]
    lea rbx, qword ptr [rbx + rcx + 1]
    lea rbx, qword ptr [rbx + rcx + 1]
    lea rbx, qword ptr [rbx + rcx + 1]
    and rbx, 0b1

    .macro.switch.actor2.function_1:
# end of function_start
# --------------------------------------------------------------------------------------------------

.function_fin:
    .bb0:
    nop
# end of function_fin
# --------------------------------------------------------------------------------------------------

.section .data.actor2
.function_1:
    # a typical spectre v1 gadget
    jz .l3
    .l1:
        # mask the memory access
        and rax, 0b111111000000
        mov rax, qword ptr [r14 + rax]
    jmp .l3
    .l2:
        # mov rax, qword ptr [r14 + 0x100]
    .l3:

    and rdx, 0b111111000000
    mov rax, qword ptr [r14 + rdx]
    mov rsi, 0x42

    .macro.switch.main.function_fin:
# end of function_1
# --------------------------------------------------------------------------------------------------

.test_case_exit:


================================================
FILE: tests/x86_tests/asm/asm_basic.asm
================================================
.intel_syntax noprefix
.section .data.main

.function_0:
.bb_0:

  # line with a comment
nop # no operands
div rbx  # one operand
and rax, rax # two operands
and rax, 0b0111111000000 # immediate value - binary
and rax, 42 # immediate value - decimal
and rax, 0xfa # immediate value - hex
and rax, -1 # immediate value - negative
and rdi, r14  # reserved register
neg rax  # lowercase
mov rax, qword ptr [r14]  # load - simple addressing
mov rax, qword ptr [r14 + rbx]  # load - two parts
mov rax, qword ptr [r14 + rbx + 8]  # load - three parts
mov rax, qword ptr [r14 + rbx]  # store - NOTE(review): operands encode a load (same as the two-part load above), confirm intent
lock adc dword ptr [r14 + rbx], eax  # lock prefix
and rax, rax # instrumentation

mov rdi, rdi # multiple matches


jmp .bb_1
  .bb_1:
      and rdi, 0b0111111000000 # indentation
     cmp qword ptr [ r14 + rdi ] , 59   # extra spaces
    and rdi, 0b0111111000000 # instrumentation
    cmpxchg byte ptr [r14 + rsi], sil

.test_case_exit:


================================================
FILE: tests/x86_tests/asm/asm_multiactor.asm
================================================
.intel_syntax noprefix
.section .data.main

.function_0:
nop
nop

.section .data.guest_1
.function_1:
nop

.section .data.main
.function_2:
.bb0:
nop

# .section exit
.test_case_exit:


================================================
FILE: tests/x86_tests/asm/asm_symbol.asm
================================================
.intel_syntax noprefix
.section .data.main

.macro.measurement_start: nop qword ptr [rax + 0xff]

nop

.macro.measurement_end: nop qword ptr [rax + 0xff]

and rax, rax

.function_1:

nop

.section .data.guest_1
.function_2:
nop


.test_case_exit:


================================================
FILE: tests/x86_tests/asm/calls.asm
================================================
.intel_syntax noprefix
.section .data.main
.function_0:
call .function_1
.function_1:
add rsp, 8
call .function_2
.function_2:
add rsp, 8
call .function_3
.function_3:
add rsp, 8
call .function_4
.function_4:
add rsp, 8
call .function_5
.function_5:
add rsp, 8
call .function_6
.function_6:
add rsp, 8
call .function_7
.function_7:
add rsp, 8
call .function_8
.function_8:
add rsp, 8
call .function_9
.function_9:
add rsp, 8
call .function_10
.function_10:
add rsp, 8
call .function_11
.function_11:
add rsp, 8
call .function_12
.function_12:
add rsp, 8
call .function_13
.function_13:
add rsp, 8
call .function_14
.function_14:
add rsp, 8
call .function_15
.function_15:
add rsp, 8
call .function_16
.function_16:
add rsp, 8
call .function_17
.function_17:
add rsp, 8
call .function_18
.function_18:
add rsp, 8
call .function_19
.function_19:
add rsp, 8
call .function_20
.function_20:
add rsp, 8
call .function_21
.function_21:
add rsp, 8
call .function_22
.function_22:
add rsp, 8
call .function_23
.function_23:
add rsp, 8
call .function_24
.function_24:
add rsp, 8
call .function_25
.function_25:
add rsp, 8
call .function_26
.function_26:
add rsp, 8
call .function_27
.function_27:
add rsp, 8
call .function_28
.function_28:
add rsp, 8
call .function_29
.function_29:
add rsp, 8
call .function_30
.function_30:
add rsp, 8
call .function_31
.function_31:
add rsp, 8
call .function_32
.function_32:
add rsp, 8
call .function_33
.function_33:
add rsp, 8
call .function_34
.function_34:
add rsp, 8
call .function_35
.function_35:
add rsp, 8
call .function_36
.function_36:
add rsp, 8
call .function_37
.function_37:
add rsp, 8
call .function_38
.function_38:
add rsp, 8
call .function_39
.function_39:
add rsp, 8
call .function_40
.function_40:
add rsp, 8
call .function_41
.function_41:
add rsp, 8
call .function_42
.function_42:
add rsp, 8
call .function_43
.function_43:
add rsp, 8
call .function_44
.function_44:
add rsp, 8
call .function_45
.function_45:
add rsp, 8
call .function_46
.function_46:
add rsp, 8
call .function_47
.function_47:
add rsp, 8
call .function_48
.function_48:
add rsp, 8
call .function_49
.function_49:
add rsp, 8
call .function_50
.function_50:
add rsp, 8
.test_case_exit:


================================================
FILE: tests/x86_tests/asm/direct_jumps.asm
================================================
.intel_syntax noprefix
.section .data.main
jmp .1
.1:
jmp .2
.2:
jmp .3
.3:
jmp .4
.4:
jmp .5
.5:
jmp .6
.6:
jmp .7
.7:
jmp .8
.8:
jmp .9
.9:
jmp .10
.10:
jmp .11
.11:
jmp .12
.12:
jmp .13
.13:
jmp .14
.14:
jmp .15
.15:
jmp .16
.16:
jmp .17
.17:
jmp .18
.18:
jmp .19
.19:
jmp .20
.20:
jmp .21
.21:
jmp .22
.22:
jmp .23
.23:
jmp .24
.24:
jmp .25
.25:
jmp .26
.26:
jmp .27
.27:
jmp .28
.28:
jmp .29
.29:
jmp .30
.30:
jmp .31
.31:
jmp .32
.32:
jmp .33
.33:
jmp .34
.34:
jmp .35
.35:
jmp .36
.36:
jmp .37
.37:
jmp .38
.38:
jmp .39
.39:
jmp .40
.40:
jmp .41
.41:
jmp .42
.42:
jmp .43
.43:
jmp .44
.44:
jmp .45
.45:
jmp .46
.46:
jmp .47
.47:
jmp .48
.48:
jmp .49
.49:
jmp .50
.50:
.test_case_exit:


================================================
FILE: tests/x86_tests/asm/fault-div-overflow-speculation.asm
================================================
.intel_syntax noprefix
.section .data.main

MOV ebx, 1
lfence
DIV bx

XOR rax, rcx
AND rax, 0b111111111111 # instrumentation
MOV rax, qword ptr [r14 + rax + 128]


.test_case_exit:


================================================
FILE: tests/x86_tests/asm/fault-div-zero-speculation.asm
================================================
.intel_syntax noprefix
.section .data.main
mov edx, 0
mov ebx, 0
div ebx
xor rax, rcx
and rax, 0b111111111111 # instrumentation
mov rax, qword ptr [r14 + rax + 128]
.test_case_exit:


================================================
FILE: tests/x86_tests/asm/fault_INT1.asm
================================================
.intel_syntax noprefix
.section .data.main
.byte 0xf1  # int1
mov rax, qword ptr [r14 + 256]
.test_case_exit:


================================================
FILE: tests/x86_tests/asm/fault_INT3.asm
================================================
.intel_syntax noprefix
.section .data.main
int3
mov rax, qword ptr [r14 + 256]
.test_case_exit:


================================================
FILE: tests/x86_tests/asm/fault_UD.asm
================================================
.intel_syntax noprefix
.section .data.main
ud2
and rax, 0b111111111111 # instrumentation
mov rax, qword ptr [r14 + rax + 128]
.test_case_exit:


================================================
FILE: tests/x86_tests/asm/fault_load.asm
================================================
.intel_syntax noprefix
.section .data.main
mov rax, qword ptr [r14 + 4096]
xor rax, rcx
and rax, 0b111111111111 # instrumentation
mov rax, qword ptr [r14 + rax]
.test_case_exit:


================================================
FILE: tests/x86_tests/asm/fault_ooo_mem_access.asm
================================================
.intel_syntax noprefix
.section .data.main
mov rax, qword ptr [r14 + 4096 + 64]

# dependent memory access
and rbx, 0b111111111000 # instrumentation
mov rax, qword ptr [r14 + rbx]

# independent memory access
and rbx, 0b111111111000 # instrumentation
mov rax, qword ptr [r14 + rbx]
.test_case_exit:


================================================
FILE: tests/x86_tests/asm/fault_rmw.asm
================================================
.intel_syntax noprefix
.section .data.main
xadd qword ptr [r14 + 4096], rax
add rax, rbx
and rax, 0b111111111111 # instrumentation
mov rax, qword ptr [r14 + rax + 128]
.test_case_exit:


================================================
FILE: tests/x86_tests/asm/macro_fault_handler.asm
================================================
.intel_syntax noprefix
.section .data.main
.function_main_0:

mov rbx, qword ptr [r14 + 0x300]
ud2
lfence

.macro.fault_handler:
mov rax, qword ptr [r14 + 0x200]


# ----------------------------- Exit    ------------------------------------------------------------
.test_case_exit:


================================================
FILE: tests/x86_tests/asm/minimization-after.asm
================================================
.intel_syntax noprefix
.section .data.main
.function_main:
.macro.measurement_start: nop qword ptr [rax + 0xff]
and rax, 0b1111111111111 # instrumentation
or ebx, dword ptr [r14 + rax]  # speculation source ?
mov al, bl
xor ax, -2067
test al, -117 # instrumentation
and rax, 0b1111111111111 # instrumentation
mov qword ptr [r14 + rax], rcx  # speculation sink ?
.section .data.main
.function_end:
.macro.measurement_end: nop qword ptr [rax + 0xff]
.section .data.main
.test_case_exit:nop


================================================
FILE: tests/x86_tests/asm/minimization-before.asm
================================================
.intel_syntax noprefix
.section .data.main
.function_main:
.bb_main.entry:
jmp .bb_main.0
.bb_main.0:
test dil, 51
adc ax, -49
xor eax, ecx
and rax, 0b1111111111111 # instrumentation
or ebx, dword ptr [r14 + rax]
or al, bl
and rsi, 0b1111111111111 # instrumentation
xor byte ptr [r14 + rsi], al
setl bl
xor ax, -2067
lea si, qword ptr [rsi + rbx]
sbb cl, cl
and rdx, 0b1111111111111 # instrumentation
lock and dword ptr [r14 + rdx], -37
dec al
test al, -117 # instrumentation
and rax, 0b1111111111111 # instrumentation
xchg qword ptr [r14 + rax], rcx
movsx esi, cl
xadd rdi, rdi
.bb_main.exit:
.test_case_exit:


================================================
FILE: tests/x86_tests/asm/model_flags_match.asm
================================================
.intel_syntax noprefix
.section .data.main
lfence
mov rax, r14

mov rbx, 0
mov rcx, 64
cmovb rbx, rcx
mov rcx, qword ptr [rax + rbx]

mov rbx, 0
mov rcx, 128
cmovbe rbx, rcx
mov rcx, qword ptr [rax + rbx]

mov rbx, 0
mov rcx, 192
cmovl rbx, rcx
mov rcx, qword ptr [rax + rbx]

mov rbx, 0
mov rcx, 256
cmovle rbx, rcx
mov rcx, qword ptr [rax + rbx]

mov rbx, 0
mov rcx, 320
cmovo rbx, rcx
mov rcx, qword ptr [rax + rbx]

mov rbx, 0
mov rcx, 384
cmovp rbx, rcx
mov rcx, qword ptr [rax + rbx]

mov rbx, 0
mov rcx, 448
cmovs rbx, rcx
mov rcx, qword ptr [rax + rbx]

mov rbx, 0
mov rcx, 512
cmovz rbx, rcx
mov rcx, qword ptr [rax + rbx]

// cmovnb
// cmovnbe
// cmovnl
// cmovnle
// cmovno
// cmovnp
// cmovns
// cmovnz
mfence
.test_case_exit:


================================================
FILE: tests/x86_tests/asm/model_match.asm
================================================
.intel_syntax noprefix
.section .data.main

# empty - leaving initial reg values unchanged

.test_case_exit:


================================================
FILE: tests/x86_tests/asm/model_match_memory.asm
================================================
.intel_syntax noprefix
.section .data.main

mov rax, qword ptr [r14]  # main page
add rax, qword ptr [r14 + 4096]  # faulty page

mov rbx, qword ptr [r14 - 8]  # underflow pad
add rbx, qword ptr [r14 + 4096 + 4096 + 320]  # overflow pad

mov rcx, qword ptr [r14 + 4096 + 4096]  # reg init
mov rdx, qword ptr [r14 + 4096 + 4096 + 48]  # patched flags
mov rsi, qword ptr [r14 + 4096 + 4096 + 64]  # simd init
mov rdi, r14


# uncomment the following to test the complete sandbox contents
# xor rax, rax
# xor rbx, rbx
# xor rcx, rcx
# xor rdx, rdx
# mov rdi, 0xff8
# .l1:
# add rax, qword ptr [r14 + rdi]
# add rbx, qword ptr [r14 + rdi + 0x1000]
# add rcx, qword ptr [r14 + rdi + 0x2000]
# sub rdi, 8
# jnz .l1
# .l1_exit:

# mov rdi, 0xef8
# .l2:
# add rdx, qword ptr [r14 + rdi - 0xf00]
# sub rdi, 8
# jnz .l2

.test_case_exit:


================================================
FILE: tests/x86_tests/asm/model_match_xmm.asm
================================================
.intel_syntax noprefix
.section .data.main
movq rax, xmm0
movq rbx, xmm1
movq rdx, xmm2
movq rcx, xmm3
movq rsi, xmm4
movq rdi, xmm5
.test_case_exit:


================================================
FILE: tests/x86_tests/asm/spectre_ret.asm
================================================
.intel_syntax noprefix
.section .data.main

# speculative offset:
# this mask leaves a random page offset, 64-byte aligned
and rax, 0b111111000000
lfence

mov rcx, r14
add rsp, 8  # ensure that the call and ret use the first cache set

call .function_1

.unreachable:
// lfence  # if you uncomment this line, the speculation will stop
and rax, 0b110000000  # reduce the number of possibilities
mov rax, qword ptr [rcx + rax]  # speculative access
lfence

.function_1:
lea rdx, qword ptr [rip + .function_2]
mov qword ptr [rsp], rdx
ret

.function_2:
mov rdx, qword ptr [rcx + 64]
mfence

# clear to avoid failing the arch check
mov rcx, 0
mov rdx, 0

.test_case_exit:


================================================
FILE: tests/x86_tests/asm/spectre_v1.1.asm
================================================
.intel_syntax noprefix
.section .data.main
lfence

# reduce the entropy of rax
and rax, 0b111111000000

# delay the cond. jump
mov rcx, 0
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]

# reduce the entropy in rbx
and rbx, 0b1000000

cmp rbx, 0
je .l1  # misprediction
.l0:
    # rbx != 0
    mov qword ptr [r14], rax
    mov rdx, qword ptr [r14]
    mov rbx, qword ptr [r14 + rdx]
.l1:
mfence

.test_case_exit:


================================================
FILE: tests/x86_tests/asm/spectre_v1.asm
================================================
.intel_syntax noprefix
.section .data.main
lfence

# reduce the entropy of rax
and rax, 0b111111000000

# delay the cond. jump
mov rcx, 0
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]

# reduce the entropy in rbx
and rbx, 0b1000000

cmp rbx, 0
je .l1  # misprediction
.l0:
    # rbx != 0
    mov rax, qword ptr [r14 + rax]
jmp .l2
.l1:
    # rbx == 0
    #mov rax, qword ptr [r14 + 64]
.l2:
mfence

.test_case_exit:


================================================
FILE: tests/x86_tests/asm/spectre_v1_arch.asm
================================================
.intel_syntax noprefix
.section .data.main
lfence

# delay the cond. jump
mov rax, 0
lea rbx, qword ptr [rbx + rax + 1]
lea rbx, qword ptr [rbx + rax - 1]
lea rbx, qword ptr [rbx + rax + 1]
lea rbx, qword ptr [rbx + rax - 1]
lea rbx, qword ptr [rbx + rax + 1]
lea rbx, qword ptr [rbx + rax - 1]
lea rbx, qword ptr [rbx + rax + 1]
lea rbx, qword ptr [rbx + rax - 1]
lea rbx, qword ptr [rbx + rax + 1]
lea rbx, qword ptr [rbx + rax - 1]
lea rbx, qword ptr [rbx + rax + 1]
lea rbx, qword ptr [rbx + rax - 1]
lea rbx, qword ptr [rbx + rax + 1]
lea rbx, qword ptr [rbx + rax - 1]

# reduce the entropy in rbx
and rbx, 0b1000000

cmp rbx, 0
je .l1  # misprediction
.l0:
    # rbx != 0
    mov rax, qword ptr [r14 + 1024]
    shl rax, 2
    and rax, 0b111111000000
    mov rax, qword ptr [r14 + rax] # leakage happens here
.l1:

mfence

.test_case_exit:


================================================
FILE: tests/x86_tests/asm/spectre_v1_independent.asm
================================================
# This test case is identical to spectre_v1 except the offset of the speculative mem. access
# is input-independent. Therefore, this test case must not be flagged.

.intel_syntax noprefix
.section .data.main
MOV rcx, r14

# input: ebx - a random value, eax - fixed value
MOV rax, 128
lfence

# no delay to increase the likelihood of a false positive
SHL rbx, 63
SHR rbx, 63

# speculation
CMP rbx, 0
JE .l1
.l0:
    # rbx != 0
    MOV rcx, qword ptr [rcx + rax]
JMP .l2
.l1:
    # rbx == 0
    MOV rcx, qword ptr [rcx]
.l2:
MFENCE

.test_case_exit:


================================================
FILE: tests/x86_tests/asm/spectre_v1_n2.asm
================================================
.intel_syntax noprefix
.section .data.main
lfence

# reduce the entropy of rax
and rax, 0b111111000000

# delay the cond. jump
lea rbx, qword ptr [rbx + rax + 1]
lea rbx, qword ptr [rbx + rax - 1]
lea rbx, qword ptr [rbx + rax + 1]
lea rbx, qword ptr [rbx + rax - 1]
lea rbx, qword ptr [rbx + rax + 1]
lea rbx, qword ptr [rbx + rax - 1]
lea rbx, qword ptr [rbx + rax + 1]
lea rbx, qword ptr [rbx + rax - 1]
lea rbx, qword ptr [rbx + rax + 1]
lea rbx, qword ptr [rbx + rax - 1]
lea rbx, qword ptr [rbx + rax + 1]
lea rbx, qword ptr [rbx + rax - 1]
lea rbx, qword ptr [rbx + rax + 1]
lea rbx, qword ptr [rbx + rax - 1]
lea rbx, qword ptr [rbx + rax + 1]
lea rbx, qword ptr [rbx + rax - 1]
lea rbx, qword ptr [rbx + rax + 1]
lea rbx, qword ptr [rbx + rax - 1]
lea rbx, qword ptr [rbx + rax + 1]
lea rbx, qword ptr [rbx + rax - 1]

# reduce the entropy in rbx
and rbx, 0b1000000

cmp rbx, 0
je .l1  # misprediction
je .l1  # same branch repeated - presumably the second nesting level (n2), TODO confirm
.l0:
    # rbx != 0
    mov rax, qword ptr [r14 + rax]
jmp .l2
.l1:
    # rbx == 0
    #mov rax, qword ptr [r14 + 64]
.l2:
mfence

.test_case_exit:


================================================
FILE: tests/x86_tests/asm/spectre_v2.asm
================================================
.intel_syntax noprefix
.section .data.main

# reduce the entropy of rax
and rax, 0b111111000000

# prepare jump targets
lea rdx, qword ptr [rip + .l1]
lea rsi, qword ptr [rip + .l2]

# delay the jump
mov rcx, 0
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]
lea rbx, qword ptr [rbx + rcx + 1]
lea rbx, qword ptr [rbx + rcx - 1]

# reduce the entropy in rbx
and rbx, 0b11000000

# select a target based on the random value in rbx
cmp rbx, 0
cmove rsi, rdx

jmp rsi   # misprediction
.l0:
lfence
.l1:
    # rbx = 0
    mov rdx, qword ptr [r14 + rax]
.l2:
mfence

# override the targets to avoid failing the arch. check
mov rdx, 0
mov rsi, 0

.test_case_exit:


================================================
FILE: tests/x86_tests/asm/spectre_v4.asm
================================================
.intel_syntax noprefix
.section .data.main

# the leaked value - rcx
# construct a page offset in the range [0x200; 0x900]
and rcx, 0b11100000000
add rcx, 0x200

# save the offset into [r14 + 0]
mov qword ptr [r14], rcx
mfence

# create a delay on rbx
mov rax, 0
and rbx, 0b111000
lea rbx, qword ptr [rbx + rax + 1]
lea rbx, qword ptr [rbx + rax - 1]
lea rbx, qword ptr [rbx + rax + 1]
lea rbx, qword ptr [rbx + rax - 1]
lea rbx, qword ptr [rbx + rax + 1]
lea rbx, qword ptr [rbx + rax - 1]
lea rbx, qword ptr [rbx + rax + 1]
lea rbx, qword ptr [rbx + rax - 1]
lea rbx, qword ptr [rbx + rax + 1]
lea rbx, qword ptr [rbx + rax - 1]
lea rbx, qword ptr [rbx + rax + 1]
lea rbx, qword ptr [rbx + rax - 1]
lea rbx, qword ptr [rbx + rax + 1]
lea rbx, qword ptr [rbx + rax - 1]
lea rbx, qword ptr [rbx + rax + 1]
lea rbx, qword ptr [rbx + rax - 1]
lea rbx, qword ptr [rbx + rax + 1]
lea rbx, qword ptr [rbx + rax - 1]
lea rbx, qword ptr [rbx + rax + 1]
lea rbx, qword ptr [rbx + rax - 1]
lea rbx, qword ptr [rbx + rax + 1]
lea rbx, qword ptr [rbx + rax - 1]
lea rbx, qword ptr [rbx + rax + 1]
lea rbx, qword ptr [rbx + rax - 1]
lea rbx, qword ptr [rbx + rax + 1]
lea rbx, qword ptr [rbx + rax - 1]

# sequence of potentially aliasing store-load
# if rbx == 0, they alias and rdx = 0x40
# if rbx != 0, they do not alias and rdx = offset saved above
mov qword ptr [r14 + rbx], 0x40  # store offset 0x40
mov rdx, qword ptr [r14]  # load the offset; misprediction happens here

# dependent load with the offset
and rdx, 0b111111000000
mov rdx, qword ptr [r14 + rdx]
mfence

.test_case_exit:


================================================
FILE: tests/x86_tests/asm/vm_switch.asm
================================================
.intel_syntax noprefix
# ----------------------------- actor 1 ------------------------------------------------------------
.section .data.main
.function_main1:

.function_main2:
    .macro.set_h2g_target.actor2.function_a2:
    .macro.set_g2h_target.main.function_fin:
    .macro.switch_h2g.actor2:

.function_fin:
    .macro.landing_g2h:
    nop

# ----------------------------- actor 2 ------------------------------------------------------------
.section .data.actor2
.function_a2:
    .macro.landing_h2g:
    .macro.measurement_start:
    mov rax, qword ptr [r14 + 0x100]
    .macro.measurement_end:

    .macro.switch_g2h.main:

# ----------------------------- exit    ------------------------------------------------------------
.test_case_exit:


================================================
FILE: tests/x86_tests/configs/arch-actors.yaml
================================================
file: !include arch.yaml

actors:
  - actor2:
      - mode: "host"


================================================
FILE: tests/x86_tests/configs/arch-dr.yaml
================================================
file: !include common.yaml
file: !include base-and-simd-categories.yaml

fuzzer: architectural
model_backend: dynamorio
enable_priming: false
inputs_per_class: 1
logging_modes:
 - info
 - dbg_violation

program_size: 150
avg_mem_accesses: 50
max_bb_per_function: 3
min_bb_per_function: 3


================================================
FILE: tests/x86_tests/configs/arch-faults.yaml
================================================
file: !include common.yaml
file: !include base-and-simd-categories.yaml

fuzzer: architectural
enable_priming: false
inputs_per_class: 1
logging_modes:
 - info
 - dbg_violation

program_size: 300
avg_mem_accesses: 150
max_bb_per_function: 3
min_bb_per_function: 3

faults_allowlist:
  - opcode-undefined


================================================
FILE: tests/x86_tests/configs/arch.yaml
================================================
file: !include common.yaml
file: !include base-and-simd-categories.yaml

fuzzer: architectural
enable_priming: false
inputs_per_class: 1
logging_modes:
 - info
 - dbg_violation

program_size: 300
avg_mem_accesses: 150
max_bb_per_function: 3
min_bb_per_function: 3


================================================
FILE: tests/x86_tests/configs/archdiff.yaml
================================================
file: !include common.yaml
file: !include base-and-simd-categories.yaml

fuzzer: archdiff
enable_priming: false
inputs_per_class: 1
logging_modes:
 - info
#  - dbg_violation

program_size: 150
avg_mem_accesses: 100
max_bb_per_function: 3
min_bb_per_function: 3


================================================
FILE: tests/x86_tests/configs/base-and-simd-categories.yaml
================================================
instruction_categories:
- BASE-BINARY
- BASE-BITBYTE
- BASE-CMOV
- BASE-COND_BR
- BASE-CONVERT
- BASE-DATAXFER
- BASE-FLAGOP
- BASE-LOGICAL
- BASE-MISC
- BASE-NOP
- BASE-POP
- BASE-PUSH
- BASE-SEMAPHORE
- BASE-SETCC
- BASE-STRINGOP
- BASE-WIDENOP
- SSE-SSE
- SSE-DATAXFER
- SSE-MISC
- SSE2-DATAXFER
- SSE2-MISC
- CLFLUSHOPT-CLFLUSHOPT
- CLFSH-MISC


================================================
FILE: tests/x86_tests/configs/base-categories.yaml
================================================
instruction_categories:
- BASE-BINARY
- BASE-BITBYTE
- BASE-CMOV
- BASE-COND_BR
- BASE-CONVERT
- BASE-DATAXFER
- BASE-FLAGOP
- BASE-LOGICAL
- BASE-MISC
- BASE-NOP
- BASE-POP
- BASE-PUSH
- BASE-SEMAPHORE
- BASE-SETCC
- BASE-STRINGOP
- BASE-WIDENOP


================================================
FILE: tests/x86_tests/configs/common.yaml
================================================
data_generator_seed: 1234567
program_generator_seed: 1234567

# Acceptance tests do not require a large sample size
executor_sample_sizes:
  - 10

# No logging
logging_modes:
  -
  # - dbg_model
  # - dbg_dump_htraces
  # - dbg_dump_ctraces


================================================
FILE: tests/x86_tests/configs/copy.yaml
================================================
file: !include common.yaml
file: !include ct-deh.yaml


================================================
FILE: tests/x86_tests/configs/ct-cond.yaml
================================================
file: !include common.yaml

contract_observation_clause: ct
contract_execution_clause:
  - cond


================================================
FILE: tests/x86_tests/configs/ct-deh.yaml
================================================
contract_observation_clause: ct
contract_execution_clause:
  - delayed-exception-handling


================================================
FILE: tests/x86_tests/configs/ct-seq.yaml
================================================
file: !include common.yaml

contract_observation_clause: ct
contract_execution_clause:
  - seq

================================================
FILE: tests/x86_tests/configs/div-detect.yaml
================================================
file: !include common.yaml
file: !include ct-deh.yaml

faults_allowlist:
  - div-by-zero
  - div-overflow


================================================
FILE: tests/x86_tests/configs/div-verif.yaml
================================================
file: !include common.yaml

contract_execution_clause:
  - vspec-ops-div

faults_allowlist:
  - div-by-zero
  - div-overflow


================================================
FILE: tests/x86_tests/configs/exceptions.yaml
================================================
file: !include common.yaml
file: !include ct-seq.yaml

faults_allowlist:
  - debug-register
  - breakpoint
  - opcode-undefined


================================================
FILE: tests/x86_tests/configs/fault-handler.yaml
================================================
file: !include common.yaml
file: !include ct-seq.yaml

actors:
  - main:
    - data_properties:
      - present: false

executor_mode: F+R
logging_modes:
  - dbg_dump_htraces

faults_allowlist:
  - opcode-undefined


================================================
FILE: tests/x86_tests/configs/l1tf-p-verif.yaml
================================================
file: !include common.yaml

contract_execution_clause:
  - nullinj-fault

actors:
  - main:
    - data_properties:
      - present: false


================================================
FILE: tests/x86_tests/configs/l1tf-p.yaml
================================================
file: !include common.yaml
file: !include ct-deh.yaml

actors:
  - main:
    - data_properties:
      - present: false


================================================
FILE: tests/x86_tests/configs/l1tf-w-verif.yaml
================================================
file: !include common.yaml

contract_execution_clause:
  - nullinj-fault

actors:
  - main:
    - data_properties:
      - writable: false


================================================
FILE: tests/x86_tests/configs/l1tf-w.yaml
================================================
file: !include common.yaml
file: !include ct-deh.yaml

actors:
  - main:
    - data_properties:
      - writable: false


================================================
FILE: tests/x86_tests/configs/meltdown-verif.yaml
================================================
file: !include common.yaml

contract_execution_clause:
  - nullinj-fault

actors:
  - main:
    - data_properties:
      - user: true


================================================
FILE: tests/x86_tests/configs/meltdown.yaml
================================================
file: !include common.yaml
file: !include ct-deh.yaml

actors:
  - main:
    - data_properties:
      - user: true


================================================
FILE: tests/x86_tests/configs/mpx-verif.yaml
================================================
file: !include common.yaml
file: !include ct-deh.yaml

faults_allowlist:
  - bounds-range-exceeded


================================================
FILE: tests/x86_tests/configs/mpx.yaml
================================================
file: !include common.yaml
file: !include ct-seq.yaml

faults_allowlist:
  - bounds-range-exceeded


================================================
FILE: tests/x86_tests/configs/ssbp-detect.yaml
================================================
file: !include common.yaml

data_generator_seed: 400
x86_executor_enable_ssbp_patch: false


================================================
FILE: tests/x86_tests/configs/ssbp-verif.yaml
================================================
file: !include common.yaml

data_generator_seed: 400
x86_executor_enable_ssbp_patch: false

contract_execution_clause:
  - bpas


================================================
FILE: tests/x86_tests/configs/vm-switch.yaml
================================================
file: !include common.yaml
file: !include ct-seq.yaml


actors:
  - actor2:
      - mode: "guest"


================================================
FILE: tests/x86_tests/min_x86.json
================================================
[
  {"name": "adc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "adc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "adc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "adc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": true, "width": 8},
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "adc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8},
      {"type_": "REG", "values": ["al", "cl", "dl", "bl"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "adc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl"], "src": true, "dest": true, "width": 8},
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "adc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8},
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "adc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "adc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "adc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "adc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "adc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "adc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "adc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al"], "src": true, "dest": true, "width": 8, "magic": true},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "adc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al"], "src": true, "dest": true, "width": 8, "magic": true},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "adc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax"], "src": true, "dest": true, "width": 16, "magic": true},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "adc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax"], "src": true, "dest": true, "width": 32, "magic": true},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "adc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax"], "src": true, "dest": true, "width": 64, "magic": true},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock adc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock adc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock adc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock adc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock adc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock adc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock adc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock adc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock adc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock adc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock adc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock adc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock adc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock adc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock adc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock adc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "add", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "add", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "add", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "and", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "and", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "and", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax"], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax"], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock and", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock and", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock and", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock and", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock and", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock and", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock and", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock and", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock and", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock and", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock and", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock and", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock and", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock and", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock and", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock and", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "bsf", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": false, "dest": true, "width": 16},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["undef", "undef", "undef", "w", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "bsf", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["undef", "undef", "undef", "w", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "bsf", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["undef", "undef", "undef", "w", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "bsf", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": false, "dest": true, "width": 16},
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["undef", "undef", "undef", "w", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "bsf", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["undef", "undef", "undef", "w", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "bsf", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["undef", "undef", "undef", "w", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "bsr", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": false, "dest": true, "width": 16},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["undef", "undef", "undef", "w", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "bsr", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["undef", "undef", "undef", "w", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "bt", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 32},
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "bt", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "btc", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "btc", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "btc", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "btc", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "btc", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "btc", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock btc", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0, "is_signed": false}
    ]
  },
  {"name": "lock btc", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock btc", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock btc", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock btc", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock btc", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock btc", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock btc", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock btc", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "btr", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "btr", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "btr", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "btr", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "btr", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "btr", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "btr", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "btr", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "btr", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "btr", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "btr", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "btr", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "btr", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "btr", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "btr", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "btr", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "btr", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "btr", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "bts", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock bts", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock bts", "category": "BASE-BITBYTE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "call", "category": "BASE-CALL", "is_control_flow": true,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rsp"], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rip"], "src": true, "dest": true, "width": 64},
      {"type_": "MEM", "values": ["rsp"], "src": false, "dest": true, "width": 64}
    ]
  },
  {"name": "call", "category": "BASE-CALL", "is_control_flow": true,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rsp"], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rip"], "src": true, "dest": true, "width": 64},
      {"type_": "MEM", "values": ["rsp"], "src": false, "dest": true, "width": 64}
    ]
  },
  {"name": "call", "category": "BASE-CALL", "is_control_flow": true,
    "operands": [
      {"type_": "LABEL", "values": [], "src": true, "dest": false, "width": 0}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rsp"], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rip"], "src": true, "dest": true, "width": 64},
      {"type_": "MEM", "values": ["rsp"], "src": false, "dest": true, "width": 64}
    ]
  },
  {"name": "{disp32} call", "category": "BASE-CALL", "is_control_flow": true,
    "operands": [
      {"type_": "LABEL", "values": [], "src": true, "dest": false, "width": 0}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rsp"], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rip"], "src": true, "dest": true, "width": 64},
      {"type_": "MEM", "values": ["rsp"], "src": false, "dest": true, "width": 64}
    ]
  },
  {"name": "cbw", "category": "BASE-CONVERT", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["ax"], "src": false, "dest": true, "width": 16},
      {"type_": "REG", "values": ["al"], "src": true, "dest": false, "width": 8}
    ]
  },
  {"name": "cdq", "category": "BASE-CONVERT", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["edx"], "src": false, "dest": true, "width": 32},
      {"type_": "REG", "values": ["eax"], "src": true, "dest": false, "width": 32}
    ]
  },
  {"name": "clc", "category": "BASE-FLAGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "", "", "", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cld", "category": "BASE-FLAGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "", "", "", "", "", "", "w", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cli", "category": "BASE-FLAGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "", "", "", "", "", "w", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmc", "category": "BASE-FLAGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "", "", "", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmovbe", "category": "BASE-CMOV", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": false, "dest": true, "width": 16},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r", "", "", "r", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmovno", "category": "BASE-CMOV", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "", "", "", "", "", "", "", "r"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmovp", "category": "BASE-CMOV", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "r", "", "", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmovz", "category": "BASE-CMOV", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "", "", "r", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "r8b", "r9b", "r10b", "r11b"], "src": true, "dest": false, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "r8b", "r9b", "r10b", "r11b"], "src": true, "dest": false, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["spl", "bpl", "sil", "dil", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": false, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["spl", "bpl", "sil", "dil", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": false, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": false, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": false, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 8},
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 8},
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "{load} cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": false, "width": 8},
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "{load} cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": false, "width": 8},
      {"type_": "REG", "values": ["al", "cl", "dl", "bl"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "{load} cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl"], "src": true, "dest": false, "width": 8},
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "{load} cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": false, "width": 8},
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 16},
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 32},
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "{load} cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16},
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "{load} cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32},
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "{load} cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": false, "width": 8},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": false, "width": 8},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": false, "width": 8},
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": false, "width": 8},
      {"type_": "REG", "values": ["al", "cl", "dl", "bl"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl"], "src": true, "dest": false, "width": 8},
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": false, "width": 8},
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16},
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32},
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al"], "src": true, "dest": false, "width": 8, "magic": true},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al"], "src": true, "dest": false, "width": 8, "magic": true},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax"], "src": true, "dest": false, "width": 16, "magic": true},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax"], "src": true, "dest": false, "width": 32, "magic": true},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmp", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax"], "src": true, "dest": false, "width": 64, "magic": true},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmpsb", "category": "BASE-STRINGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "MEM", "values": ["rsi"], "src": true, "dest": false, "width": 8},
      {"type_": "MEM", "values": ["rdi"], "src": true, "dest": false, "width": 8},
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "r", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmpsd", "category": "BASE-STRINGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "MEM", "values": ["rsi"], "src": true, "dest": false, "width": 32},
      {"type_": "MEM", "values": ["rdi"], "src": true, "dest": false, "width": 32},
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "r", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmpsw", "category": "BASE-STRINGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "MEM", "values": ["rsi"], "src": true, "dest": false, "width": 16},
      {"type_": "MEM", "values": ["rdi"], "src": true, "dest": false, "width": 16},
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "r", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmpxchg", "category": "BASE-SEMAPHORE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["al"], "src": true, "dest": true, "width": 8},
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmpxchg", "category": "BASE-SEMAPHORE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["al"], "src": true, "dest": true, "width": 8},
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmpxchg", "category": "BASE-SEMAPHORE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": true, "width": 8},
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["al"], "src": true, "dest": true, "width": 8},
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmpxchg", "category": "BASE-SEMAPHORE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8},
      {"type_": "REG", "values": ["al", "cl", "dl", "bl"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["al"], "src": true, "dest": true, "width": 8},
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmpxchg", "category": "BASE-SEMAPHORE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl"], "src": true, "dest": true, "width": 8},
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["al"], "src": true, "dest": true, "width": 8},
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmpxchg", "category": "BASE-SEMAPHORE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8},
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["al"], "src": true, "dest": true, "width": 8},
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmpxchg", "category": "BASE-SEMAPHORE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["ax"], "src": true, "dest": true, "width": 16},
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmpxchg", "category": "BASE-SEMAPHORE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["eax"], "src": true, "dest": true, "width": 32},
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmpxchg", "category": "BASE-SEMAPHORE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rax"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmpxchg", "category": "BASE-SEMAPHORE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["ax"], "src": true, "dest": true, "width": 16},
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmpxchg", "category": "BASE-SEMAPHORE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["eax"], "src": true, "dest": true, "width": 32},
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmpxchg", "category": "BASE-SEMAPHORE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rax"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmpxchg8b", "category": "BASE-SEMAPHORE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["edx"], "src": true, "dest": true, "width": 32},
      {"type_": "REG", "values": ["eax"], "src": true, "dest": true, "width": 32},
      {"type_": "REG", "values": ["ecx"], "src": true, "dest": false, "width": 32},
      {"type_": "REG", "values": ["ebx"], "src": true, "dest": false, "width": 32},
      {"type_": "FLAGS", "values": ["", "", "", "w", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock cmpxchg8b", "category": "BASE-SEMAPHORE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["edx"], "src": true, "dest": true, "width": 32},
      {"type_": "REG", "values": ["eax"], "src": true, "dest": true, "width": 32},
      {"type_": "REG", "values": ["ecx"], "src": true, "dest": false, "width": 32},
      {"type_": "REG", "values": ["ebx"], "src": true, "dest": false, "width": 32},
      {"type_": "FLAGS", "values": ["", "", "", "w", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock cmpxchg", "category": "BASE-SEMAPHORE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["al"], "src": true, "dest": true, "width": 8},
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock cmpxchg", "category": "BASE-SEMAPHORE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["al"], "src": true, "dest": true, "width": 8},
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock cmpxchg", "category": "BASE-SEMAPHORE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["ax"], "src": true, "dest": true, "width": 16},
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock cmpxchg", "category": "BASE-SEMAPHORE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["eax"], "src": true, "dest": true, "width": 32},
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock cmpxchg", "category": "BASE-SEMAPHORE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rax"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cpuid", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["eax"], "src": true, "dest": true, "width": 32},
      {"type_": "REG", "values": ["ebx"], "src": false, "dest": true, "width": 32},
      {"type_": "REG", "values": ["ecx"], "src": true, "dest": true, "width": 32},
      {"type_": "REG", "values": ["edx"], "src": false, "dest": true, "width": 32}
    ]
  },
  {"name": "cwd", "category": "BASE-CONVERT", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["dx"], "src": false, "dest": true, "width": 16},
      {"type_": "REG", "values": ["ax"], "src": true, "dest": false, "width": 16}
    ]
  },
  {"name": "cwde", "category": "BASE-CONVERT", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["eax"], "src": false, "dest": true, "width": 32},
      {"type_": "REG", "values": ["ax"], "src": true, "dest": false, "width": 16}
    ]
  },
  {"name": "dec", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "dec", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "dec", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "dec", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "dec", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "dec", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "dec", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "dec", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "dec", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock dec", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock dec", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock dec", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock dec", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "div", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["ax"], "src": true, "dest": true, "width": 16},
      {"type_": "FLAGS", "values": ["undef", "undef", "undef", "undef", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "div", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["ax"], "src": true, "dest": true, "width": 16},
      {"type_": "FLAGS", "values": ["undef", "undef", "undef", "undef", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "div", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["ax"], "src": true, "dest": true, "width": 16},
      {"type_": "FLAGS", "values": ["undef", "undef", "undef", "undef", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "div", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["ax"], "src": true, "dest": true, "width": 16},
      {"type_": "REG", "values": ["dx"], "src": true, "dest": true, "width": 16},
      {"type_": "FLAGS", "values": ["undef", "undef", "undef", "undef", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "div", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["eax"], "src": true, "dest": true, "width": 32},
      {"type_": "REG", "values": ["edx"], "src": true, "dest": true, "width": 32},
      {"type_": "FLAGS", "values": ["undef", "undef", "undef", "undef", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "div", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rax"], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rdx"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["undef", "undef", "undef", "undef", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "div", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["ax"], "src": true, "dest": true, "width": 16},
      {"type_": "REG", "values": ["dx"], "src": true, "dest": true, "width": 16},
      {"type_": "FLAGS", "values": ["undef", "undef", "undef", "undef", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "div", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["eax"], "src": true, "dest": true, "width": 32},
      {"type_": "REG", "values": ["edx"], "src": true, "dest": true, "width": 32},
      {"type_": "FLAGS", "values": ["undef", "undef", "undef", "undef", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "div", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rax"], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rdx"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["undef", "undef", "undef", "undef", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "enterw", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rsp"], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["bp"], "src": true, "dest": true, "width": 16},
      {"type_": "MEM", "values": ["rsp"], "src": false, "dest": true, "width": 16}
    ]
  },
  {"name": "enter", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rsp"], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rbp"], "src": true, "dest": true, "width": 64},
      {"type_": "MEM", "values": ["rsp"], "src": false, "dest": true, "width": 64}
    ]
  },
  {"name": "idiv", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["ax"], "src": true, "dest": true, "width": 16},
      {"type_": "FLAGS", "values": ["undef", "undef", "undef", "undef", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "idiv", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["ax"], "src": true, "dest": true, "width": 16},
      {"type_": "FLAGS", "values": ["undef", "undef", "undef", "undef", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "idiv", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["ax"], "src": true, "dest": true, "width": 16},
      {"type_": "FLAGS", "values": ["undef", "undef", "undef", "undef", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "idiv", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["ax"], "src": true, "dest": true, "width": 16},
      {"type_": "REG", "values": ["dx"], "src": true, "dest": true, "width": 16},
      {"type_": "FLAGS", "values": ["undef", "undef", "undef", "undef", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "idiv", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["eax"], "src": true, "dest": true, "width": 32},
      {"type_": "REG", "values": ["edx"], "src": true, "dest": true, "width": 32},
      {"type_": "FLAGS", "values": ["undef", "undef", "undef", "undef", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "idiv", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rax"], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rdx"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["undef", "undef", "undef", "undef", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "idiv", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["ax"], "src": true, "dest": true, "width": 16},
      {"type_": "REG", "values": ["dx"], "src": true, "dest": true, "width": 16},
      {"type_": "FLAGS", "values": ["undef", "undef", "undef", "undef", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "idiv", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["eax"], "src": true, "dest": true, "width": 32},
      {"type_": "REG", "values": ["edx"], "src": true, "dest": true, "width": 32},
      {"type_": "FLAGS", "values": ["undef", "undef", "undef", "undef", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "idiv", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rax"], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rdx"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["undef", "undef", "undef", "undef", "undef", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "imul", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["al"], "src": true, "dest": false, "width": 8},
      {"type_": "REG", "values": ["ax"], "src": false, "dest": true, "width": 16},
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "undef", "undef", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "imul", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["al"], "src": true, "dest": false, "width": 8},
      {"type_": "REG", "values": ["ax"], "src": false, "dest": true, "width": 16},
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "undef", "undef", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "imul", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["al"], "src": true, "dest": false, "width": 8},
      {"type_": "REG", "values": ["ax"], "src": false, "dest": true, "width": 16},
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "undef", "undef", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "imul", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["ax"], "src": true, "dest": true, "width": 16},
      {"type_": "REG", "values": ["dx"], "src": false, "dest": true, "width": 16},
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "undef", "undef", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "imul", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["eax"], "src": true, "dest": true, "width": 32},
      {"type_": "REG", "values": ["edx"], "src": false, "dest": true, "width": 32},
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "undef", "undef", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "imul", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rax"], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rdx"], "src": false, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "undef", "undef", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "imul", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["ax"], "src": true, "dest": true, "width": 16},
      {"type_": "REG", "values": ["dx"], "src": false, "dest": true, "width": 16},
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "undef", "undef", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "imul", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["eax"], "src": true, "dest": true, "width": 32},
      {"type_": "REG", "values": ["edx"], "src": false, "dest": true, "width": 32},
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "undef", "undef", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "imul", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rax"], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rdx"], "src": false, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "undef", "undef", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "imul", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": false, "dest": true, "width": 16},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "undef", "undef", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "imul", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "undef", "undef", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "imul", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "undef", "undef", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "imul", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": false, "dest": true, "width": 16},
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "undef", "undef", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "imul", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "undef", "undef", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "imul", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "undef", "undef", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "imul", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": false, "dest": true, "width": 16},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "undef", "undef", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "imul", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": false, "dest": true, "width": 16},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "undef", "undef", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "imul", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "undef", "undef", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "imul", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "undef", "undef", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "imul", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "undef", "undef", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "imul", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "undef", "undef", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "{load} imul", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": false, "dest": true, "width": 16},
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "undef", "undef", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "{load} imul", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": false, "dest": true, "width": 16},
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "undef", "undef", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "{load} imul", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "undef", "undef", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "{load} imul", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "undef", "undef", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "{load} imul", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "undef", "undef", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "{load} imul", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "undef", "undef", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "imul", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "undef", "undef", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "imul", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "undef", "undef", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "imul", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "undef", "undef", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "imul", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "undef", "undef", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "imul", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "undef", "undef", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "imul", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "undef", "undef", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },

  {"name": "inc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "inc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "inc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "inc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "inc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "inc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "inc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "inc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "inc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock inc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock inc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock inc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock inc", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "iretd", "category": "BASE-RET", "is_control_flow": true,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rsp"], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rip"], "src": false, "dest": true, "width": 64},
      {"type_": "MEM", "values": ["rsp"], "src": true, "dest": false, "width": 160},
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "w", "w", "w", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "jb", "category": "BASE-COND_BR", "is_control_flow": true,
    "operands": [
      {"type_": "LABEL", "values": [], "src": true, "dest": false, "width": 0}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rip"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["r", "", "", "", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "{disp32} jb", "category": "BASE-COND_BR", "is_control_flow": true,
    "operands": [
      {"type_": "LABEL", "values": [], "src": true, "dest": false, "width": 0}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rip"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["r", "", "", "", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "jbe", "category": "BASE-COND_BR", "is_control_flow": true,
    "operands": [
      {"type_": "LABEL", "values": [], "src": true, "dest": false, "width": 0}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rip"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["r", "", "", "r", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "{disp32} jbe", "category": "BASE-COND_BR", "is_control_flow": true,
    "operands": [
      {"type_": "LABEL", "values": [], "src": true, "dest": false, "width": 0}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rip"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["r", "", "", "r", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "jl", "category": "BASE-COND_BR", "is_control_flow": true,
    "operands": [
      {"type_": "LABEL", "values": [], "src": true, "dest": false, "width": 0}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rip"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["", "", "", "", "r", "", "", "", "r"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "{disp32} jl", "category": "BASE-COND_BR", "is_control_flow": true,
    "operands": [
      {"type_": "LABEL", "values": [], "src": true, "dest": false, "width": 0}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rip"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["", "", "", "", "r", "", "", "", "r"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "jle", "category": "BASE-COND_BR", "is_control_flow": true,
    "operands": [
      {"type_": "LABEL", "values": [], "src": true, "dest": false, "width": 0}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rip"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["", "", "", "r", "r", "", "", "", "r"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "{disp32} jle", "category": "BASE-COND_BR", "is_control_flow": true,
    "operands": [
      {"type_": "LABEL", "values": [], "src": true, "dest": false, "width": 0}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rip"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["", "", "", "r", "r", "", "", "", "r"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "jmp", "category": "BASE-UNCOND_BR", "is_control_flow": true,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rip"], "src": false, "dest": true, "width": 64}
    ]
  },
  {"name": "jmp", "category": "BASE-UNCOND_BR", "is_control_flow": true,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rip"], "src": false, "dest": true, "width": 64}
    ]
  },
  {"name": "{disp32} jmp", "category": "BASE-UNCOND_BR", "is_control_flow": true,
    "operands": [
      {"type_": "LABEL", "values": [], "src": true, "dest": false, "width": 0}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rip"], "src": true, "dest": true, "width": 64}
    ]
  },
  {"name": "jmp", "category": "BASE-UNCOND_BR", "is_control_flow": true,
    "operands": [
      {"type_": "LABEL", "values": [], "src": true, "dest": false, "width": 0}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rip"], "src": true, "dest": true, "width": 64}
    ]
  },
  {"name": "jmp far", "category": "BASE-UNCOND_BR", "is_control_flow": true,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rip"], "src": false, "dest": true, "width": 64}
    ]
  },
  {"name": "jmp far", "category": "BASE-UNCOND_BR", "is_control_flow": true,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 48}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rip"], "src": false, "dest": true, "width": 64}
    ]
  },
  {"name": "jmp far", "category": "BASE-UNCOND_BR", "is_control_flow": true,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 80}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rip"], "src": false, "dest": true, "width": 64}
    ]
  },
  {"name": "jnb", "category": "BASE-COND_BR", "is_control_flow": true,
    "operands": [
      {"type_": "LABEL", "values": [], "src": true, "dest": false, "width": 0}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rip"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["r", "", "", "", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "{disp32} jnb", "category": "BASE-COND_BR", "is_control_flow": true,
    "operands": [
      {"type_": "LABEL", "values": [], "src": true, "dest": false, "width": 0}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rip"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["r", "", "", "", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "jnbe", "category": "BASE-COND_BR", "is_control_flow": true,
    "operands": [
      {"type_": "LABEL", "values": [], "src": true, "dest": false, "width": 0}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rip"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["r", "", "", "r", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "{disp32} jnbe", "category": "BASE-COND_BR", "is_control_flow": true,
    "operands": [
      {"type_": "LABEL", "values": [], "src": true, "dest": false, "width": 0}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rip"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["r", "", "", "r", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "jnl", "category": "BASE-COND_BR", "is_control_flow": true,
    "operands": [
      {"type_": "LABEL", "values": [], "src": true, "dest": false, "width": 0}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rip"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["", "", "", "", "r", "", "", "", "r"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "{disp32} jnl", "category": "BASE-COND_BR", "is_control_flow": true,
    "operands": [
      {"type_": "LABEL", "values": [], "src": true, "dest": false, "width": 0}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rip"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["", "", "", "", "r", "", "", "", "r"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "jnle", "category": "BASE-COND_BR", "is_control_flow": true,
    "operands": [
      {"type_": "LABEL", "values": [], "src": true, "dest": false, "width": 0}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rip"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["", "", "", "r", "r", "", "", "", "r"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "{disp32} jnle", "category": "BASE-COND_BR", "is_control_flow": true,
    "operands": [
      {"type_": "LABEL", "values": [], "src": true, "dest": false, "width": 0}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rip"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["", "", "", "r", "r", "", "", "", "r"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "jno", "category": "BASE-COND_BR", "is_control_flow": true,
    "operands": [
      {"type_": "LABEL", "values": [], "src": true, "dest": false, "width": 0}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rip"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["", "", "", "", "", "", "", "", "r"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "{disp32} jno", "category": "BASE-COND_BR", "is_control_flow": true,
    "operands": [
      {"type_": "LABEL", "values": [], "src": true, "dest": false, "width": 0}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rip"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["", "", "", "", "", "", "", "", "r"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "jnp", "category": "BASE-COND_BR", "is_control_flow": true,
    "operands": [
      {"type_": "LABEL", "values": [], "src": true, "dest": false, "width": 0}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rip"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["", "r", "", "", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "{disp32} jnp", "category": "BASE-COND_BR", "is_control_flow": true,
    "operands": [
      {"type_": "LABEL", "values": [], "src": true, "dest": false, "width": 0}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rip"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["", "r", "", "", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "jns", "category": "BASE-COND_BR", "is_control_flow": true,
    "operands": [
      {"type_": "LABEL", "values": [], "src": true, "dest": false, "width": 0}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rip"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["", "", "", "", "r", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "{disp32} jns", "category": "BASE-COND_BR", "is_control_flow": true,
    "operands": [
      {"type_": "LABEL", "values": [], "src": true, "dest": false, "width": 0}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rip"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["", "", "", "", "r", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "jnz", "category": "BASE-COND_BR", "is_control_flow": true,
    "operands": [
      {"type_": "LABEL", "values": [], "src": true, "dest": false, "width": 0}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rip"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["", "", "", "r", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "{disp32} jnz", "category": "BASE-COND_BR", "is_control_flow": true,
    "operands": [
      {"type_": "LABEL", "values": [], "src": true, "dest": false, "width": 0}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rip"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["", "", "", "r", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "jo", "category": "BASE-COND_BR", "is_control_flow": true,
    "operands": [
      {"type_": "LABEL", "values": [], "src": true, "dest": false, "width": 0}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rip"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["", "", "", "", "", "", "", "", "r"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "{disp32} jo", "category": "BASE-COND_BR", "is_control_flow": true,
    "operands": [
      {"type_": "LABEL", "values": [], "src": true, "dest": false, "width": 0}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rip"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["", "", "", "", "", "", "", "", "r"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "jp", "category": "BASE-COND_BR", "is_control_flow": true,
    "operands": [
      {"type_": "LABEL", "values": [], "src": true, "dest": false, "width": 0}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rip"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["", "r", "", "", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "{disp32} jp", "category": "BASE-COND_BR", "is_control_flow": true,
    "operands": [
      {"type_": "LABEL", "values": [], "src": true, "dest": false, "width": 0}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rip"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["", "r", "", "", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "jrcxz", "category": "BASE-COND_BR", "is_control_flow": true,
    "operands": [
      {"type_": "LABEL", "values": [], "src": true, "dest": false, "width": 0}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rcx"], "src": true, "dest": false, "width": 64},
      {"type_": "REG", "values": ["rip"], "src": true, "dest": true, "width": 64}
    ]
  },
  {"name": "js", "category": "BASE-COND_BR", "is_control_flow": true,
    "operands": [
      {"type_": "LABEL", "values": [], "src": true, "dest": false, "width": 0}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rip"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["", "", "", "", "r", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "{disp32} js", "category": "BASE-COND_BR", "is_control_flow": true,
    "operands": [
      {"type_": "LABEL", "values": [], "src": true, "dest": false, "width": 0}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rip"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["", "", "", "", "r", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "jz", "category": "BASE-COND_BR", "is_control_flow": true,
    "operands": [
      {"type_": "LABEL", "values": [], "src": true, "dest": false, "width": 0}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rip"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["", "", "", "r", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "{disp32} jz", "category": "BASE-COND_BR", "is_control_flow": true,
    "operands": [
      {"type_": "LABEL", "values": [], "src": true, "dest": false, "width": 0}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rip"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["", "", "", "r", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lahf", "category": "BASE-FLAGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["ah"], "src": false, "dest": true, "width": 8},
      {"type_": "FLAGS", "values": ["r", "r", "r", "r", "r", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": false, "dest": true, "width": 16},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": false, "dest": true, "width": 16},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": false, "dest": true, "width": 16},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": false, "dest": true, "width": 16},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": false, "dest": true, "width": 16},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": false, "dest": true, "width": 16},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": false, "dest": true, "width": 16},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": false, "dest": true, "width": 16},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": false, "dest": true, "width": 16},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": false, "dest": true, "width": 16},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": false, "dest": true, "width": 16},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": false, "dest": true, "width": 16},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": false, "dest": true, "width": 16},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": false, "dest": true, "width": 16},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": false, "dest": true, "width": 16},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": false, "dest": true, "width": 16},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": false, "dest": true, "width": 16},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": false, "dest": true, "width": 16},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": false, "dest": true, "width": 16},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": false, "dest": true, "width": 16},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lea", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "AGEN", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "leavew", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "MEM", "values": ["rbp"], "src": true, "dest": false, "width": 16},
      {"type_": "REG", "values": ["bp"], "src": true, "dest": true, "width": 16},
      {"type_": "REG", "values": ["sp"], "src": true, "dest": true, "width": 16}
    ]
  },
  {"name": "leave", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "MEM", "values": ["rbp"], "src": true, "dest": false, "width": 64},
      {"type_": "REG", "values": ["rbp"], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rsp"], "src": true, "dest": true, "width": 64}
    ]
  },
  {"name": "lfs", "category": "BASE-SEGOP", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": false, "dest": true, "width": 16},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["fs"], "src": false, "dest": true, "width": 16}
    ]
  },
  {"name": "lfs", "category": "BASE-SEGOP", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 48}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["fs"], "src": false, "dest": true, "width": 16}
    ]
  },
  {"name": "lfs", "category": "BASE-SEGOP", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 80}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["fs"], "src": false, "dest": true, "width": 16}
    ]
  },
  {"name": "lgs", "category": "BASE-SEGOP", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": false, "dest": true, "width": 16},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["gs"], "src": false, "dest": true, "width": 16}
    ]
  },
  {"name": "lgs", "category": "BASE-SEGOP", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 48}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["gs"], "src": false, "dest": true, "width": 16}
    ]
  },
  {"name": "lgs", "category": "BASE-SEGOP", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 80}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["gs"], "src": false, "dest": true, "width": 16}
    ]
  },
  {"name": "lodsb", "category": "BASE-STRINGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["al"], "src": false, "dest": true, "width": 8},
      {"type_": "MEM", "values": ["rsi"], "src": true, "dest": false, "width": 8},
      {"type_": "FLAGS", "values": ["", "", "", "", "", "", "", "r", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lodsd", "category": "BASE-STRINGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["eax"], "src": false, "dest": true, "width": 32},
      {"type_": "MEM", "values": ["rsi"], "src": true, "dest": false, "width": 32},
      {"type_": "FLAGS", "values": ["", "", "", "", "", "", "", "r", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lodsw", "category": "BASE-STRINGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["ax"], "src": false, "dest": true, "width": 16},
      {"type_": "MEM", "values": ["rsi"], "src": true, "dest": false, "width": 16},
      {"type_": "FLAGS", "values": ["", "", "", "", "", "", "", "r", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "loop", "category": "BASE-COND_BR", "is_control_flow": true,
    "operands": [
      {"type_": "LABEL", "values": [], "src": true, "dest": false, "width": 0}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rcx"], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rip"], "src": true, "dest": true, "width": 64}
    ]
  },
  {"name": "loope", "category": "BASE-COND_BR", "is_control_flow": true,
    "operands": [
      {"type_": "LABEL", "values": [], "src": true, "dest": false, "width": 0}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rcx"], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rip"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["", "", "", "r", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "loopne", "category": "BASE-COND_BR", "is_control_flow": true,
    "operands": [
      {"type_": "LABEL", "values": [], "src": true, "dest": false, "width": 0}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rcx"], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rip"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["", "", "", "r", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lss", "category": "BASE-SEGOP", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": false, "dest": true, "width": 16},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["ss"], "src": false, "dest": true, "width": 16}
    ]
  },
  {"name": "lss", "category": "BASE-SEGOP", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 48}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["ss"], "src": false, "dest": true, "width": 16}
    ]
  },
  {"name": "lss", "category": "BASE-SEGOP", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 80}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["ss"], "src": false, "dest": true, "width": 16}
    ]
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": false, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": false, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": false, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": false, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": false, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": []
  },
  {"name": "{load} mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": false, "dest": true, "width": 8},
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "{load} mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": false, "dest": true, "width": 8},
      {"type_": "REG", "values": ["al", "cl", "dl", "bl"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "{load} mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl"], "src": false, "dest": true, "width": 8},
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "{load} mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": false, "dest": true, "width": 8},
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": false, "dest": true, "width": 8},
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": false, "dest": true, "width": 8},
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": false, "dest": true, "width": 16},
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": false, "dest": true, "width": 32},
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": false, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "{load} mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": false, "dest": true, "width": 16},
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": []
  },
  {"name": "{load} mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": []
  },
  {"name": "{load} mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": false, "dest": true, "width": 8},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": false, "dest": true, "width": 8},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": false, "dest": true, "width": 8},
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": false, "dest": true, "width": 8},
      {"type_": "REG", "values": ["al", "cl", "dl", "bl"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl"], "src": false, "dest": true, "width": 8},
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": false, "dest": true, "width": 8},
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": false, "dest": true, "width": 16},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": false, "dest": true, "width": 16},
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": false, "dest": true, "width": 16},
      {"type_": "REG", "values": ["es", "cs", "ss", "ds", "fs", "gs"], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": false, "dest": true, "width": 16},
      {"type_": "REG", "values": ["es", "cs", "ss", "ds", "fs", "gs"], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "REG", "values": ["es", "cs", "ss", "ds", "fs", "gs"], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "REG", "values": ["es", "cs", "ss", "ds", "fs", "gs"], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["es", "ss", "ds", "fs", "gs"], "src": false, "dest": true, "width": 16},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["es", "ss", "ds", "fs", "gs"], "src": false, "dest": true, "width": 16},
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al"], "src": false, "dest": true, "width": 8, "magic": true},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax"], "src": false, "dest": true, "width": 16, "magic": true},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax"], "src": false, "dest": true, "width": 32, "magic": true},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax"], "src": false, "dest": true, "width": 64, "magic": true},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": false, "dest": true, "width": 8},
      {"type_": "REG", "values": ["al"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": false, "dest": true, "width": 16},
      {"type_": "REG", "values": ["ax"], "src": true, "dest": false, "width": 16, "magic": true}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": false, "dest": true, "width": 32},
      {"type_": "REG", "values": ["eax"], "src": true, "dest": false, "width": 32, "magic": true}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": false, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax"], "src": true, "dest": false, "width": 64, "magic": true}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": false, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": false, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": false, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": false, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": false, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "movsb", "category": "BASE-STRINGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "MEM", "values": ["rdi"], "src": false, "dest": true, "width": 8},
      {"type_": "MEM", "values": ["rsi"], "src": true, "dest": false, "width": 8},
      {"type_": "FLAGS", "values": ["", "", "", "", "", "", "", "r", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "movsd", "category": "BASE-STRINGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "MEM", "values": ["rdi"], "src": false, "dest": true, "width": 32},
      {"type_": "MEM", "values": ["rsi"], "src": true, "dest": false, "width": 32},
      {"type_": "FLAGS", "values": ["", "", "", "", "", "", "", "r", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "movsw", "category": "BASE-STRINGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "MEM", "values": ["rdi"], "src": false, "dest": true, "width": 16},
      {"type_": "MEM", "values": ["rsi"], "src": true, "dest": false, "width": 16},
      {"type_": "FLAGS", "values": ["", "", "", "", "", "", "", "r", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "movsx", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": false, "dest": true, "width": 16},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "movsx", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "movsx", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "movsx", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": false, "dest": true, "width": 16},
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "movsx", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di"], "src": false, "dest": true, "width": 16},
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "movsx", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "movsx", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi"], "src": false, "dest": true, "width": 32},
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "movsx", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "movsx", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": []
  },
  {"name": "movsx", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": []
  },
  {"name": "movsx", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": []
  },
  {"name": "movsx", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": []
  },
  {"name": "movzx", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": false, "dest": true, "width": 16},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "movzx", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "movzx", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "movzx", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": false, "dest": true, "width": 16},
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "movzx", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di"], "src": false, "dest": true, "width": 16},
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "movzx", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "movzx", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi"], "src": false, "dest": true, "width": 32},
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "movzx", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "movzx", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": []
  },
  {"name": "movzx", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": []
  },
  {"name": "movzx", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": false, "dest": true, "width": 32},
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": []
  },
  {"name": "movzx", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["cr0", "cr2", "cr3", "cr4", "cr8"], "src": false, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "REG", "values": ["cr0", "cr2", "cr3", "cr4", "cr8"], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["dr0", "dr1", "dr2", "dr3", "dr4", "dr5", "dr6", "dr7"], "src": false, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "mov", "category": "BASE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "REG", "values": ["dr0", "dr1", "dr2", "dr3", "dr4", "dr5", "dr6", "dr7"], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "mul", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["al"], "src": true, "dest": false, "width": 8},
      {"type_": "REG", "values": ["ax"], "src": false, "dest": true, "width": 16},
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "undef", "undef", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "mul", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["al"], "src": true, "dest": false, "width": 8},
      {"type_": "REG", "values": ["ax"], "src": false, "dest": true, "width": 16},
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "undef", "undef", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "mul", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["al"], "src": true, "dest": false, "width": 8},
      {"type_": "REG", "values": ["ax"], "src": false, "dest": true, "width": 16},
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "undef", "undef", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "mul", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["ax"], "src": true, "dest": true, "width": 16},
      {"type_": "REG", "values": ["dx"], "src": false, "dest": true, "width": 16},
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "undef", "undef", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "mul", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["eax"], "src": true, "dest": true, "width": 32},
      {"type_": "REG", "values": ["edx"], "src": false, "dest": true, "width": 32},
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "undef", "undef", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "mul", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rax"], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rdx"], "src": false, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "undef", "undef", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "mul", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["ax"], "src": true, "dest": true, "width": 16},
      {"type_": "REG", "values": ["dx"], "src": false, "dest": true, "width": 16},
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "undef", "undef", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "mul", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["eax"], "src": true, "dest": true, "width": 32},
      {"type_": "REG", "values": ["edx"], "src": false, "dest": true, "width": 32},
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "undef", "undef", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "mul", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rax"], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rdx"], "src": false, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["w", "undef", "undef", "undef", "undef", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "neg", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "neg", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "neg", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "neg", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "neg", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "neg", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "neg", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "neg", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "neg", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock neg", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock neg", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock neg", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock neg", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "nop", "category": "BASE-NOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": []
  },
  {"name": "nop", "category": "BASE-WIDENOP", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": []
  },
  {"name": "nop", "category": "BASE-WIDENOP", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": []
  },
  {"name": "nop", "category": "BASE-WIDENOP", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "nop", "category": "BASE-WIDENOP", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": []
  },
  {"name": "nop", "category": "BASE-WIDENOP", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": []
  },
  {"name": "nop", "category": "BASE-WIDENOP", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "not", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "not", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": true, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "not", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "not", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16}
    ],
    "implicit_operands": []
  },
  {"name": "not", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32}
    ],
    "implicit_operands": []
  },
  {"name": "not", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "not", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16}
    ],
    "implicit_operands": []
  },
  {"name": "not", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32}
    ],
    "implicit_operands": []
  },
  {"name": "not", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "lock not", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "lock not", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16}
    ],
    "implicit_operands": []
  },
  {"name": "lock not", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32}
    ],
    "implicit_operands": []
  },
  {"name": "lock not", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64}
    ],
    "implicit_operands": []
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "r8b", "r9b", "r10b", "r11b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "r8b", "r9b", "r10b", "r11b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["spl", "bpl", "sil", "dil", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["spl", "bpl", "sil", "dil", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "{load} or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": true, "width": 8},
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "{load} or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8},
      {"type_": "REG", "values": ["al", "cl", "dl", "bl"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "{load} or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl"], "src": true, "dest": true, "width": 8},
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "{load} or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8},
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "{load} or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "{load} or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "{load} or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": true, "width": 8},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": true, "width": 8},
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8},
      {"type_": "REG", "values": ["al", "cl", "dl", "bl"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl"], "src": true, "dest": true, "width": 8},
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8},
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al"], "src": true, "dest": true, "width": 8, "magic": true},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al"], "src": true, "dest": true, "width": 8, "magic": true},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax"], "src": true, "dest": true, "width": 16, "magic": true},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax"], "src": true, "dest": true, "width": 32, "magic": true},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax"], "src": true, "dest": true, "width": 64, "magic": true},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock or", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "pop", "category": "BASE-POP", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": false, "dest": true, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rsp"], "src": true, "dest": true, "width": 64},
      {"type_": "MEM", "values": ["rsp"], "src": true, "dest": false, "width": 16}
    ]
  },
  {"name": "pop", "category": "BASE-POP", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": false, "dest": true, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rsp"], "src": true, "dest": true, "width": 64},
      {"type_": "MEM", "values": ["rsp"], "src": true, "dest": false, "width": 64}
    ]
  },
  {"name": "pop", "category": "BASE-POP", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": false, "dest": true, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rsp"], "src": true, "dest": true, "width": 64},
      {"type_": "MEM", "values": ["rsp"], "src": true, "dest": false, "width": 16}
    ]
  },
  {"name": "pop", "category": "BASE-POP", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rsp"], "src": true, "dest": true, "width": 64},
      {"type_": "MEM", "values": ["rsp"], "src": true, "dest": false, "width": 64}
    ]
  },
  {"name": "popw", "category": "BASE-POP", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["fs"], "src": false, "dest": true, "width": 16, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rsp"], "src": true, "dest": true, "width": 64},
      {"type_": "MEM", "values": ["rsp"], "src": true, "dest": false, "width": 16}
    ]
  },
  {"name": "pop", "category": "BASE-POP", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["fs"], "src": false, "dest": true, "width": 16, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rsp"], "src": true, "dest": true, "width": 64},
      {"type_": "MEM", "values": ["rsp"], "src": true, "dest": false, "width": 64}
    ]
  },
  {"name": "popw", "category": "BASE-POP", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["gs"], "src": false, "dest": true, "width": 16, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rsp"], "src": true, "dest": true, "width": 64},
      {"type_": "MEM", "values": ["rsp"], "src": true, "dest": false, "width": 16}
    ]
  },
  {"name": "pop", "category": "BASE-POP", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["gs"], "src": false, "dest": true, "width": 16, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rsp"], "src": true, "dest": true, "width": 64},
      {"type_": "MEM", "values": ["rsp"], "src": true, "dest": false, "width": 64}
    ]
  },
  {"name": "popfw", "category": "BASE-POP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rsp"], "src": true, "dest": true, "width": 64},
      {"type_": "MEM", "values": ["rsp"], "src": true, "dest": false, "width": 16},
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "w", "w", "w", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "push", "category": "BASE-PUSH", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rsp"], "src": true, "dest": true, "width": 64},
      {"type_": "MEM", "values": ["rsp"], "src": false, "dest": true, "width": 16}
    ]
  },
  {"name": "push", "category": "BASE-PUSH", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rsp"], "src": true, "dest": true, "width": 64},
      {"type_": "MEM", "values": ["rsp"], "src": false, "dest": true, "width": 64}
    ]
  },
  {"name": "push", "category": "BASE-PUSH", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rsp"], "src": true, "dest": true, "width": 64},
      {"type_": "MEM", "values": ["rsp"], "src": false, "dest": true, "width": 16}
    ]
  },
  {"name": "push", "category": "BASE-PUSH", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rsp"], "src": true, "dest": true, "width": 64},
      {"type_": "MEM", "values": ["rsp"], "src": false, "dest": true, "width": 64}
    ]
  },
  {"name": "pushw", "category": "BASE-PUSH", "is_control_flow": false,
    "operands": [
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rsp"], "src": true, "dest": true, "width": 64},
      {"type_": "MEM", "values": ["rsp"], "src": false, "dest": true, "width": 16}
    ]
  },
  {"name": "push", "category": "BASE-PUSH", "is_control_flow": false,
    "operands": [
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rsp"], "src": true, "dest": true, "width": 64},
      {"type_": "MEM", "values": ["rsp"], "src": false, "dest": true, "width": 64}
    ]
  },
  {"name": "pushw", "category": "BASE-PUSH", "is_control_flow": false,
    "operands": [
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rsp"], "src": true, "dest": true, "width": 64},
      {"type_": "MEM", "values": ["rsp"], "src": false, "dest": true, "width": 16}
    ]
  },
  {"name": "pushw", "category": "BASE-PUSH", "is_control_flow": false,
    "operands": [
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rsp"], "src": true, "dest": true, "width": 64},
      {"type_": "MEM", "values": ["rsp"], "src": false, "dest": true, "width": 16}
    ]
  },
  {"name": "push", "category": "BASE-PUSH", "is_control_flow": false,
    "operands": [
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rsp"], "src": true, "dest": true, "width": 64},
      {"type_": "MEM", "values": ["rsp"], "src": false, "dest": true, "width": 64}
    ]
  },
  {"name": "push", "category": "BASE-PUSH", "is_control_flow": false,
    "operands": [
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rsp"], "src": true, "dest": true, "width": 64},
      {"type_": "MEM", "values": ["rsp"], "src": false, "dest": true, "width": 64}
    ]
  },
  {"name": "pushw", "category": "BASE-PUSH", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["fs"], "src": true, "dest": false, "width": 16, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rsp"], "src": true, "dest": true, "width": 64},
      {"type_": "MEM", "values": ["rsp"], "src": false, "dest": true, "width": 16}
    ]
  },
  {"name": "push", "category": "BASE-PUSH", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["fs"], "src": true, "dest": false, "width": 16, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rsp"], "src": true, "dest": true, "width": 64},
      {"type_": "MEM", "values": ["rsp"], "src": false, "dest": true, "width": 64}
    ]
  },
  {"name": "pushw", "category": "BASE-PUSH", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["gs"], "src": true, "dest": false, "width": 16, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rsp"], "src": true, "dest": true, "width": 64},
      {"type_": "MEM", "values": ["rsp"], "src": false, "dest": true, "width": 16}
    ]
  },
  {"name": "push", "category": "BASE-PUSH", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["gs"], "src": true, "dest": false, "width": 16, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rsp"], "src": true, "dest": true, "width": 64},
      {"type_": "MEM", "values": ["rsp"], "src": false, "dest": true, "width": 64}
    ]
  },
  {"name": "pushfw", "category": "BASE-PUSH", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rsp"], "src": true, "dest": true, "width": 64},
      {"type_": "MEM", "values": ["rsp"], "src": false, "dest": true, "width": 16},
      {"type_": "FLAGS", "values": ["r", "r", "r", "r", "r", "r", "r", "r", "r"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rcl", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "rcl", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "", "", "", "", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rcl", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "r8b", "r9b", "r10b", "r11b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "rcl", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "r8b", "r9b", "r10b", "r11b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "", "", "", "", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rcl", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["spl", "bpl", "sil", "dil", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "rcl", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["spl", "bpl", "sil", "dil", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "", "", "", "", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rcl", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "rcl", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "", "", "", "", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rcl", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "rcl", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "", "", "", "", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rcl", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "rcl", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "", "", "", "", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rcl", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "rcl", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "", "", "", "", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rcl", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "rcl", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "", "", "", "", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rcl", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "rcl", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "", "", "", "", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rcl", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "rcl", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "", "", "", "", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rcl", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "", "", "", "", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rcl", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "r8b", "r9b", "r10b", "r11b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "", "", "", "", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rcl", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["spl", "bpl", "sil", "dil", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "", "", "", "", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rcl", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "", "", "", "", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rcl", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "", "", "", "", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rcl", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "", "", "", "", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rcl", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "", "", "", "", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rcl", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "", "", "", "", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rcl", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "", "", "", "", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rcl", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "", "", "", "", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rcr", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "rcr", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "", "", "", "", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rcr", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "r8b", "r9b", "r10b", "r11b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "rcr", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "r8b", "r9b", "r10b", "r11b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "", "", "", "", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rcr", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["spl", "bpl", "sil", "dil", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "rcr", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["spl", "bpl", "sil", "dil", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "", "", "", "", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rcr", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "rcr", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "", "", "", "", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rcr", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "rcr", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "", "", "", "", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rcr", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "rcr", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "", "", "", "", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rcr", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "rcr", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "", "", "", "", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rcr", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "rcr", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "", "", "", "", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rcr", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "rcr", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "", "", "", "", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rcr", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "rcr", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "", "", "", "", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rcr", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "", "", "", "", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rcr", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "r8b", "r9b", "r10b", "r11b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "", "", "", "", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rcr", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["spl", "bpl", "sil", "dil", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "", "", "", "", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rcr", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "", "", "", "", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rcr", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "", "", "", "", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rcr", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "", "", "", "", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rcr", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "", "", "", "", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rcr", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "", "", "", "", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rcr", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "", "", "", "", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rcr", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r/w", "", "", "", "", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "repe cmpsb", "category": "BASE-STRINGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "MEM", "values": ["rsi"], "src": true, "dest": false, "width": 8},
      {"type_": "MEM", "values": ["rdi"], "src": true, "dest": false, "width": 8},
      {"type_": "REG", "values": ["rcx"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["cw", "cw", "cw", "r/cw", "cw", "", "", "r", "cw"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "repe cmpsd", "category": "BASE-STRINGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "MEM", "values": ["rsi"], "src": true, "dest": false, "width": 32},
      {"type_": "MEM", "values": ["rdi"], "src": true, "dest": false, "width": 32},
      {"type_": "REG", "values": ["rcx"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["cw", "cw", "cw", "r/cw", "cw", "", "", "r", "cw"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "repe cmpsw", "category": "BASE-STRINGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "MEM", "values": ["rsi"], "src": true, "dest": false, "width": 16},
      {"type_": "MEM", "values": ["rdi"], "src": true, "dest": false, "width": 16},
      {"type_": "REG", "values": ["rcx"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["cw", "cw", "cw", "r/cw", "cw", "", "", "r", "cw"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "repe scasb", "category": "BASE-STRINGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["al"], "src": true, "dest": false, "width": 8},
      {"type_": "MEM", "values": ["rdi"], "src": true, "dest": false, "width": 8},
      {"type_": "REG", "values": ["rcx"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["cw", "cw", "cw", "r/cw", "cw", "", "", "r", "cw"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "repe scasd", "category": "BASE-STRINGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["eax"], "src": true, "dest": false, "width": 32},
      {"type_": "MEM", "values": ["rdi"], "src": true, "dest": false, "width": 32},
      {"type_": "REG", "values": ["rcx"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["cw", "cw", "cw", "r/cw", "cw", "", "", "r", "cw"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "repe scasw", "category": "BASE-STRINGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["ax"], "src": true, "dest": false, "width": 16},
      {"type_": "MEM", "values": ["rdi"], "src": true, "dest": false, "width": 16},
      {"type_": "REG", "values": ["rcx"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["cw", "cw", "cw", "r/cw", "cw", "", "", "r", "cw"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "repne cmpsb", "category": "BASE-STRINGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "MEM", "values": ["rsi"], "src": true, "dest": false, "width": 8},
      {"type_": "MEM", "values": ["rdi"], "src": true, "dest": false, "width": 8},
      {"type_": "REG", "values": ["rcx"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["cw", "cw", "cw", "r/cw", "cw", "", "", "r", "cw"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "repne cmpsd", "category": "BASE-STRINGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "MEM", "values": ["rsi"], "src": true, "dest": false, "width": 32},
      {"type_": "MEM", "values": ["rdi"], "src": true, "dest": false, "width": 32},
      {"type_": "REG", "values": ["rcx"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["cw", "cw", "cw", "r/cw", "cw", "", "", "r", "cw"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "repne cmpsw", "category": "BASE-STRINGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "MEM", "values": ["rsi"], "src": true, "dest": false, "width": 16},
      {"type_": "MEM", "values": ["rdi"], "src": true, "dest": false, "width": 16},
      {"type_": "REG", "values": ["rcx"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["cw", "cw", "cw", "r/cw", "cw", "", "", "r", "cw"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "repne scasb", "category": "BASE-STRINGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["al"], "src": true, "dest": false, "width": 8},
      {"type_": "MEM", "values": ["rdi"], "src": true, "dest": false, "width": 8},
      {"type_": "REG", "values": ["rcx"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["cw", "cw", "cw", "r/cw", "cw", "", "", "r", "cw"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "repne scasd", "category": "BASE-STRINGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["eax"], "src": true, "dest": false, "width": 32},
      {"type_": "MEM", "values": ["rdi"], "src": true, "dest": false, "width": 32},
      {"type_": "REG", "values": ["rcx"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["cw", "cw", "cw", "r/cw", "cw", "", "", "r", "cw"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "repne scasw", "category": "BASE-STRINGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["ax"], "src": true, "dest": false, "width": 16},
      {"type_": "MEM", "values": ["rdi"], "src": true, "dest": false, "width": 16},
      {"type_": "REG", "values": ["rcx"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["cw", "cw", "cw", "r/cw", "cw", "", "", "r", "cw"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "repe lodsb", "category": "BASE-STRINGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["al"], "src": false, "dest": true, "width": 8},
      {"type_": "MEM", "values": ["rsi"], "src": true, "dest": false, "width": 8},
      {"type_": "REG", "values": ["rcx"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["", "", "", "", "", "", "", "r", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "repne lodsb", "category": "BASE-STRINGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["al"], "src": false, "dest": true, "width": 8},
      {"type_": "MEM", "values": ["rsi"], "src": true, "dest": false, "width": 8},
      {"type_": "REG", "values": ["rcx"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["", "", "", "", "", "", "", "r", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "repe lodsd", "category": "BASE-STRINGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["eax"], "src": false, "dest": true, "width": 32},
      {"type_": "MEM", "values": ["rsi"], "src": true, "dest": false, "width": 32},
      {"type_": "REG", "values": ["rcx"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["", "", "", "", "", "", "", "r", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "repne lodsd", "category": "BASE-STRINGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["eax"], "src": false, "dest": true, "width": 32},
      {"type_": "MEM", "values": ["rsi"], "src": true, "dest": false, "width": 32},
      {"type_": "REG", "values": ["rcx"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["", "", "", "", "", "", "", "r", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "repe lodsw", "category": "BASE-STRINGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["ax"], "src": false, "dest": true, "width": 16},
      {"type_": "MEM", "values": ["rsi"], "src": true, "dest": false, "width": 16},
      {"type_": "REG", "values": ["rcx"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["", "", "", "", "", "", "", "r", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "repne lodsw", "category": "BASE-STRINGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["ax"], "src": false, "dest": true, "width": 16},
      {"type_": "MEM", "values": ["rsi"], "src": true, "dest": false, "width": 16},
      {"type_": "REG", "values": ["rcx"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["", "", "", "", "", "", "", "r", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "repe movsb", "category": "BASE-STRINGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "MEM", "values": ["rdi"], "src": false, "dest": true, "width": 8},
      {"type_": "MEM", "values": ["rsi"], "src": true, "dest": false, "width": 8},
      {"type_": "REG", "values": ["rcx"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["", "", "", "", "", "", "", "r", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "repne movsb", "category": "BASE-STRINGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "MEM", "values": ["rdi"], "src": false, "dest": true, "width": 8},
      {"type_": "MEM", "values": ["rsi"], "src": true, "dest": false, "width": 8},
      {"type_": "REG", "values": ["rcx"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["", "", "", "", "", "", "", "r", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "repe movsd", "category": "BASE-STRINGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "MEM", "values": ["rdi"], "src": false, "dest": true, "width": 32},
      {"type_": "MEM", "values": ["rsi"], "src": true, "dest": false, "width": 32},
      {"type_": "REG", "values": ["rcx"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["", "", "", "", "", "", "", "r", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "repne movsd", "category": "BASE-STRINGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "MEM", "values": ["rdi"], "src": false, "dest": true, "width": 32},
      {"type_": "MEM", "values": ["rsi"], "src": true, "dest": false, "width": 32},
      {"type_": "REG", "values": ["rcx"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["", "", "", "", "", "", "", "r", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "repe movsw", "category": "BASE-STRINGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "MEM", "values": ["rdi"], "src": false, "dest": true, "width": 16},
      {"type_": "MEM", "values": ["rsi"], "src": true, "dest": false, "width": 16},
      {"type_": "REG", "values": ["rcx"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["", "", "", "", "", "", "", "r", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "repne movsw", "category": "BASE-STRINGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "MEM", "values": ["rdi"], "src": false, "dest": true, "width": 16},
      {"type_": "MEM", "values": ["rsi"], "src": true, "dest": false, "width": 16},
      {"type_": "REG", "values": ["rcx"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["", "", "", "", "", "", "", "r", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "repe stosb", "category": "BASE-STRINGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "MEM", "values": ["rdi"], "src": false, "dest": true, "width": 8},
      {"type_": "REG", "values": ["al"], "src": true, "dest": false, "width": 8},
      {"type_": "REG", "values": ["rcx"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["", "", "", "", "", "", "", "r", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "repne stosb", "category": "BASE-STRINGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "MEM", "values": ["rdi"], "src": false, "dest": true, "width": 8},
      {"type_": "REG", "values": ["al"], "src": true, "dest": false, "width": 8},
      {"type_": "REG", "values": ["rcx"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["", "", "", "", "", "", "", "r", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "repe stosd", "category": "BASE-STRINGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "MEM", "values": ["rdi"], "src": false, "dest": true, "width": 32},
      {"type_": "REG", "values": ["eax"], "src": true, "dest": false, "width": 32},
      {"type_": "REG", "values": ["rcx"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["", "", "", "", "", "", "", "r", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "repne stosd", "category": "BASE-STRINGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "MEM", "values": ["rdi"], "src": false, "dest": true, "width": 32},
      {"type_": "REG", "values": ["eax"], "src": true, "dest": false, "width": 32},
      {"type_": "REG", "values": ["rcx"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["", "", "", "", "", "", "", "r", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "repe stosw", "category": "BASE-STRINGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "MEM", "values": ["rdi"], "src": false, "dest": true, "width": 16},
      {"type_": "REG", "values": ["ax"], "src": true, "dest": false, "width": 16},
      {"type_": "REG", "values": ["rcx"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["", "", "", "", "", "", "", "r", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "repne stosw", "category": "BASE-STRINGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "MEM", "values": ["rdi"], "src": false, "dest": true, "width": 16},
      {"type_": "REG", "values": ["ax"], "src": true, "dest": false, "width": 16},
      {"type_": "REG", "values": ["rcx"], "src": true, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["", "", "", "", "", "", "", "r", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "retfw", "category": "BASE-RET", "is_control_flow": true,
    "operands": [
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rsp"], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rip"], "src": false, "dest": true, "width": 64},
      {"type_": "MEM", "values": ["rsp"], "src": true, "dest": false, "width": 32}
    ]
  },
  {"name": "retf", "category": "BASE-RET", "is_control_flow": true,
    "operands": [
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rsp"], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rip"], "src": false, "dest": true, "width": 64},
      {"type_": "MEM", "values": ["rsp"], "src": true, "dest": false, "width": 64}
    ]
  },
  {"name": "retfq", "category": "BASE-RET", "is_control_flow": true,
    "operands": [
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rsp"], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rip"], "src": false, "dest": true, "width": 64},
      {"type_": "MEM", "values": ["rsp"], "src": true, "dest": false, "width": 128}
    ]
  },
  {"name": "retfw", "category": "BASE-RET", "is_control_flow": true,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rsp"], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rip"], "src": false, "dest": true, "width": 64},
      {"type_": "MEM", "values": ["rsp"], "src": true, "dest": false, "width": 32}
    ]
  },
  {"name": "retf", "category": "BASE-RET", "is_control_flow": true,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rsp"], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rip"], "src": false, "dest": true, "width": 64},
      {"type_": "MEM", "values": ["rsp"], "src": true, "dest": false, "width": 64}
    ]
  },
  {"name": "retfq", "category": "BASE-RET", "is_control_flow": true,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rsp"], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rip"], "src": false, "dest": true, "width": 64},
      {"type_": "MEM", "values": ["rsp"], "src": true, "dest": false, "width": 128}
    ]
  },
  {"name": "ret", "category": "BASE-RET", "is_control_flow": true,
    "operands": [
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rsp"], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rip"], "src": false, "dest": true, "width": 64},
      {"type_": "MEM", "values": ["rsp"], "src": true, "dest": false, "width": 64}
    ]
  },
  {"name": "ret", "category": "BASE-RET", "is_control_flow": true,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rsp"], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rip"], "src": false, "dest": true, "width": 64},
      {"type_": "MEM", "values": ["rsp"], "src": true, "dest": false, "width": 64}
    ]
  },
  {"name": "rol", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "rol", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "", "", "", "", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rol", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "r8b", "r9b", "r10b", "r11b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "rol", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "r8b", "r9b", "r10b", "r11b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "", "", "", "", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rol", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["spl", "bpl", "sil", "dil", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "rol", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["spl", "bpl", "sil", "dil", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "", "", "", "", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rol", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "rol", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "", "", "", "", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rol", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "rol", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "", "", "", "", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rol", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "rol", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "", "", "", "", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rol", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "rol", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "", "", "", "", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rol", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "rol", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "", "", "", "", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rol", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "rol", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "", "", "", "", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rol", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "rol", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "", "", "", "", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rol", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "", "", "", "", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rol", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "r8b", "r9b", "r10b", "r11b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "", "", "", "", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rol", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["spl", "bpl", "sil", "dil", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "", "", "", "", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rol", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "", "", "", "", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rol", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "", "", "", "", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rol", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "", "", "", "", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rol", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "", "", "", "", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rol", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "", "", "", "", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rol", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "", "", "", "", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rol", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "", "", "", "", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "ror", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "ror", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "", "", "", "", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "ror", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "r8b", "r9b", "r10b", "r11b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "ror", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "r8b", "r9b", "r10b", "r11b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "", "", "", "", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "ror", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["spl", "bpl", "sil", "dil", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "ror", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["spl", "bpl", "sil", "dil", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "", "", "", "", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "ror", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "ror", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "", "", "", "", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "ror", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "ror", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "", "", "", "", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "ror", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "ror", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "", "", "", "", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "ror", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "ror", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "", "", "", "", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "ror", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "ror", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "", "", "", "", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "ror", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "ror", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "", "", "", "", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "ror", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "ror", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "", "", "", "", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "ror", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "", "", "", "", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "ror", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "r8b", "r9b", "r10b", "r11b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "", "", "", "", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "ror", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["spl", "bpl", "sil", "dil", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "", "", "", "", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "ror", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "", "", "", "", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "ror", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "", "", "", "", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "ror", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "", "", "", "", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "ror", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "", "", "", "", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "ror", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "", "", "", "", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "ror", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "", "", "", "", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "ror", "category": "BASE-ROTATE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "", "", "", "", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "rsm", "category": "BASE-SYSRET", "is_control_flow": true,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["rip"], "src": false, "dest": true, "width": 64},
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "w", "w", "w", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sahf", "category": "BASE-FLAGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "REG", "values": ["ah"], "src": true, "dest": false, "width": 8},
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sar", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "sar", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sar", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "r8b", "r9b", "r10b", "r11b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "sar", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "r8b", "r9b", "r10b", "r11b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sar", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["spl", "bpl", "sil", "dil", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": []
  },
  {"name": "sar", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["spl", "bpl", "sil", "dil", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sar", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "sar", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sar", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "sar", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sar", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "sar", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sar", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "sar", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sar", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "sar", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sar", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "sar", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sar", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "sar", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sar", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sar", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "r8b", "r9b", "r10b", "r11b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sar", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["spl", "bpl", "sil", "dil", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sar", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sar", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sar", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sar", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sar", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sar", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sar", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "setb", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r", "", "", "", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "setb", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r", "", "", "", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "setb", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r", "", "", "", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "setbe", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r", "", "", "r", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "setbe", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r", "", "", "r", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "setbe", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r", "", "", "r", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "setl", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "", "", "", "r", "", "", "", "r"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "setl", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "", "", "", "r", "", "", "", "r"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "setl", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "", "", "", "r", "", "", "", "r"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "setle", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "", "", "r", "r", "", "", "", "r"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "setle", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "", "", "r", "r", "", "", "", "r"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "setle", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "", "", "r", "r", "", "", "", "r"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "setnb", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r", "", "", "", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "setnb", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r", "", "", "", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "setnb", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r", "", "", "", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "setnbe", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r", "", "", "r", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "setnbe", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r", "", "", "r", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "setnbe", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["r", "", "", "r", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "setnl", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "", "", "", "r", "", "", "", "r"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "setnl", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "", "", "", "r", "", "", "", "r"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "setnl", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "", "", "", "r", "", "", "", "r"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "setnle", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "", "", "r", "r", "", "", "", "r"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "setnle", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "", "", "r", "r", "", "", "", "r"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "setnle", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "", "", "r", "r", "", "", "", "r"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "setno", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "", "", "", "", "", "", "", "r"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "setno", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "", "", "", "", "", "", "", "r"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "setno", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "", "", "", "", "", "", "", "r"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "setnp", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "r", "", "", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "setnp", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "r", "", "", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "setnp", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "r", "", "", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "setns", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "", "", "", "r", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "setns", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "", "", "", "r", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "setns", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "", "", "", "r", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "setnz", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "", "", "r", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "setnz", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "", "", "r", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "setnz", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "", "", "r", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "seto", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "", "", "", "", "", "", "", "r"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "seto", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "", "", "", "", "", "", "", "r"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "seto", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "", "", "", "", "", "", "", "r"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "setp", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "r", "", "", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "setp", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "r", "", "", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "setp", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "r", "", "", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sets", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "", "", "", "r", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sets", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "", "", "", "r", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sets", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "", "", "", "r", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "setz", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "", "", "r", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "setz", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "", "", "r", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "setz", "category": "BASE-SETCC", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": false, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "", "", "r", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shl", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "shl", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shl", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "r8b", "r9b", "r10b", "r11b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "shl", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "r8b", "r9b", "r10b", "r11b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shl", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["spl", "bpl", "sil", "dil", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "shl", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["spl", "bpl", "sil", "dil", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shl", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "shl", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shl", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "shl", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shl", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "shl", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shl", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "shl", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shl", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "shl", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shl", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "shl", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shl", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "shl", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shl", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shl", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "r8b", "r9b", "r10b", "r11b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shl", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["spl", "bpl", "sil", "dil", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shl", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shl", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shl", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shl", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shl", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shl", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shl", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shld", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "shld", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shld", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "shld", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shld", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "shld", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shld", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "shld", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shld", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "shld", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shld", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "shld", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shr", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "shr", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shr", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "r8b", "r9b", "r10b", "r11b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "shr", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "r8b", "r9b", "r10b", "r11b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shr", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["spl", "bpl", "sil", "dil", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "shr", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["spl", "bpl", "sil", "dil", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shr", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "shr", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shr", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "shr", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shr", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "shr", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shr", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "shr", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shr", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "shr", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shr", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "shr", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shr", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "shr", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shr", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shr", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "r8b", "r9b", "r10b", "r11b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shr", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["spl", "bpl", "sil", "dil", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shr", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shr", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shr", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shr", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shr", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shr", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shr", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": ["1"], "src": true, "dest": false, "width": 8, "magic": true}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shrd", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "shrd", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shrd", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "shrd", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shrd", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "shrd", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shrd", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "shrd", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shrd", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "shrd", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "shrd", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": []
  },
  {"name": "shrd", "category": "BASE-SHIFT", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8, "is_signed": false}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "undef"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "stc", "category": "BASE-FLAGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "", "", "", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "std", "category": "BASE-FLAGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "", "", "", "", "", "", "w", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sti", "category": "BASE-FLAGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "", "", "", "", "", "w", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "stosb", "category": "BASE-STRINGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "MEM", "values": ["rdi"], "src": false, "dest": true, "width": 8},
      {"type_": "REG", "values": ["al"], "src": true, "dest": false, "width": 8},
      {"type_": "FLAGS", "values": ["", "", "", "", "", "", "", "r", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "stosd", "category": "BASE-STRINGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "MEM", "values": ["rdi"], "src": false, "dest": true, "width": 32},
      {"type_": "REG", "values": ["eax"], "src": true, "dest": false, "width": 32},
      {"type_": "FLAGS", "values": ["", "", "", "", "", "", "", "r", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "stosw", "category": "BASE-STRINGOP", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": [
      {"type_": "MEM", "values": ["rdi"], "src": false, "dest": true, "width": 16},
      {"type_": "REG", "values": ["ax"], "src": true, "dest": false, "width": 16},
      {"type_": "FLAGS", "values": ["", "", "", "", "", "", "", "r", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "r8b", "r9b", "r10b", "r11b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "r8b", "r9b", "r10b", "r11b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["spl", "bpl", "sil", "dil", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["spl", "bpl", "sil", "dil", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "{load} sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": true, "width": 8},
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "{load} sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8},
      {"type_": "REG", "values": ["al", "cl", "dl", "bl"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "{load} sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl"], "src": true, "dest": true, "width": 8},
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "{load} sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8},
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "{load} sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "{load} sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "{load} sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": true, "width": 8},
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8},
      {"type_": "REG", "values": ["al", "cl", "dl", "bl"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl"], "src": true, "dest": true, "width": 8},
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8},
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": true, "width": 8},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al"], "src": true, "dest": true, "width": 8, "magic": true},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al"], "src": true, "dest": true, "width": 8, "magic": true},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax"], "src": true, "dest": true, "width": 16, "magic": true},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax"], "src": true, "dest": true, "width": 32, "magic": true},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax"], "src": true, "dest": true, "width": 64, "magic": true},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock sub", "category": "BASE-BINARY", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "test", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32},
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "test", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "test", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al"], "src": true, "dest": false, "width": 8, "magic": true},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "test", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al"], "src": true, "dest": false, "width": 8, "magic": true},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "test", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ax"], "src": true, "dest": false, "width": 16, "magic": true},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "test", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["eax"], "src": true, "dest": false, "width": 32, "magic": true},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "test", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax"], "src": true, "dest": false, "width": 64, "magic": true},
      {"type_": "IMM", "values": [], "src": true, "dest": false, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "ud2", "category": "BASE-MISC", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": []
  },
  {"name": "xadd", "category": "BASE-SEMAPHORE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "xadd", "category": "BASE-SEMAPHORE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 8},
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "xadd", "category": "BASE-SEMAPHORE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": true, "width": 8},
      {"type_": "REG", "values": ["al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil", "r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"], "src": true, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "xadd", "category": "BASE-SEMAPHORE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8},
      {"type_": "REG", "values": ["al", "cl", "dl", "bl"], "src": true, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "xadd", "category": "BASE-SEMAPHORE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["al", "cl", "dl", "bl"], "src": true, "dest": true, "width": 8},
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "xadd", "category": "BASE-SEMAPHORE", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8},
      {"type_": "REG", "values": ["ah", "ch", "dh", "bh"], "src": true, "dest": true, "width": 8}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "xadd", "category": "BASE-SEMAPHORE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 16},
      {"type_": "REG", "values": ["ax", "cx", "dx", "bx", "sp", "bp", "si", "di", "r8w", "r9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"], "src": true, "dest": true, "width": 16}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "xadd", "category": "BASE-SEMAPHORE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 32},
      {"type_": "REG", "values": ["eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi", "r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"], "src": true, "dest": true, "width": 32}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "xadd", "category": "BASE-SEMAPHORE", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "w", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lock xor", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "xor", "category": "BASE-LOGICAL", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["w", "w", "undef", "w", "w", "", "", "", "w"], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "lfence", "category": "SSE2-MISC", "is_control_flow": false,
    "operands": [

    ],
    "implicit_operands": []
  },
  {"name": "cmovz", "category": "BASE-CMOV", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "", "", "r", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "cmovnz", "category": "BASE-CMOV", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": false, "dest": true, "width": 64},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": [
      {"type_": "FLAGS", "values": ["", "", "", "r", "", "", "", "", ""], "src": false, "dest": false, "width": 0}
    ]
  },
  {"name": "movaps", "category": "SSE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "xtype": "f32", "values": ["xmm0", "xmm1", "xmm2", "xmm3", "xmm4", "xmm5", "xmm6", "xmm7", "xmm8", "xmm9", "xmm10", "xmm11", "xmm12", "xmm13", "xmm14", "xmm15"], "src": false, "dest": true, "width": 128},
      {"type_": "MEM", "values": [], "src": true, "dest": false, "width": 128}
    ],
    "implicit_operands": []
  },
  {"name": "movaps", "category": "SSE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "xtype": "f32", "values": ["xmm0", "xmm1", "xmm2", "xmm3", "xmm4", "xmm5", "xmm6", "xmm7", "xmm8", "xmm9", "xmm10", "xmm11", "xmm12", "xmm13", "xmm14", "xmm15"], "src": false, "dest": true, "width": 128},
      {"type_": "REG", "xtype": "f32", "values": ["xmm0", "xmm1", "xmm2", "xmm3", "xmm4", "xmm5", "xmm6", "xmm7", "xmm8", "xmm9", "xmm10", "xmm11", "xmm12", "xmm13", "xmm14", "xmm15"], "src": true, "dest": false, "width": 128}
    ],
    "implicit_operands": []
  },
  {"name": "movaps", "category": "SSE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "MEM", "values": [], "src": false, "dest": true, "width": 128},
      {"type_": "REG", "xtype": "f32", "values": ["xmm0", "xmm1", "xmm2", "xmm3", "xmm4", "xmm5", "xmm6", "xmm7", "xmm8", "xmm9", "xmm10", "xmm11", "xmm12", "xmm13", "xmm14", "xmm15"], "src": true, "dest": false, "width": 128}
    ],
    "implicit_operands": []
  },
  {"name": "movaps", "category": "SSE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "xtype": "f32", "values": ["xmm0", "xmm1", "xmm2", "xmm3", "xmm4", "xmm5", "xmm6", "xmm7", "xmm8", "xmm9", "xmm10", "xmm11", "xmm12", "xmm13", "xmm14", "xmm15"], "src": false, "dest": true, "width": 128},
      {"type_": "REG", "xtype": "f32", "values": ["xmm0", "xmm1", "xmm2", "xmm3", "xmm4", "xmm5", "xmm6", "xmm7", "xmm8", "xmm9", "xmm10", "xmm11", "xmm12", "xmm13", "xmm14", "xmm15"], "src": true, "dest": false, "width": 128}
    ],
    "implicit_operands": []
  },
  {"name": "movhps", "category": "SSE-DATAXFER", "is_control_flow": false,
    "operands": [
      {"type_": "REG", "xtype": "f32", "values": ["xmm0", "xmm1", "xmm2", "xmm3", "xmm4", "xmm5", "xmm6", "xmm7", "xmm8", "xmm9", "xmm10", "xmm11", "xmm12", "xmm13", "xmm14", "xmm15"], "src": false, "dest": true, "width": 128},
      {"type_": "REG", "values": ["rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi", "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"], "src": true, "dest": false, "width": 64}
    ],
    "implicit_operands": []
  }
]


================================================
FILE: tests/x86_tests/model_common.py
================================================
"""
File: Collection of helper classes for x86 model tests.

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
from __future__ import annotations
from typing import List, Generator, Literal
from dataclasses import dataclass

import os
import tempfile
from pathlib import Path

from rvzr.tc_components.test_case_code import TestCaseProgram
from rvzr.tc_components.test_case_data import InputData
from rvzr.isa_spec import InstructionSet
from rvzr.elf_parser import ELFParser
from rvzr.arch.x86.target_desc import X86TargetDesc
from rvzr.arch.x86.asm_parser import X86AsmParser
from rvzr.arch.x86.generator import X86Generator
from rvzr.config import CONF

# Location of this module; test_dir is where InstList.to_test_case looks up min_x86.json
test_path = Path(__file__).resolve()
test_dir = test_path.parent

# Assembly preamble that InstList.to_test_case prepends to the instruction text
ASM_HEADER = """
.intel_syntax noprefix
.section .data.main
"""

# Base addresses for calculating expected contract traces
PC0 = 0x8  # Initial program counter offset for Unicorn backend
DATA_BASE = 0x1000000  # Base address for data section in test environment
CODE_BASE = 0x8000  # Base address for code section in test environment
MAIN_OFFSET = 0x1000  # Offset for main actor code section
FAULTY_OFFSET = 0x2000  # Offset for faulty actor code section

# Default values for memory and registers in test inputs
MEM_DEFAULT_VALUE = 1
REG_DEFAULT_VALUE = 2
MEM_FAULTY_DEFAULT_VALUE = 3
# NOTE(review): presumably the last 8-byte slot below FAULTY_OFFSET - confirm against the users
RSP_DEFAULT_VALUE = FAULTY_OFFSET - 8

# Register indices for x86-64 (used in test input array indexing)
RAX, RBX, RCX, RDX, RSI, RDI, FLAGS, RSP = 0, 1, 2, 3, 4, 5, 6, 7
# Number of 'gpr' slots initialized in default test inputs; covers indices RAX..FLAGS (0-6),
# so the RSP slot (index 7) is not written by InputBuilder.get_default_input
NUM_TEST_GPRS = 7

# SIMD register indices
XMM0, XMM1 = 0, 1

# Names of the model backends supported by the helpers in this module
Backend = Literal["dr", "uc"]


@dataclass
class Inst:
    """Instruction with its size and memory address.

    Describes one line of a test program together with the values that the
    test expects to see in a contract trace for it.
    """
    # Assembly text of the instruction; InstList.to_test_case joins these lines into a program
    text: str
    # Number of bytes added to the program counter by InstList.set_offsets;
    # entries with size 0 are skipped when expected observations are collected
    size: int
    # Expected memory address observation; 0 means "no address observation"
    mem_address: int
    # Expected memory value observation; 0 means "no value observation"
    mem_value: int
    # Offset of the instruction within the program; overwritten by InstList.set_offsets
    pc_offset: int = 0


class InstList:
    """List of instructions with their memory addresses.

    The list passed to the constructor is wrapped with the backend-specific
    macro lines, and every entry gets its ``pc_offset`` assigned. The class can
    then produce a parsed test case and the observations expected for a given
    execution order.
    """
    instructions: List[Inst]

    def __init__(self, instructions: List[Inst], backend: Backend):
        """Wrap `instructions` for `backend` and assign their program counter offsets.

        :param instructions: Instructions of the test program, in program order;
                             their `pc_offset` fields are overwritten
        :param backend: Backend the test targets ("dr" or "uc")
        """
        self.backend = backend
        # Offsets start at PC0 for the Unicorn backend and at 0 otherwise
        self.start_offset = PC0 if backend == "uc" else 0

        # Wrap instructions with backend-specific macros
        wrapped = self._wrap_instructions_for_backend(instructions)
        self.set_offsets(wrapped)
        self.instructions = wrapped

    def _wrap_instructions_for_backend(self, instructions: List[Inst]) -> List[Inst]:
        """Return `instructions` surrounded by the macro lines of the selected backend."""
        if self.backend == "dr":
            return self._wrap_instructions_for_dr(instructions)
        # uc
        return self._wrap_instructions_for_uc(instructions)

    def _wrap_instructions_for_dr(self, instructions: List[Inst]) -> List[Inst]:
        """
        DynamoRIO test cases are wrapped in measurement macros plus a NOP at test_case_exit.
        """
        wrapped = []
        wrapped.append(Inst(".macro.measurement_start:", 8, 0, 0))
        wrapped.extend(instructions)
        wrapped.append(Inst(".macro.measurement_end:", 8, 0, 0))
        wrapped.append(Inst(".test_case_exit:nop", 1, 0, 0))
        return wrapped

    def _wrap_instructions_for_uc(self, instructions: List[Inst]) -> List[Inst]:
        """
        Unicorn test cases have measurement_end macro inserted automatically.
        """
        wrapped = []
        wrapped.extend(instructions)
        wrapped.append(Inst(".macro.measurement_end:", 8, 0, 0))
        wrapped.append(Inst(".test_case_exit:nop", 1, 0, 0))
        return wrapped

    def __iter__(self) -> Generator[Inst, None, None]:
        yield from self.instructions

    def __getitem__(self, index: int) -> Inst:
        return self.instructions[index]

    def set_offsets(self, instructions: List[Inst]) -> None:
        """ Set the pc_offset for each instruction in a list """
        pc = self.start_offset
        for inst in instructions:
            inst.pc_offset = pc
            pc += inst.size

    def to_test_case(self) -> TestCaseProgram:
        """Load a test case from the assembly string.

        The wrapped instructions are written to a temporary assembly file, which
        is parsed and then removed again.

        :return: Parsed TestCaseProgram object
        """
        min_x86_path = test_dir / "min_x86.json"

        asm_str = ASM_HEADER
        asm_str += "\n".join([x.text for x in self.instructions])

        instruction_set = InstructionSet(min_x86_path.absolute().as_posix())
        target_desc = X86TargetDesc()
        elf_parser = ELFParser(target_desc)
        asm_parser = X86AsmParser(instruction_set, target_desc)
        generator = X86Generator(CONF.program_generator_seed, instruction_set, target_desc,
                                 asm_parser, elf_parser)

        # Reserve a uniquely named temp file; it is filled inside the try block below
        # so that it gets removed even if writing the assembly fails
        with tempfile.NamedTemporaryFile(
                mode='w', delete=False, suffix='.asm', encoding='utf-8') as f:
            temp_path = f.name

        try:
            Path(temp_path).write_text(asm_str, encoding='utf-8')
            tc: TestCaseProgram = asm_parser.parse_file(temp_path, generator, elf_parser)
        finally:
            os.unlink(temp_path)

        return tc

    def get_expected_observations(self, execution_order: List[int], observe_pc: bool,
                                  observe_mem: bool, observe_val: bool) -> List[int]:
        """Get expected observations for executed instructions.

        :param execution_order: List of instruction indices in execution order
        :param observe_pc: Whether to observe program counter values
        :param observe_mem: Whether to observe memory addresses
        :param observe_val: Whether to observe memory values
        :return: List of expected observation values
        """
        adjusted_order = self._adjust_execution_order_for_backend(execution_order)
        return self._collect_observations(adjusted_order, observe_pc, observe_mem, observe_val)

    def _adjust_execution_order_for_backend(self, execution_order: List[int]) -> List[int]:
        """Translate caller-provided indices into indices of the wrapped instruction list.

        :param execution_order: Indices into the list originally passed to the constructor
        :return: Indices into `self.instructions`, including the wrapper entries
        """
        # Reference index used by the helpers to recognise the last caller-provided
        # instruction: DR compares the shifted index (idx + 1), UC the unshifted one
        last_org_id = len(self.instructions) - 3
        # Index of the trailing NOP; measurement_end sits right before it
        last_actual_id = len(self.instructions) - 1

        if self.backend == "dr":
            return self._adjust_order_for_dr(execution_order, last_org_id, last_actual_id)
        # uc
        return self._adjust_order_for_uc(execution_order, last_org_id, last_actual_id)

    def _adjust_order_for_dr(self, execution_order: List[int], last_org_id: int,
                             last_actual_id: int) -> List[int]:
        """Adjust execution order for DynamoRIO backend.
        DynamoRIO includes measurement_start at the beginning, and appends
        measurement_end + NOP at the end.
        """
        updated_order = [0]  # measurement_start
        for idx in execution_order:
            # Indices shift by one because measurement_start occupies slot 0
            updated_order.append(idx + 1)
            if idx + 1 == last_org_id:
                updated_order.append(last_actual_id - 1)  # measurement_end
                updated_order.append(last_actual_id)  # NOP at test_case_exit
        return updated_order

    def _adjust_order_for_uc(self, execution_order: List[int], last_org_id: int,
                             last_actual_id: int) -> List[int]:
        """Adjust execution order for Unicorn backend.
        Unicorn appends measurement_end at the end. The NOP is not observed.
        """
        updated_order = []
        for idx in execution_order:
            updated_order.append(idx)
            if idx == last_org_id:
                updated_order.append(last_actual_id - 1)  # measurement_end
                # NOP is not observed on UC
        return updated_order

    def _collect_observations(self, execution_order: List[int], observe_pc: bool, observe_mem: bool,
                              observe_val: bool) -> List[int]:
        """Collect observations based on execution order and observation flags.

        :param execution_order: Indices into `self.instructions`, in execution order
        :param observe_pc: Whether to emit the pc_offset of each instruction
        :param observe_mem: Whether to emit non-zero memory addresses
        :param observe_val: Whether to emit non-zero memory values
        :return: Flat list of observations; per instruction the order is pc, address, value
        """
        observations = []
        for exec_id in execution_order:
            inst = self.instructions[exec_id]
            if inst.size == 0:  # not an actual instruction
                continue
            if observe_pc:
                observations.append(inst.pc_offset)
            # A zero address/value marks "nothing to observe" for this instruction
            if observe_mem and inst.mem_address != 0:
                observations.append(inst.mem_address)
            if observe_val and inst.mem_value != 0:
                observations.append(inst.mem_value)
        return observations


class InputBuilder:
    """Factory for the InputData objects used by the x86 tests."""

    def get_default_input(self) -> InputData:
        """Build an InputData whose first entry carries the default test values.

        The first two slots of the 'main' and 'faulty' regions and the first
        NUM_TEST_GPRS slots of 'gpr' are filled in.

        :return: InputData with default values for memory and registers
        """
        input_ = InputData()
        region_defaults = (
            ('main', MEM_DEFAULT_VALUE),
            ('faulty', MEM_FAULTY_DEFAULT_VALUE),
        )
        for region, value in region_defaults:
            for slot in (0, 1):
                input_[0][region][slot] = value
        for reg_id in range(NUM_TEST_GPRS):
            input_[0]['gpr'][reg_id] = REG_DEFAULT_VALUE
        return input_

    def get_input_with_zeroed_gprs(self, *gpr_indices: int) -> InputData:
        """Build an InputData in which the selected GPRs are set to 0 for taint tracking.

        :param gpr_indices: Register indices to initialize to 0
        :return: InputData with the given 'gpr' slots of the first entry set to 0
        """
        input_ = InputData()
        for reg_id in gpr_indices:
            input_[0]['gpr'][reg_id] = 0
        return input_

    def get_input_with_zeroed_memory(self, **memory_regions: int) -> InputData:
        """Build an InputData in which the selected memory slots are set to 0 for taint tracking.

        :param memory_regions: Keyword arguments mapping a region name (e.g., 'main', 'faulty')
                              to the index within that region
        :return: InputData with the given slot of each named region set to 0
        """
        input_ = InputData()
        for region_name in memory_regions:
            slot = memory_regions[region_name]
            input_[0][region_name][slot] = 0
        return input_


================================================
FILE: tests/x86_tests/unit_dr_decoder.py
================================================
"""
File: Collection of unit tests for DynamoRIO backend adaptor.

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
# pylint: disable=too-many-arguments
# pylint: disable=too-few-public-methods
# pylint: disable=too-many-public-methods
# pylint: disable=protected-access
# pylint: disable=missing-function-docstring

import unittest
import struct
import os
# from unittest.mock import MagicMock
from tempfile import NamedTemporaryFile
from typing import Any, List, Dict

from rvzr.model_dynamorio.trace_decoder import TraceDecoder, TraceEntryType
from rvzr.model_dynamorio.trace_decoder import DebugTraceEntryType

# ------------------------------------------------------------------------------
# Leakage trace representation
# ------------------------------------------------------------------------------
# Content of the test trace: one PC, read, write and exception entry,
# followed by an end-of-trace (EOT) entry
TEST_TRACE: List[Dict[str, Any]] = [
    {
        "addr": 0x0,
        "size": 8,
        "type": TraceEntryType.ENTRY_PC.value
    },
    {
        "addr": 0xdeadbeef,
        "size": 4,
        "type": TraceEntryType.ENTRY_READ.value
    },
    {
        "addr": 0xcafecafe,
        "size": 8,
        "type": TraceEntryType.ENTRY_WRITE.value
    },
    {
        "addr": 11,
        "size": 0,
        "type": TraceEntryType.ENTRY_EXCEPTION.value
    },
    {
        "addr": 0x0,
        "size": 0x0,
        "type": TraceEntryType.ENTRY_EOT.value
    },
]
# struct format of one encoded trace entry, packed in the order (addr, size, type):
# little-endian, 8-byte unsigned addr, 4-byte unsigned size, 1-byte unsigned type,
# then 3 padding bytes (16 bytes in total)
TRACE_FMT = "<QIBxxx"

# ------------------------------------------------------------------------------
# Debug trace representation
# ------------------------------------------------------------------------------
# Contents of the debug test trace: one entry per debug entry type, ending with EOT.
# Every entry carries a "type" and a "spec" field; the remaining keys depend on the type.
# NOTE(review): "spec" presumably flags entries recorded during speculation - confirm
TEST_DBG_TRACE: List[Dict[str, Any]] = [
    {
        "type": DebugTraceEntryType.ENTRY_REG_DUMP.value,
        "spec": 0,
        "xax": 0xaaaaaaaa,
        "xbx": 0xbbbbbbbb,
        "xcx": 0xcccccccc,
        "xdx": 0xdddddddd,
        "xsi": 0xeeeeeeee,
        "xdi": 0xffffffff,
        "pc": 0xdeadbeef,
    },
    {
        "type": DebugTraceEntryType.ENTRY_LOC.value,
        "spec": 0,
        "offset": 0xABCD,
        # 16-character path padded with 32 NUL characters (48 characters in total)
        "module_name": "/usr/lib/test.so" + ("\x00" * 32),
    },
    {
        "type": DebugTraceEntryType.ENTRY_READ.value,
        "spec": 0,
        "address": 0xcafecafe,
        "value": 0xabababab,
        "size": 0xf,
    },
    {
        "type": DebugTraceEntryType.ENTRY_WRITE.value,
        "spec": 0,
        "address": 0xcdcdcdcd,
        "value": 0xcafecafe,
        "size": 8,
    },
    {
        "type": DebugTraceEntryType.ENTRY_CHECKPOINT.value,
        "spec": 1,
        "rollback_pc": 0xdeadbeef,
        "cur_window_size": 1,
        "cur_store_log_size": 1,
    },
    {
        "type": DebugTraceEntryType.ENTRY_ROLLBACK_STORE.value,
        "spec": 1,
        "addr": 0xcdcdcdcd,
        "val": 0xcafecafe,
        "size": 0xf,
        "nesting_level": 1,
    },
    {
        "type": DebugTraceEntryType.ENTRY_ROLLBACK.value,
        "spec": 1,
        "nesting": 1,
        "rollback_pc": 0xdeadbeef,
    },
    {
        "type": DebugTraceEntryType.ENTRY_EXCEPTION.value,
        "spec": 0,
        "signal": 11,
        "address": 0xcdcdcdcd,
    },
    {
        "type": DebugTraceEntryType.ENTRY_EOT.value,
        "spec": 0,
    },
]
# Shared fields for debug entries: little-endian, two unsigned bytes followed by
# six padding bytes (8 bytes in total)
# NOTE(review): the two bytes presumably hold the "type" and "spec" fields - confirm
DBG_TRACE_PREFIX = '<BB' + ('x' * 6)
# Fields specific to each entry type, as struct format strings appended to the prefix
# (Q: 8-byte unsigned, I: 4-byte unsigned, i: 4-byte signed, c: single char, x: padding byte)
# NOTE(review): the field order presumably follows the key order of the matching
# TEST_DBG_TRACE entries - confirm against the encoding helper
DBG_TRACE_FMT = {
    DebugTraceEntryType.ENTRY_EOT: DBG_TRACE_PREFIX,
    DebugTraceEntryType.ENTRY_REG_DUMP: DBG_TRACE_PREFIX + ('Q' * 7),
    DebugTraceEntryType.ENTRY_READ: DBG_TRACE_PREFIX + 'QQQ',
    DebugTraceEntryType.ENTRY_WRITE: DBG_TRACE_PREFIX + 'QQQ',
    DebugTraceEntryType.ENTRY_LOC: DBG_TRACE_PREFIX + 'Q' + ('c' * 48),
    DebugTraceEntryType.ENTRY_EXCEPTION: DBG_TRACE_PREFIX + 'ixxxxQ',
    DebugTraceEntryType.ENTRY_CHECKPOINT: DBG_TRACE_PREFIX + 'QQI',
    DebugTraceEntryType.ENTRY_ROLLBACK: DBG_TRACE_PREFIX + 'IxxxxQ',
    DebugTraceEntryType.ENTRY_ROLLBACK_STORE: DBG_TRACE_PREFIX + 'QQIxxxxQ',
}

# ------------------------------------------------------------------------------
# Testsuite
# ------------------------------------------------------------------------------


class DRTraceDecodeTest(unittest.TestCase):
    """
    Suite of tests for the DR trace decoder
    """

    # --------------------------------------------------------------------------
    # Helpers
    # --------------------------------------------------------------------------
    def _find_entry_of_type(self, t: TraceEntryType) -> dict[str, Any]:
        """Return the first entry of TEST_TRACE whose type is `t`.

        :param t: entry type to look for
        :return: the matching test entry
        :raises ValueError: if TEST_TRACE has no entry of that type
        """
        for e in TEST_TRACE:
            if e["type"] == t.value:
                return e

        raise ValueError(f"No entry for type {t}")

    def _encode_from_dict(self, entry: dict[str, Any]) -> bytes:
        """Pack a test entry (addr, size, type) into bytes according to TRACE_FMT."""
        return struct.pack(TRACE_FMT, entry["addr"], entry["size"], entry["type"])

    def _check_trace_equivalence(self, expected: dict[str, Any], decoded: Any) -> None:
        """Assert that a decoded entry carries the same fields as the test entry it came from."""
        self.assertEqual(expected["addr"], decoded.addr)
        self.assertEqual(expected["size"], decoded.size)
        self.assertEqual(expected["type"], TraceEntryType(decoded.type).value)

    def _write_trace_file(self, payload: bytes) -> str:
        """Write the trace marker followed by `payload` to a temporary file.

        The file is registered for removal at the end of the test, so it does
        not outlive the test even when an assertion fails.

        :param payload: already-encoded trace entries
        :return: path of the written file
        """
        # The special marker is the character 'T', zero-padded to 8 bytes
        marker = struct.pack("c", "T".encode('utf-8')) + b'\x00' * 7

        with NamedTemporaryFile("wb", delete=False) as f:
            self.addCleanup(os.remove, f.name)
            f.write(marker + payload)
        return f.name

    # --------------------------------------------------------------------------
    # Test cases
    # --------------------------------------------------------------------------
    def test_trace_decoding(self) -> None:
        decoder = TraceDecoder()

        # Encode all entries and write them to a file
        packed_trace = b''.join(self._encode_from_dict(e) for e in TEST_TRACE)
        trace_file = self._write_trace_file(packed_trace)

        # Decode the file
        parsed_traces = decoder.decode_trace_file(trace_file)
        self.assertEqual(len(parsed_traces), 1)
        # Check decoded entries
        for idx, decoded in enumerate(parsed_traces[0]):
            self._check_trace_equivalence(TEST_TRACE[idx], decoded)

    def test_is_corrupted(self) -> None:
        decoder = TraceDecoder()

        pc = self._encode_from_dict(self._find_entry_of_type(TraceEntryType.ENTRY_PC))
        xcpt = self._encode_from_dict(self._find_entry_of_type(TraceEntryType.ENTRY_EXCEPTION))
        eot = self._encode_from_dict(self._find_entry_of_type(TraceEntryType.ENTRY_EOT))

        # Only EOT is valid at the end of the trace
        traces = [(pc, True), (pc + xcpt, True), (pc + eot, False), (pc + xcpt + eot, False)]

        for payload, is_corrupted in traces:
            trace_file = self._write_trace_file(payload)

            # Decode the file
            if is_corrupted:
                with self.assertRaises(ValueError):
                    decoder.decode_trace_file(trace_file)
            else:
                parsed_traces = decoder.decode_trace_file(trace_file)
                self.assertEqual(len(parsed_traces), 1)


class DRDebugTraceDecodeTest(unittest.TestCase):
    """
    Suite of tests for the DR trace decoder for debug traces
    """

    # For each entry type: the attribute of the decoded entry that holds the
    # type-specific payload, and the payload fields that are compared one-to-one
    # with the identically named keys of the expected test entry.
    # ENTRY_EOT has no payload; ENTRY_LOC additionally has a char-array field
    # (module_name) that is compared separately.
    _PAYLOAD_FIELDS: dict[DebugTraceEntryType, tuple[str, tuple[str, ...]]] = {
        DebugTraceEntryType.ENTRY_REG_DUMP:
            ("regs", ("xax", "xbx", "xcx", "xdx", "xsi", "xdi", "pc")),
        DebugTraceEntryType.ENTRY_LOC: ("loc", ("offset",)),
        DebugTraceEntryType.ENTRY_READ: ("mem", ("address", "value", "size")),
        DebugTraceEntryType.ENTRY_WRITE: ("mem", ("address", "value", "size")),
        DebugTraceEntryType.ENTRY_CHECKPOINT:
            ("checkpoint", ("rollback_pc", "cur_window_size", "cur_store_log_size")),
        DebugTraceEntryType.ENTRY_ROLLBACK_STORE:
            ("rollback_store", ("addr", "val", "size", "nesting_level")),
        DebugTraceEntryType.ENTRY_ROLLBACK: ("rollback", ("nesting", "rollback_pc")),
        DebugTraceEntryType.ENTRY_EXCEPTION: ("xcpt", ("signal", "address")),
        DebugTraceEntryType.ENTRY_EOT: ("", ()),
    }

    # --------------------------------------------------------------------------
    # Helpers
    # --------------------------------------------------------------------------
    def _find_entry_of_type(self, t: DebugTraceEntryType) -> dict[str, Any]:
        """Return the first entry of TEST_DBG_TRACE whose type is `t`.

        :param t: debug entry type to look for
        :return: the matching test entry
        :raises ValueError: if TEST_DBG_TRACE has no entry of that type
        """
        for e in TEST_DBG_TRACE:
            if e["type"] == t.value:
                return e

        raise ValueError(f"No debug entry for type {t}")

    def _encode_from_dict(self, entry: dict[str, Any]) -> bytes:
        """Pack a test entry into bytes, padding the result to 64 bytes.

        The values of `entry` are packed in dict order, so the order of the keys
        must match the field order of the format in DBG_TRACE_FMT.
        """
        # Get format string depending on the entry type
        fmt = DBG_TRACE_FMT[DebugTraceEntryType(entry["type"])]
        # Add padding if needed
        size = struct.calcsize(fmt)
        if size < 64:
            fmt += 'x' * (64 - size)

        # Get the values to encode
        to_pack = []
        for v in entry.values():
            if isinstance(v, str):
                # Encode strings as char arrays (one 'c' field per character)
                to_pack.extend(x.encode('utf-8') for x in v)
            else:
                # Otherwise just use the value in the map
                to_pack.append(v)

        return struct.pack(fmt, *to_pack)

    def _check_dbg_trace_equivalence(self, expected: dict[str, Any], decoded: Any) -> None:
        """Assert that a decoded debug entry carries the same fields as its test entry.

        :param expected: test entry the decoded object was produced from
        :param decoded: object returned by the decoder
        :raises ValueError: if the decoded type is not covered by this check
        """
        type_ = DebugTraceEntryType(decoded.type)
        if type_ not in self._PAYLOAD_FIELDS:
            raise ValueError("Unknown debug trace type")
        payload_attr, fields = self._PAYLOAD_FIELDS[type_]

        # Header fields shared by every entry type
        self.assertEqual(expected["type"], type_.value)
        self.assertEqual(expected["spec"], decoded.nesting_level)

        # Type-specific payload fields
        for field in fields:
            self.assertEqual(expected[field], getattr(getattr(decoded, payload_attr), field))

        # The module name is decoded as a sequence of single chars; join it back
        if type_ == DebugTraceEntryType.ENTRY_LOC:
            self.assertEqual(expected["module_name"],
                             (b''.join(decoded.loc.module_name)).decode('utf-8'))

    def _write_trace_file(self, payload: bytes) -> str:
        """Write the debug-trace marker followed by `payload` to a temporary file.

        The file is registered for removal at the end of the test, so it does
        not outlive the test even when an assertion fails.

        :param payload: already-encoded debug trace entries
        :return: path of the written file
        """
        # The special marker is the character 'D', zero-padded to 8 bytes
        marker = struct.pack("c", "D".encode('utf-8')) + b'\x00' * 7

        with NamedTemporaryFile("wb", delete=False) as f:
            self.addCleanup(os.remove, f.name)
            f.write(marker + payload)
        return f.name

    # --------------------------------------------------------------------------
    # Test cases
    # --------------------------------------------------------------------------
    def test_debug_entry_decoding(self) -> None:
        decoder = TraceDecoder()

        for original in TEST_DBG_TRACE:
            # Encode entry to a bytes array
            encoded = self._encode_from_dict(original)
            # Decode it as an object
            decoded = decoder._decode_debug_trace_entry(encoded)
            # Test the decoded output
            self._check_dbg_trace_equivalence(original, decoded)

    def test_debug_trace_decoding(self) -> None:
        decoder = TraceDecoder()

        # Encode all entries and write them to a file
        packed_trace = b''.join(self._encode_from_dict(e) for e in TEST_DBG_TRACE)
        trace_file = self._write_trace_file(packed_trace)

        # Decode the file
        parsed_dbg_traces = decoder.decode_debug_trace_file(trace_file)
        self.assertEqual(len(parsed_dbg_traces), 1)
        # Check decoded entries
        for idx, decoded in enumerate(parsed_dbg_traces[0]):
            self._check_dbg_trace_equivalence(TEST_DBG_TRACE[idx], decoded)

    def test_is_corrupted(self) -> None:
        decoder = TraceDecoder()

        pc = self._encode_from_dict(self._find_entry_of_type(DebugTraceEntryType.ENTRY_REG_DUMP))
        xcpt = self._encode_from_dict(self._find_entry_of_type(DebugTraceEntryType.ENTRY_EXCEPTION))
        eot = self._encode_from_dict(self._find_entry_of_type(DebugTraceEntryType.ENTRY_EOT))

        # Only EOT is valid at the end of the trace
        traces = [(pc, True), (pc + xcpt, True), (pc + eot, False), (pc + xcpt + eot, False)]

        for payload, is_corrupted in traces:
            trace_file = self._write_trace_file(payload)

            # Decode the file
            if is_corrupted:
                with self.assertRaises(ValueError):
                    decoder.decode_debug_trace_file(trace_file)
            else:
                parsed_traces = decoder.decode_debug_trace_file(trace_file)
                self.assertEqual(len(parsed_traces), 1)


================================================
FILE: tests/x86_tests/unit_fuzzer.py
================================================
"""
Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
# pylint: disable=missing-function-docstring
# pylint: disable=missing-class-docstring
# pylint: disable=protected-access

import os
import unittest
import tempfile
from pathlib import Path

from rvzr.factory import get_asm_parser, get_program_generator
from rvzr.elf_parser import ELFParser
from rvzr.isa_spec import InstructionSet
from rvzr.config import CONF
from rvzr.logs import update_logging_after_config_change
from rvzr.arch.x86.target_desc import X86TargetDesc
from rvzr.arch.x86.fuzzer import _create_fenced_test_case

# Select the x86-64 instruction set in the global configuration for this module
CONF.instruction_set = "x86-64"
# Resolved path of this file and of its directory; test inputs such as
# min_x86.json are looked up relative to test_dir
test_path = Path(__file__).resolve()
test_dir = test_path.parent


# ==================================================================================================
# Tests
# ==================================================================================================
class X86FuzzerTest(unittest.TestCase):

    @classmethod
    def setUpClass(cls) -> None:
        # Disable all logging modes for the duration of the tests
        CONF.logging_modes = []
        update_logging_after_config_change()

    def test__create_fenced_test_case(self) -> None:
        # Test that the function _create_fenced_test_case adds fences to
        # the assembly file in a correct way

        instruction_set = InstructionSet((test_dir / "min_x86.json").absolute().as_posix())
        generator = get_program_generator(CONF.program_generator_seed, instruction_set)
        asm_parser = get_asm_parser(instruction_set)
        elf_parser = ELFParser(X86TargetDesc())

        # Reserve two temporary files. Their removal is registered immediately so
        # that they are cleaned up even if the code under test or an assertion fails
        with tempfile.NamedTemporaryFile(delete=False) as original:
            original_asm = original.name
        self.addCleanup(os.unlink, original_asm)
        with tempfile.NamedTemporaryFile(delete=False) as fenced:
            fenced_asm = fenced.name
        self.addCleanup(os.unlink, fenced_asm)

        with open(original_asm, 'w') as f:
            f.write("""
            .intel_syntax noprefix
            .section .data.main
            .function_1:
            .macro.measurement_start:

            # This is a comment
            .byte 0x90

            jne .l1
            loopne .l1
            .l1:
            adc rax, rbx
            cmp rbx, rcx

            .test_case_exit:
            """)

        _ = _create_fenced_test_case(original_asm, fenced_asm, asm_parser, generator, elf_parser)
        with open(fenced_asm, 'r') as f:
            fenced_lines = [line.strip() for line in f]

        # Check that the fences are placed in expected places
        self.assertIn("lfence", fenced_lines[8])
        self.assertIn("lfence", fenced_lines[13])
        self.assertIn("lfence", fenced_lines[15])
        self.assertIn("lfence", fenced_lines[17])


# Allow running this test module directly as a script
if __name__ == '__main__':
    unittest.main()


================================================
FILE: tests/x86_tests/unit_generators.py
================================================
"""
Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
# pylint: disable=missing-function-docstring
# pylint: disable=missing-class-docstring

import unittest
import tempfile
import subprocess
import os
from pathlib import Path
from copy import deepcopy

from rvzr.arch.x86.generator import X86Generator, _X86Printer, _X86PatchUndefinedFlagsPass
from rvzr.arch.x86.target_desc import X86TargetDesc
from rvzr.elf_parser import ELFParser
from rvzr.factory import get_program_generator, get_asm_parser
from rvzr.isa_spec import InstructionSet
from rvzr.tc_components.actor import ActorMode
from rvzr.tc_components.test_case_code import TestCaseProgram, Function, BasicBlock
from rvzr.tc_components.test_case_binary import SymbolTableEntry
from rvzr.code_generator import assemble
from rvzr.config import CONF
from rvzr.logs import update_logging_after_config_change

# Select the x86-64 instruction set in the global configuration for this module
CONF.instruction_set = "x86-64"
# Resolved path of this file and of its directory; test inputs such as
# min_x86.json and the asm/ samples are looked up relative to test_dir
test_path = Path(__file__).resolve()
test_dir = test_path.parent

# Assembly program whose only content is a raw `.byte` directive; used by
# test_x86_asm_parsing_opcode, which expects it to be parsed as an "opcode"
# instruction
ASM_OPCODE = """
.intel_syntax noprefix
.section .data.main
.byte 0x90
.test_case_exit:
"""

_ALL_CATEGORIES = [
    "3DNOW_PREFETCH-PREFETCH", "ADOX_ADCX-ADOX_ADCX", "BASE-BINARY", "BASE-BITBYTE", "BASE-CMOV",
    "BASE-COND_BR", "BASE-CONVERT", "BASE-DATAXFER", "BASE-FLAGOP", "BASE-LOGICAL", "BASE-MISC",
    "BASE-NOP", "BASE-POP", "BASE-PUSH", "BASE-ROTATE", "BASE-SEMAPHORE", "BASE-SETCC",
    "BASE-SHIFT", "BASE-WIDENOP", "LONGMODE-CONVERT", "LONGMODE-DATAXFER", "LONGMODE-POP",
    "LONGMODE-PUSH", "LONGMODE-SEMAPHORE", "MMX-MMX", "MMX-LOGICAL", "MMX-DATAXFER", "SSE2-MMX",
    "SSE3-MMX", "SSSE3-MMX", "SSE-CONVERT", "SSE-DATAXFER", "SSE-MISC", "SSE-PREFETCH", "SSE-SSE",
    "SSE2-CONVERT", "SSE2-DATAXFER", "SSE2-LOGICAL", "SSE2-MISC", "SSE2-SSE", "SSE3-DATAXFER",
    "SSE3-SSE", "SSSE3-SSE", "SSE4-LOGICAL", "SSE4-SSE", "AVX-AVX", "AVX-BROADCAST", "AVX-DATAXFER",
    "AVX-LOGICAL", "AVX-STTNI", "AVX2-AVX2", "AVX2-BROADCAST", "AVX2-DATAXFER", "AVX2-LOGICAL",
    "AES-AES", "AVXAES-AES", "BMI1-BMI1", "BMI2-BMI2", "MOVBE-DATAXFER", "LZCNT-LZCNT",
    "PCLMULQDQ-PCLMULQDQ", "VAES-VAES", "3DNOW-3DNOW", "VPCLMULQDQ-VPCLMULQDQ", "SHA-SHA",
    "SSE4a-BITBYTE", "FMA-VFMA", "MOVDIR-MOVDIR", "GFNI-GFNI", "FMA4-FMA4", "AVX_VNNI-VEX",
    "3DNOW-MMX", "LONGMODE-RET", "BASE-RET", "BASE-CALL", "BASE-UNCOND_BR", "SSE-LOGICAL_FP",
    "AVX-LOGICAL_FP", "SSE2-LOGICAL_FP", "AVX2GATHER-AVX2GATHER", "BASE-STRINGOP",
    "LONGMODE-STRINGOP", "CLDEMOTE-CLDEMOTE", "CLFLUSHOPT-CLFLUSHOPT", "CLFSH-MISC", "CLWB-CLWB",
    "CLZERO-CLZERO", "PREFETCHWT1-PREFETCHWT1", "SERIALIZE-SERIALIZE", "BASE-SYSCALL",
    "BASE-SYSRET", "BASE-SEGOP", "BASE-INTERRUPT", "LONGMODE-SYSRET", "PKU-PKU", "PCONFIG-PCONFIG",
    "BASE-IO", "BASE-IOSTRINGOP", "LONGMODE-SYSCALL", "RDPRU-RDPRU", "RDPID-RDPID", "SMAP-SMAP",
    "UINTR-UINTR, MCOMMIT-MISC", "PTWRITE-PTWRITE", "TBM-TBM", "AVX512EVEX-LOGICAL",
    "AVX512EVEX-GFNI", "AVX512EVEX-EXPAND", "AVX512EVEX-DATAXFER", "AVX512EVEX-VFMA",
    "AVX512EVEX-LOGICAL_FP", "AVX512EVEX-VBMI2", "AVX512EVEX-IFMA", "AVX512EVEX-FP16",
    "AVX512EVEX-BROADCAST", "AVX512EVEX-COMPRESS", "AVX512EVEX-AVX512_VBMI", "AVX512EVEX-CONFLICT",
    "AVX512EVEX-VAES", "AVX512EVEX-VPCLMULQDQ", "AVX512EVEX-AVX512", "AVX512EVEX-BLEND",
    "AVX512EVEX-CONVERT", "AVX512EVEX-AVX512_4FMAPS", "RDRAND-RDRAND", "RDSEED-RDSEED"
]


class X86GeneratorTest(unittest.TestCase):
    """Unit tests for the x86 program generator, its printer and the assembly parser."""

    @classmethod
    def setUpClass(cls) -> None:
        # Disable all logging modes for the duration of the tests
        CONF.logging_modes = []
        update_logging_after_config_change()

    # ----------------------------------------------------------------------------------------------
    # Helpers
    # ----------------------------------------------------------------------------------------------
    @staticmethod
    def _remove_if_exists(path: str) -> None:
        """Delete the file at `path`, tolerating the case where it is already gone."""
        try:
            os.unlink(path)
        except FileNotFoundError:
            # Nothing left to clean up
            pass

    @staticmethod
    def _parse_asm_file(asm_path: str) -> TestCaseProgram:
        """Parse the assembly file at `asm_path` using the instruction set in min_x86.json.

        The parser objects are created on every call, so they observe the state of CONF
        at the time of the call.

        :param asm_path: path of the assembly file to parse
        :return: the parsed test case program
        """
        instruction_set = InstructionSet((test_dir / "min_x86.json").absolute().as_posix())
        generator = get_program_generator(CONF.program_generator_seed, instruction_set)
        asm_parser = get_asm_parser(instruction_set)
        elf_parser = ELFParser(X86TargetDesc())
        tc: TestCaseProgram = asm_parser.parse_file(asm_path, generator, elf_parser)
        return tc

    def _add_guest_actor(self) -> None:
        """Add a kernel-privileged guest actor named `guest_1` to the actor configuration.

        The previous actor configuration is restored when the test finishes, also when
        the test fails, so that the change cannot leak into other tests.
        """
        # pylint: disable=protected-access
        prev_actors = deepcopy(CONF.get_actors_conf())
        self.addCleanup(setattr, CONF, "_actors", prev_actors)

        CONF.get_actors_conf()["guest_1"] = deepcopy(CONF._actor_default)
        CONF.get_actors_conf()["guest_1"]["name"] = "guest_1"
        CONF.get_actors_conf()["guest_1"]["mode"] = "guest"
        CONF.get_actors_conf()["guest_1"]["privilege_level"] = "kernel"

    @staticmethod
    def load_tc(asm_str: str) -> TestCaseProgram:
        """Parse the assembly source `asm_str` into a test case program.

        The source is written to a temporary file, which is removed again before returning,
        whether or not parsing succeeds.

        :param asm_str: assembly source code
        :return: the parsed test case program
        """
        # The file is closed (and thus fully written) before the parser opens it
        with tempfile.NamedTemporaryFile("w", delete=False) as asm_file:
            asm_file.write(asm_str)
        try:
            return X86GeneratorTest._parse_asm_file(asm_file.name)
        finally:
            os.unlink(asm_file.name)

    def _test_all_instructions(self, instruction_set: InstructionSet) -> None:
        """Generate every non-control-flow instruction of `instruction_set` and assemble them.

        The test fails if any instruction is printed as an empty string or if the
        assembler rejects the generated program.
        """
        # pylint: disable=protected-access
        # Note: This function tests internals of the generator, which is why we
        # have to disable the protected-access warning.

        # Reserve paths for the assembly and the object file; both are removed when the
        # test finishes, regardless of its outcome
        with tempfile.NamedTemporaryFile("w", delete=False) as asm_file:
            asm_path = asm_file.name
        self.addCleanup(self._remove_if_exists, asm_path)
        with tempfile.NamedTemporaryFile("w", delete=False) as obj_file:
            obj_path = obj_file.name
        self.addCleanup(self._remove_if_exists, obj_path)

        generator = get_program_generator(CONF.program_generator_seed, instruction_set)
        function_generator = generator._function_generator
        tc = TestCaseProgram(asm_path)
        tc.assign_obj(obj_path)

        func = function_generator.generate_empty(".function_0", tc.find_section(name="main"))
        printer = _X86Printer(X86TargetDesc())
        all_instructions = ['.intel_syntax noprefix\n']

        # try generating instruction strings
        for bb in func:
            for instruction_spec in instruction_set.non_control_flow_specs:
                # fill up with random operand, following the spec
                inst = generator.generate_instruction(instruction_spec)
                bb.insert_after(bb.get_last(), inst)

            for instr in bb:
                instr_str = printer._instruction_to_str(instr)
                self.assertTrue(instr_str, f'Instruction {instr} was not generated.')
                all_instructions.append(instr_str + "\n")

        # The file must be closed before assembling: otherwise the instructions may still
        # sit in the write buffer and the assembler would see an empty or truncated file
        with open(asm_path, "w") as f:
            f.writelines(all_instructions)

        # check if the generated instructions are valid
        try:
            assemble(tc)
        except subprocess.CalledProcessError:
            self.fail("Generated invalid instruction(s)")

    # ----------------------------------------------------------------------------------------------
    # Test cases
    # ----------------------------------------------------------------------------------------------
    def test_x86_configuration(self) -> None:
        CONF.generator = "random"
        instruction_set = InstructionSet((test_dir / "min_x86.json").absolute().as_posix(),
                                         CONF.instruction_categories)
        gen = get_program_generator(CONF.program_generator_seed, instruction_set)
        self.assertEqual(gen.__class__, X86Generator)

    def test_x86_all_instructions_reduced(self) -> None:
        instruction_set = InstructionSet((test_dir / "min_x86.json").absolute().as_posix(),
                                         _ALL_CATEGORIES)
        self._test_all_instructions(instruction_set)

    def test_x86_all_instructions_full(self) -> None:
        if not (test_dir / "../../base.json").exists():
            self.skipTest("base.json not available; skipping test.")

        instruction_set = InstructionSet((test_dir / "../../base.json").absolute().as_posix(),
                                         _ALL_CATEGORIES)
        self._test_all_instructions(instruction_set)

    def test_x86_asm_parsing_basic(self) -> None:
        tc = self._parse_asm_file((test_dir / "asm/asm_basic.asm").absolute().as_posix())
        section = tc[0]
        functions = list(section)

        self.assertEqual(len(functions), 2)

        main = functions[0]
        self.assertEqual(main.name, ".function_0")

        self.assertEqual(len(main), 3)

        bb0 = main[1]
        bb1 = main[2]
        exit_ = main.get_exit_bb()

        self.assertEqual(bb0.successors[0], bb1)
        self.assertEqual(bb1.successors[0], exit_)

        self.assertEqual(functions[1].name, ".function_end")

    def test_x86_asm_parsing_opcode(self) -> None:

        tc = self.load_tc(ASM_OPCODE)
        functions = list(tc[0])

        main_iter = iter(functions[0])
        bb0 = next(main_iter)
        insts = list(bb0)
        self.assertEqual(insts[0].name, "macro")
        self.assertEqual(insts[1].name, "opcode")

    def test_x86_asm_parsing_section(self) -> None:
        # The guest actor must be configured before the parser objects are created
        self._add_guest_actor()
        tc = self._parse_asm_file((test_dir / "asm/asm_multiactor.asm").absolute().as_posix())

        self.assertEqual(tc.n_actors(), 2)
        self.assertEqual(tc.find_actor(name="main").mode, ActorMode.HOST)
        self.assertEqual(tc.find_actor(name="main").get_id(), 0)
        self.assertEqual(tc.find_actor(name="guest_1").mode, ActorMode.GUEST)
        self.assertEqual(tc.find_actor(name="guest_1").get_id(), 1)

        self.assertEqual(len(tc), 2)

        sec1 = tc[0]
        self.assertEqual(len(sec1), 3)
        self.assertEqual(sec1.owner.get_id(), 0)
        self.assertTrue(sec1.owner.is_main)

        f1 = sec1[0]
        self.assertEqual(f1.name, ".function_0")
        self.assertEqual(len(f1[0]), 3)

        f2 = sec1[1]
        self.assertEqual(f2.name, ".function_2")
        self.assertEqual(len(f2[0]), 1)

        sec2 = tc[1]
        self.assertEqual(len(sec2), 1)
        self.assertEqual(sec2.owner.get_id(), 1)
        self.assertFalse(sec2.owner.is_main)

        f1 = sec2[0]
        self.assertEqual(f1.name, ".function_1")
        self.assertEqual(len(f1[0]), 1)

    def test_x86_asm_parsing_symbols(self) -> None:
        # The guest actor must be configured before the parser objects are created
        self._add_guest_actor()
        tc = self._parse_asm_file((test_dir / "asm/asm_symbol.asm").absolute().as_posix())
        obj = tc.get_obj()
        symbol_table = obj.symbol_table()

        self.assertEqual(symbol_table[0], SymbolTableEntry(0, 0, 0, 0))  # function_0
        self.assertEqual(symbol_table[1], SymbolTableEntry(0, 0, 1, 0))
        self.assertEqual(symbol_table[2], SymbolTableEntry(0, 9, 2, 0))
        self.assertEqual(symbol_table[3], SymbolTableEntry(0, 20, 0, 1))  # function_1
        self.assertEqual(symbol_table[4], SymbolTableEntry(1, 0, 0, 2))  # function_2

    def test_x86_undef_flag_patch(self) -> None:
        instruction_set = InstructionSet((test_dir / "min_x86.json").absolute().as_posix(),
                                         CONF.instruction_categories + ["BASE-FLAGOP"])
        undef_instr_spec = list(filter(lambda x: x.name == 'bsf', instruction_set.instructions))[0]
        read_instr_spec = list(filter(lambda x: x.name == 'lahf', instruction_set.instructions))[0]

        generator = get_program_generator(CONF.program_generator_seed, instruction_set)
        undef_instr = generator.generate_instruction(undef_instr_spec)
        read_instr = generator.generate_instruction(read_instr_spec)

        test_case = TestCaseProgram("")
        sec = test_case[0]
        func = Function(".function_0", sec)
        sec.append(func)
        bb = BasicBlock(".bb0", func)
        func.append(bb)
        bb.insert_after(bb.get_last(), undef_instr)
        bb.insert_after(bb.get_last(), read_instr)

        # The test expects the pass to have added exactly one instruction to the block
        _X86PatchUndefinedFlagsPass(instruction_set, generator).run_on_test_case(test_case)
        self.assertEqual(len(bb), 3)

================================================
FILE: tests/x86_tests/unit_isa_loader.py
================================================
"""
Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
import unittest
from pathlib import Path

from rvzr.isa_spec import InstructionSet
from rvzr.config import CONF

# Resolved path of this file and of its directory; min_x86.json is looked up
# relative to test_dir
test_path = Path(__file__).resolve()
test_dir = test_path.parent
# Select the x86-64 instruction set in the global configuration for this module
CONF.instruction_set = "x86-64"


class x86ISALoaderTest(unittest.TestCase):
    """Tests for loading the x86 instruction set specification."""

    def test_instruction_filtering(self) -> None:
        """Loading with a category filter must not yield instructions of other categories."""
        instruction_set = InstructionSet((test_dir / "min_x86.json").absolute().as_posix(),
                                         ["BASE-BINARY"])
        # Normalize the case before comparing: other tests of this suite match spec
        # names in lower case (e.g. 'bsf'), so looking for an upper-case "HLT" could
        # never fail
        inst_names = [i.name.lower() for i in instruction_set.instructions]

        # Guard against a vacuous pass when the filter removes every instruction
        self.assertTrue(inst_names, "No instruction left after filtering by BASE-BINARY")
        self.assertNotIn("hlt", inst_names)


================================================
FILE: tests/x86_tests/unit_model.py
================================================
"""
File: Collection of unit tests for x86 model backends.

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
# pylint: disable=too-many-arguments
# pylint: disable=too-few-public-methods
# pylint: disable=too-many-public-methods
# pylint: disable=protected-access
# pylint: disable=missing-function-docstring

import unittest
from typing import Callable, List, Optional, Tuple, Union, Any, Dict
from copy import deepcopy
from pathlib import Path
from functools import wraps

from rvzr.model_dynamorio.model import DynamoRIOModel
from rvzr.model_unicorn.model import X86UnicornModel

from rvzr.tc_components.test_case_data import InputData
from rvzr.traces import CTrace
from rvzr.factory import get_model
from rvzr.config import CONF, ConfigException, Conf
from rvzr.logs import update_logging_after_config_change

from .model_common import Inst, InstList, InputBuilder, \
    MAIN_OFFSET, FAULTY_OFFSET, MEM_DEFAULT_VALUE, \
    REG_DEFAULT_VALUE, MEM_FAULTY_DEFAULT_VALUE, RSP_DEFAULT_VALUE, CODE_BASE, DATA_BASE, Backend, \
    RAX, RBX, RCX, RDX, RSI, RDI

# Type alias covering both model backend classes imported above
ModelType = Union[DynamoRIOModel, X86UnicornModel]

# Resolved path of this file and of its directory
TEST_PATH = Path(__file__).resolve()
TEST_DIR = TEST_PATH.parent

# 64-bit mask with every bit set except bit 0
# NOTE(review): its use is outside this part of the file — confirm what bit 0 stands for
PF_MASK = 0xfffffffffffffffe

# Test values
TEST_MEM_VALUE_A = 42
TEST_MEM_VALUE_B = 0x42
POISON_VALUE = 0xDEADBEEF


def skip_for_backend(backend: Backend, reason: str = "not supported") -> Callable[[Any], Any]:
    """Create a decorator that skips a test method when it runs on `backend`.

    The decorated method compares the `_backend` attribute of its test case
    with `backend`; on a match the test is reported as skipped, otherwise the
    original method is executed and its result returned.

    :param backend: Backend to skip ('dr' or 'uc')
    :param reason: Reason reported for the skip (default: "not supported")
    :return: Decorator to apply to a test method that takes only `self`

    Usage:
        @skip_for_backend("dr")
        def test_something(self):
            ...
    """

    def _apply(test_func: Callable[[Any], Any]) -> Callable[[Any], Any]:

        @wraps(test_func)
        def _guarded(self: '_SharedX86Model') -> Any:
            # Run the test unless the active backend is the excluded one
            if self._backend != backend:
                return test_func(self)
            raise unittest.SkipTest(reason)

        return _guarded

    return _apply


class _SharedX86Model(unittest.TestCase):
    """Base class with common test infrastructure for x86 model backends."""

    _prev_obs_clause: Optional[str] = None
    _prev_exec_clause: Optional[List[str]] = None
    _prev_backend: Optional[str] = None
    _prev_conf: Optional[Conf] = None
    _backend: Backend
    _backend_long: str

    # Exclude this parent class from test discovery
    @classmethod
    def setUpClass(cls) -> None:
        """Skip the shared base class itself; subclasses pass through untouched."""
        if cls is not _SharedX86Model:
            return
        raise unittest.SkipTest("Skipping base class")

    @classmethod
    def _configure_class(cls,
                         backend_long: str,
                         additional_config: Optional[Dict[str, Any]] = None) -> None:
        """Snapshot CONF and switch it to the settings needed by a backend test class.

        The snapshot is stored in ``cls._prev_conf`` so that `_teardown_class` can undo
        the changes.

        :param backend_long: Full backend name ('dynamorio' or 'unicorn')
        :param additional_config: Optional dict of additional CONF attributes to set;
                                  applied after the common settings
        """
        cls._prev_conf = deepcopy(CONF)

        # Common settings first, backend-specific overrides afterwards (order is preserved)
        common_settings: List[Tuple[str, Any]] = [
            ("model_backend", backend_long),
            ("_no_generation", True),
            ("logging_modes", []),
        ]
        extra_settings = list(additional_config.items()) if additional_config else []
        for attr, value in common_settings + extra_settings:
            setattr(CONF, attr, value)

        update_logging_after_config_change()

    @classmethod
    def _teardown_class(cls) -> None:
        """Copy every attribute of the saved configuration snapshot back into CONF.

        Does nothing when no snapshot was taken.
        """
        snapshot = cls._prev_conf
        if snapshot is None:
            return
        for attr, value in vars(snapshot).items():
            setattr(CONF, attr, value)

    def __init__(self, methodName: str = "runTest") -> None:
        """Initialize the test case and create the builder used to produce test inputs.

        :param methodName: Name of the test method to run; forwarded to `unittest.TestCase`
        """
        super().__init__(methodName)
        self._input_builder = InputBuilder()

    def setUp(self) -> None:
        """Save configuration state before each test to prevent leakage between tests.

        The saved fields are the ones captured by `_save_conf`: the contract observation
        clause, the contract execution clause and the model backend.
        """
        self._save_conf()

    def tearDown(self) -> None:
        """Restore configuration state after each test.

        Writes back the values captured by `_save_conf`; `_restore_conf` asserts that
        they were actually saved.
        """
        self._restore_conf()

    @staticmethod
    def _get_default_ct_trace() -> List[int]:
        """Return the default CT trace, which is a new empty list in this base class."""
        return []

    def _save_conf(self) -> None:
        """Remember the CONF fields that `_get_model` implementations may overwrite."""
        (
            self._prev_obs_clause,
            self._prev_exec_clause,
            self._prev_backend,
        ) = (
            CONF.contract_observation_clause,
            CONF.contract_execution_clause,
            CONF.model_backend,
        )

    def _restore_conf(self) -> None:
        """Write the values captured by `_save_conf` back into CONF.

        Fails with an `AssertionError` if any of the three values was never saved.
        """
        obs_clause = self._prev_obs_clause
        exec_clause = self._prev_exec_clause
        backend = self._prev_backend
        assert obs_clause is not None
        assert exec_clause is not None
        assert backend is not None

        CONF.contract_observation_clause = obs_clause
        CONF.contract_execution_clause = exec_clause
        CONF.model_backend = backend

    def _get_model(self,
                   obs_clause: str,
                   exec_clause: List[str],
                   data_bases: Tuple[int, int],
                   enable_mismatch_check: bool = False) -> ModelType:
        """Create the model under test; backend-specific subclasses must override this.

        :param obs_clause: Name of the contract observation clause
        :param exec_clause: Names of the contract execution clauses
        :param data_bases: Pair of base addresses; `_get_trace` passes
                           (DATA_BASE, CODE_BASE) by default
        :param enable_mismatch_check: Whether to create the model in mismatch-check mode
        :raises NotImplementedError: Always, in this base class
        """
        raise NotImplementedError()

    def _get_trace(self,
                   test_case: InstList,
                   input_data: List[InputData],
                   obs_clause: str = "ct",
                   exec_clause: Optional[List[str]] = None,
                   data_bases: Tuple[int, int] = (DATA_BASE, CODE_BASE),
                   nesting: int = 1,
                   enable_mismatch_check: bool = False,
                   pte_mask: int = 0) -> List[CTrace]:
        """Build a model, load the given program into it and collect its contract traces.

        :param test_case: Program to trace, as a list of annotated instructions
        :param input_data: Inputs to trace the program with
        :param obs_clause: Observation clause passed to `_get_model` (default: "ct")
        :param exec_clause: Execution clauses passed to `_get_model` (default: ["seq"])
        :param data_bases: Pair of base addresses passed to `_get_model`
        :param nesting: Nesting value forwarded to `trace_test_case`
        :param enable_mismatch_check: Whether the model is created in mismatch-check mode
        :param pte_mask: When non-zero, AND-ed into `data_properties` of the "main" actor
        :return: Contract traces returned by the model
        """
        clauses = ["seq"] if exec_clause is None else exec_clause
        model = self._get_model(obs_clause, clauses, data_bases, enable_mismatch_check)

        tc = test_case.to_test_case()
        if pte_mask != 0:
            main_actor = tc.find_actor(name="main")
            main_actor.data_properties &= pte_mask  # type: ignore

        model.load_test_case(tc)
        return model.trace_test_case(input_data, nesting=nesting)

    def test_no_trace(self) -> None:
        """Tracing with an empty list of inputs must return an empty list of traces."""
        program = InstList([Inst("xor rax, rax", 3, 0, 0)], backend=self._backend)
        no_inputs: List[InputData] = []

        ctraces = self._get_trace(test_case=program, input_data=no_inputs)

        self.assertEqual(len(ctraces), 0)

    def test_mismatch_check_mode(self) -> None:
        """Check the six-value trace produced in mismatch-check mode for a register-only test.

        The only instruction zeroes RAX; the remaining five values are expected to equal
        the inputs assigned to RBX, RCX, RDX, RSI and RDI.
        """
        program = InstList([Inst("xor rax, rax", 3, 0, 0)], backend=self._backend)

        # Give every register a distinct value: RAX=1, RBX=2, ..., RDI=6
        input_ = InputData()
        for value, reg in enumerate((RAX, RBX, RCX, RDX, RSI, RDI), start=1):
            input_[0]['gpr'][reg] = value

        ctraces = self._get_trace(
            test_case=program, input_data=[input_], enable_mismatch_check=True)

        reg_values = ctraces[0].get_untyped()
        expected_values = [0, 2, 3, 4, 5, 6]  # RAX cleared by the xor, the rest untouched
        self.assertEqual(len(reg_values), len(expected_values))
        for position, expected in enumerate(expected_values):
            self.assertEqual(reg_values[position], expected)

    def test_mismatch_check_mode_2(self) -> None:
        """Check mismatch-check mode when RAX is loaded from memory written by the test.

        The program stores 42 to [r14] and loads it back into RAX, so the first of the six
        reported values must equal the stored value; the other five must keep the default
        register value of the input.
        """
        test_case = InstList(
            [
                # REX prefix + opcode + ModRM + imm32 = 7 bytes (same length as the
                # identical store in test_ct_bpas)
                Inst("mov qword ptr [r14], 42", 7, MAIN_OFFSET + 0, TEST_MEM_VALUE_A),
                Inst("mov rax, qword ptr [r14]", 3, MAIN_OFFSET + 0, TEST_MEM_VALUE_A),
            ],
            backend=self._backend,
        )
        input_ = self._input_builder.get_default_input()

        ctraces = self._get_trace(
            test_case=test_case,
            input_data=[input_],
            enable_mismatch_check=True,
        )

        reg_values = ctraces[0].get_untyped()
        self.assertEqual(len(reg_values), 6)
        # RAX holds the value loaded by the second instruction
        self.assertEqual(reg_values[0], test_case[1].mem_value)
        # The remaining registers are never written by the program
        for position in range(1, 6):
            self.assertEqual(reg_values[position], REG_DEFAULT_VALUE)

    @skip_for_backend("dr")
    def test_l1d_seq(self) -> None:
        """Check the trace of a single load under the `l1d` observation clause."""
        program = InstList(
            [Inst("mov rax, qword ptr [r14]", 3, MAIN_OFFSET + 0, 1)],
            backend=self._backend,
        )
        ctraces = self._get_trace(
            test_case=program,
            input_data=[self._input_builder.get_default_input()],
            obs_clause="l1d",
        )

        expected = program.get_expected_observations([0], False, True, False)
        trace = ctraces[0]
        self.assertEqual(trace.get_untyped(), expected)
        # Printed form: a single "^" followed by 63 dots
        self.assertEqual(str(trace), "^" + "." * 63)

    def test_ct_seq(self) -> None:
        """Check the `ct` trace of a sequentially executed program with a taken branch.

        `xor rax, rax` sets ZF, so `jz .l1` jumps over the load; the expected observations
        therefore come from entries 0, 1 and 4 of the program only.
        """
        program = InstList(
            [
                Inst("xor rax, rax", 3, 0, 0),
                Inst("jz .l1", 2, 0, 0),
                Inst(".l0:", 0, 0, 0),
                Inst("mov rax, qword ptr [r14]", 3, MAIN_OFFSET + 0, 1),
                Inst(".l1:", 0, 0, 0),
            ],
            backend=self._backend,
        )
        ctraces = self._get_trace(
            test_case=program, input_data=[self._input_builder.get_default_input()])

        expected = program.get_expected_observations([0, 1, 4], True, True, False)
        self.assertEqual(ctraces[0].get_untyped(), expected)

    def test_checkpoint_rollback_registers(self) -> None:
        """Check that RAX is 0 at the end when the skipped load is reachable only under `cond`.

        The load between `.l0` and `.l1` is on the not-taken side of the branch; with the
        `cond` execution clause the final RAX value must still be the result of the xor.
        """
        program = InstList(
            [
                Inst("xor rax, rax", 3, 0, 0),
                Inst("jz .l1", 2, 0, 0),
                Inst(".l0:", 0, 0, 0),
                Inst("mov rax, qword ptr [r14]", 3, MAIN_OFFSET + 0, 1),
                Inst(".l1:", 0, 0, 0),
            ],
            backend=self._backend,
        )
        ctraces = self._get_trace(
            test_case=program,
            input_data=[InputData()],
            exec_clause=["cond"],
            enable_mismatch_check=True,
        )

        final_regs = ctraces[0].get_untyped()
        self.assertEqual(len(final_regs), 6)
        self.assertEqual(final_regs[0], 0)

    def test_checkpoint_rollback_memory(self) -> None:
        """Check that a store on the not-taken path does not change what the final load reads.

        The store to [r14] sits between `.l0` and `.l1`, which the taken `jz` jumps over;
        the load after `.l1` must therefore return the initial memory value.
        """
        program = InstList(
            [
                Inst("xor rax, rax", 3, 0, 0),
                Inst("jz .l1", 2, 0, 0),
                Inst(".l0:", 0, 0, 0),
                Inst("mov qword ptr [r14], 1", 7, MAIN_OFFSET + 0, 1),
                Inst(".l1:", 0, 0, 0),
                Inst("mov rax, qword ptr [r14]", 3, MAIN_OFFSET + 0, 1),
            ],
            backend=self._backend,
        )
        initial_state = InputData()
        initial_state[0]['main'][0] = TEST_MEM_VALUE_B

        ctraces = self._get_trace(
            test_case=program,
            input_data=[initial_state],
            exec_clause=["cond"],
            enable_mismatch_check=True,
        )

        final_regs = ctraces[0].get_untyped()
        self.assertEqual(len(final_regs), 6)
        self.assertEqual(final_regs[0], TEST_MEM_VALUE_B)  # RAX: untouched memory value

    def test_checkpoint_rollback_nested(self) -> None:
        """Check final register values for two nested not-taken paths (`cond`, nesting=2).

        Both stores and the write to RBX lie on paths that the taken branches jump over,
        so RAX must end up with the initial memory value and RBX with its input value.
        """
        program = InstList(
            [
                Inst("xor rax, rax", 3, 0, 0),  # 8
                Inst("jz .l2", 2, 0, 0),  # 11 0xb
                Inst(".l0:", 0, 0, 0),  # 13
                Inst("mov qword ptr [r14], 1", 7, MAIN_OFFSET + 0, 1),  # 13  0xd
                Inst("jz .l2", 2, 0, 0),  # 20 0x14
                Inst(".l1:", 0, 0, 0),  # 22 0x16
                Inst("mov qword ptr [r14], 2", 7, MAIN_OFFSET + 0, 1),  # 22 0x16
                Inst("mov rbx, 1", 7, 0, 0),  # 29  0x1d
                Inst(".l2:", 0, 0, 0),  # 36  0x24
                Inst("mov rax, qword ptr [r14]", 3, MAIN_OFFSET + 0, 1),  # 36
            ],
            backend=self._backend,
        )
        initial_state = InputData()
        initial_state[0]['main'][0] = TEST_MEM_VALUE_B
        initial_state[0]['gpr'][RBX] = 0x1

        ctraces = self._get_trace(
            test_case=program,
            input_data=[initial_state],
            exec_clause=["cond"],
            nesting=2,
            enable_mismatch_check=True,
        )

        final_regs = ctraces[0].get_untyped()
        self.assertEqual(len(final_regs), 6)
        self.assertEqual(final_regs[0], TEST_MEM_VALUE_B)  # RAX
        self.assertEqual(final_regs[1], 1)  # RBX

    def test_ct_cond(self) -> None:
        """Check the `ct` trace under the `cond` execution clause with the default nesting."""
        program = InstList(
            [
                Inst("xor rax, rax", 3, 0, 0),  # 8
                Inst("jz .l2", 2, 0, 0),  # 11 0xb
                Inst(".l0:", 0, 0, 0),  # 13
                Inst("mov qword ptr [r14], 1", 7, MAIN_OFFSET + 0, 1),  # 13  0xd
                Inst("jz .l2", 2, 0, 0),  # 20 0x14
                Inst(".l1:", 0, 0, 0),  # 22 0x16
                Inst("mov qword ptr [r14], 2", 7, MAIN_OFFSET + 0, 1),  # 22 0x16
                Inst("mov rbx, 1", 7, 0, 0),  # 29  0x1d
                Inst(".l2:", 0, 0, 0),  # 36  0x24
                Inst("mov rax, qword ptr [r14]", 3, MAIN_OFFSET + 0, 1),  # 36
            ],
            backend=self._backend,
        )
        ctraces = self._get_trace(
            test_case=program,
            input_data=[self._input_builder.get_default_input()],
            exec_clause=["cond"],
        )
        self.assertEqual(len(ctraces), 1)

        # Program entries expected to be observed, in order
        observed_entries = [
            0,
            1,  # first misprediction
            3,
            4,  # no misprediction on the second branch (nesting = 1)
            9,  # first rollback
            9,  # exit
        ]
        expected = program.get_expected_observations(observed_entries, True, True, False)

        self.assertEqual(ctraces[0].get_untyped(), expected)

    def test_ct_cond_double(self) -> None:
        """Check the `ct` trace under the `cond` execution clause with nesting set to 2."""
        program = InstList(
            [
                Inst("xor rax, rax", 3, 0, 0),  # 8
                Inst("jz .l2", 2, 0, 0),  # 11 0xb
                Inst(".l0:", 0, 0, 0),  # 13
                Inst("mov qword ptr [r14], 1", 7, MAIN_OFFSET + 0, 1),  # 13  0xd
                Inst("jz .l2", 2, 0, 0),  # 20 0x14
                Inst(".l1:", 0, 0, 0),  # 22 0x16
                Inst("mov qword ptr [r14], 2", 7, MAIN_OFFSET + 0, 1),  # 22 0x16
                Inst("mov rbx, 1", 7, 0, 0),  # 29  0x1d
                Inst(".l2:", 0, 0, 0),  # 36  0x24
                Inst("mov rax, qword ptr [r14]", 3, MAIN_OFFSET + 0, 1),  # 36
            ],
            backend=self._backend,
        )
        ctraces = self._get_trace(
            test_case=program,
            input_data=[self._input_builder.get_default_input()],
            exec_clause=["cond"],
            nesting=2,
        )
        self.assertEqual(len(ctraces), 1)

        # Program entries expected to be observed, in order
        observed_entries = [
            0,
            1,  # first misprediction
            3,
            4,  # second misprediction
            6,
            7,
            9,  # first rollback
            9,  # second rollback
            9,  # exit
        ]
        expected = program.get_expected_observations(observed_entries, True, True, False)

        self.assertEqual(ctraces[0].get_untyped(), expected)

    def test_rollback_on_fence(self) -> None:
        """Check that, under `cond`, nothing after an `lfence` on the not-taken path is traced.

        The expected observations contain the first load and the `lfence` on the path the
        taken branch skips, but not the second load that follows the fence.
        """
        test_case = InstList(
            [
                Inst("xor rax, rax", 3, 0, 0),
                Inst("jz .l1", 2, 0, 0),
                Inst(".l0:", 0, 0, 0),
                Inst("mov rax, qword ptr [r14]", 3, MAIN_OFFSET + 0, 1),
                # LFENCE is encoded as 0F AE E8, i.e. 3 bytes
                Inst("lfence", 3, 0, 0),
                # REX prefix + opcode + ModRM + disp8 = 4 bytes
                Inst("mov rax, qword ptr [r14 + 2]", 4, MAIN_OFFSET + 2, 2),
                Inst(".l1:", 0, 0, 0),
            ],
            backend=self._backend,
        )
        input_ = self._input_builder.get_default_input()
        ctraces = self._get_trace(
            exec_clause=["cond"],
            test_case=test_case,
            input_data=[input_],
        )
        self.assertEqual(len(ctraces), 1)

        # Entry 5 (the load after the fence) must be absent from the trace
        expected_trace = test_case.get_expected_observations([0, 1, 3, 4, 6], True, True, False)
        self.assertEqual(ctraces[0].get_untyped(), expected_trace)

    @skip_for_backend("dr")
    def test_ct_bpas(self) -> None:
        """Check the `ct` trace of a store followed by dependent loads under `bpas`.

        The expected trace contains the two loads twice: first with the address of the
        dependent load derived from the default memory value, then again with the address
        derived from the stored value.
        """
        test_case = InstList(
            [
                Inst("mov qword ptr [r14], 42", 7, MAIN_OFFSET + 0, TEST_MEM_VALUE_A),
                Inst("mov rax, qword ptr [r14]", 3, MAIN_OFFSET + 0, TEST_MEM_VALUE_A),
                Inst("mov rax, qword ptr [r14 + rax]", 4, MAIN_OFFSET + TEST_MEM_VALUE_A, 0),
            ],
            backend=self._backend,
        )
        ctraces = self._get_trace(
            exec_clause=["bpas"],
            test_case=test_case,
            input_data=[self._input_builder.get_default_input()],
        )

        store, load, dependent_load, end = [test_case[i] for i in range(4)]
        stale_rax = MEM_DEFAULT_VALUE  # value read when the load bypasses the store
        expected_trace: List[int] = [
            store.pc_offset,
            store.mem_address,
            # speculative
            load.pc_offset,
            load.mem_address,
            dependent_load.pc_offset,
            MAIN_OFFSET + stale_rax,
            end.pc_offset,
            # after rollback
            load.pc_offset,
            load.mem_address,
            dependent_load.pc_offset,
            dependent_load.mem_address,
            end.pc_offset,
        ]

        self.assertEqual(ctraces[0].get_untyped(), expected_trace)

    @skip_for_backend("dr")
    def test_fault_handling(self) -> None:
        """Check that the sequential trace ends at a faulting load.

        The trace must contain the observations of the first instruction followed by the
        default stack pointer value, and nothing from the two instructions after it.
        """
        program = InstList(
            [
                Inst("mov rax, qword ptr [r14 + 0x1000]", 7, FAULTY_OFFSET, 0),
                Inst("mov rax, qword ptr [r14 + rax]", 4, MAIN_OFFSET + 3, 0),
                Inst("mov rbx, qword ptr [r14 + rbx]", 4, MAIN_OFFSET + REG_DEFAULT_VALUE, 0),
            ],
            backend=self._backend,
        )
        ctraces = self._get_trace(
            test_case=program,
            input_data=[self._input_builder.get_default_input()],
            nesting=1,
            pte_mask=PF_MASK,
        )

        # Fault at instruction 0: PC, mem_addr, and RSP (fault handler stack)
        faulting_access = program.get_expected_observations([0], True, True, False)
        faulting_access.append(RSP_DEFAULT_VALUE)  # Stack pointer from fault handler
        self.assertEqual(ctraces[0].get_untyped(), faulting_access)

    @skip_for_backend("dr")
    def test_ct_deh(self) -> None:
        """Check the `ct` trace under the `delayed-exception-handling` execution clause.

        After the faulting load, the expected trace holds only the PC of the second
        instruction (no memory address) and the full observation of the third one.
        """
        program = InstList(
            [
                Inst("mov rax, qword ptr [r14 + 0x1000]", 7, FAULTY_OFFSET, 0),
                Inst("mov rax, qword ptr [r14 + rax]", 4, MAIN_OFFSET + 3, 0),
                Inst("mov rbx, qword ptr [r14 + rbx]", 4, MAIN_OFFSET + REG_DEFAULT_VALUE, 0),
            ],
            backend=self._backend,
        )
        ctraces = self._get_trace(
            exec_clause=["delayed-exception-handling"],
            test_case=program,
            input_data=[self._input_builder.get_default_input()],
            pte_mask=PF_MASK,
        )

        faulty_load, dependent_load, independent_load, end = [program[i] for i in range(4)]
        # DEH: fault at 0, continue speculatively to 2, then handle fault
        expected_trace: List[int] = [
            faulty_load.pc_offset,
            faulty_load.mem_address,
            RSP_DEFAULT_VALUE,
            dependent_load.pc_offset,
            independent_load.pc_offset,
            independent_load.mem_address,
            end.pc_offset,
        ]
        self.assertEqual(ctraces[0].get_untyped(), expected_trace)

    @skip_for_backend("dr")
    def test_ct_nullinj_assist(self) -> None:
        """Check the `ct` trace under the `nullinj-assist` execution clause.

        The expected trace is spelled out by hand because the flow is not linear: fault,
        re-execution with zero injected into RAX, and a final fault-free re-execution.
        """
        program = InstList(
            [
                Inst("mov rax, qword ptr [r14 + 0x1000]", 7, FAULTY_OFFSET, 0),
                Inst("mov rax, qword ptr [r14 + rax]", 4, MAIN_OFFSET + 3, 0),
                Inst("mov rbx, qword ptr [r14 + rbx]", 4, MAIN_OFFSET + REG_DEFAULT_VALUE, 0),
            ],
            backend=self._backend,
        )
        ctraces = self._get_trace(
            exec_clause=["nullinj-assist"],
            test_case=program,
            input_data=[self._input_builder.get_default_input()],
            pte_mask=PF_MASK,
        )

        faulty_load, dependent_load, independent_load, end = [program[i] for i in range(4)]
        injected_rax = 0
        expected_trace: List[int] = [
            # fault
            faulty_load.pc_offset,
            faulty_load.mem_address,
            RSP_DEFAULT_VALUE,
            # re-execute with changed permissions and inject zero into rax
            faulty_load.pc_offset,
            faulty_load.mem_address,
            # execute with speculative rax
            dependent_load.pc_offset,  # traced twice due to a quirk in Unicorn
            dependent_load.pc_offset,
            MAIN_OFFSET + injected_rax,
            independent_load.pc_offset,
            independent_load.mem_address,
            end.pc_offset,  # measurement_end
            # rollback and re-execute without a fault
            faulty_load.pc_offset,
            faulty_load.mem_address,
            dependent_load.pc_offset,
            dependent_load.mem_address,
            independent_load.pc_offset,
            independent_load.mem_address,
            end.pc_offset,  # measurement_end
        ]

        self.assertEqual(ctraces[0].get_untyped(), expected_trace)

    @skip_for_backend("dr")
    def test_ct_nullinj_term(self) -> None:
        """Check the `ct` trace under the `nullinj-fault` execution clause.

        Same start as the assist variant (fault, then re-execution with zero injected
        into RAX), but the expected trace stops there: no second, fault-free pass.
        """
        program = InstList(
            [
                Inst("mov rax, qword ptr [r14 + 0x1000]", 7, FAULTY_OFFSET, 0),
                Inst("mov rax, qword ptr [r14 + rax]", 4, MAIN_OFFSET + 3, 0),
                Inst("mov rbx, qword ptr [r14 + rbx]", 4, MAIN_OFFSET + REG_DEFAULT_VALUE, 0),
            ],
            backend=self._backend,
        )
        ctraces = self._get_trace(
            exec_clause=["nullinj-fault"],
            test_case=program,
            input_data=[self._input_builder.get_default_input()],
            pte_mask=PF_MASK,
        )

        faulty_load, dependent_load, independent_load, end = [program[i] for i in range(4)]
        injected_rax = 0
        expected_trace: List[int] = [
            # fault
            faulty_load.pc_offset,
            faulty_load.mem_address,
            RSP_DEFAULT_VALUE,
            # re-execute with changed permissions and inject zero into rax
            faulty_load.pc_offset,
            faulty_load.mem_address,
            # execute with speculative rax (terminates without rollback)
            dependent_load.pc_offset,  # traced twice due to a quirk in Unicorn
            dependent_load.pc_offset,
            MAIN_OFFSET + injected_rax,
            independent_load.pc_offset,
            independent_load.mem_address,
            end.pc_offset,  # end nop
        ]

        self.assertEqual(ctraces[0].get_untyped(), expected_trace)

    @skip_for_backend("dr")
    def test_ct_meltdown(self) -> None:
        """Check the `ct` trace under the `meltdown` execution clause.

        After the faulting load is re-executed, the dependent load is expected to use the
        default value of the faulty memory area as its RAX offset.
        """
        test_case = InstList(
            [
                Inst("mov rax, qword ptr [r14 + 0x1000]", 7, FAULTY_OFFSET, 0),
                Inst("mov rax, qword ptr [r14 + rax]", 4, MAIN_OFFSET + 3, 0),
                Inst("mov rbx, qword ptr [r14 + rbx]", 4, MAIN_OFFSET + REG_DEFAULT_VALUE, 0),
            ],
            # Use the backend of the running test class, like every other test here,
            # instead of a hard-coded "uc"
            backend=self._backend,
        )
        input_ = self._input_builder.get_default_input()
        ctraces = self._get_trace(
            exec_clause=["meltdown"], test_case=test_case, input_data=[input_], pte_mask=PF_MASK)

        # Meltdown: fault, re-execute with leaked value, speculate
        expected_trace: List[int] = []
        # fault
        expected_trace.append(test_case[0].pc_offset)
        expected_trace.append(test_case[0].mem_address)
        expected_trace.append(RSP_DEFAULT_VALUE)
        # re-execute with changed permissions and inject leaked value into rax
        expected_trace.append(test_case[0].pc_offset)
        expected_trace.append(test_case[0].mem_address)
        rax = MEM_FAULTY_DEFAULT_VALUE
        # execute with speculative rax containing leaked data
        expected_trace.append(test_case[1].pc_offset)
        expected_trace.append(MAIN_OFFSET + rax)
        expected_trace.append(test_case[2].pc_offset)
        expected_trace.append(test_case[2].mem_address)
        expected_trace.append(test_case[3].pc_offset)  # measurement_end

        self.assertEqual(ctraces[0].get_untyped(), expected_trace)

    @skip_for_backend("dr")
    def test_arch_seq(self) -> None:
        """Check the trace of a sequentially executed program under the `arch` clause.

        The expected trace starts with seven default register values and continues with
        the observations (PC, memory addresses, and values) of entries 0, 1 and 4.
        """
        program = InstList(
            [
                Inst("xor rax, rax", 3, 0, 0),
                Inst("jz .l1", 2, 0, 0),
                Inst(".l0:", 0, 0, 0),
                Inst("mov rax, qword ptr [r14]", 3, MAIN_OFFSET + 0, 1),
                Inst(".l1:", 0, 0, 0),
            ],
            backend=self._backend,
        )
        ctraces = self._get_trace(
            obs_clause="arch",
            test_case=program,
            input_data=[self._input_builder.get_default_input()],
        )
        self.assertEqual(len(ctraces), 1)

        # Initial register state (7 registers) comes first in the trace
        initial_regs = [REG_DEFAULT_VALUE] * 7
        executed = program.get_expected_observations([0, 1, 4], True, True, True)

        self.assertEqual(ctraces[0].get_untyped(), initial_regs + executed)

    @skip_for_backend("uc")
    def test_ind(self) -> None:
        """Check the `ind` trace of one indirect call and the matching return."""
        program = InstList(
            [
                Inst("xor rax, rax", 3, 0, 0),
                Inst("lea rax,qword ptr [rip+.l0]", 7, 0, 0),
                Inst("call rax", 2, 0, 0),
                Inst(".end:", 0, 0, 0),
                Inst("jmp .l2", 2, 0, 0),
                Inst(".l0:", 0, 0, 0),
                Inst("mov rax, qword ptr [r14]", 3, MAIN_OFFSET + 0, 1),
                Inst("ret", 1, 0, 0),
                Inst(".l2:", 0, 0, 0),
            ],
            backend=self._backend,
        )
        ctraces = self._get_trace(
            obs_clause="ind",
            test_case=program,
            input_data=[self._input_builder.get_default_input()],
        )
        self.assertEqual(len(ctraces), 1)

        expected_trace: List[int] = [
            # Call (src and dest)
            program[3].pc_offset,
            program[6].pc_offset,
            # Ret (src and dest)
            program[8].pc_offset,
            program[4].pc_offset,
        ]

        # Note: last two rets are inserted by the instrumentation: ignore them
        self.assertEqual(ctraces[0].get_untyped()[:-2], expected_trace)

    @skip_for_backend("uc")
    def test_ind_spec(self) -> None:
        """Check the `ind` trace under `cond` when the calls sit on the not-taken path.

        Only the first call and its return are expected in the trace; the second call,
        which follows a load from address 0, must not show up.
        """
        program = InstList(
            [
                Inst("xor rax, rax", 3, 0, 0),
                Inst("jz .end", 2, 0, 0),
                Inst(".l0:", 0, 0, 0),
                Inst("lea rax,qword ptr [rip+.l3]", 7, 0, 0),
                Inst("call rax", 2, 0, 0),
                Inst(".l1:", 0, 0, 0),
                Inst("xor rax, rax", 3, 0, 0),
                Inst("mov rax, qword ptr [rax]", 3, MAIN_OFFSET + 0, 1),
                Inst("call rax", 2, 0, 0),
                Inst(".l2:", 0, 0, 0),
                Inst("jmp .end", 2, 0, 0),
                Inst(".l3:", 0, 0, 0),
                Inst("mov rax, qword ptr [r14]", 3, MAIN_OFFSET + 0, 1),
                Inst("ret", 1, 0, 0),
                Inst(".end:", 0, 0, 0),
            ],
            backend=self._backend,
        )
        ctraces = self._get_trace(
            obs_clause="ind",
            exec_clause=["cond"],
            test_case=program,
            input_data=[self._input_builder.get_default_input()],
        )
        self.assertEqual(len(ctraces), 1)

        expected_trace: List[int] = [
            # Call (src and dest)
            program[5].pc_offset,
            program[13].pc_offset,
            # Ret (src and dest)
            program[14].pc_offset,
            program[6].pc_offset,
        ]

        # Note: last two rets are inserted by the instrumentation: ignore them
        self.assertEqual(ctraces[0].get_untyped()[:-2], expected_trace)

    @skip_for_backend("uc")
    def test_ind_poison(self) -> None:
        """Check the `ind` trace under `cond` when the model has a poison value set.

        Unlike in `test_ind_spec`, the second call is expected in the trace, with the
        poison value (relative to the code base) as its destination.
        """
        program = InstList(
            [
                Inst("xor rax, rax", 3, 0, 0),
                Inst("jz .end", 2, 0, 0),
                Inst(".l0:", 0, 0, 0),
                Inst("lea rax,qword ptr [rip+.l3]", 7, 0, 0),
                Inst("call rax", 2, 0, 0),
                Inst(".l1:", 0, 0, 0),
                Inst("xor rax, rax", 3, 0, 0),
                Inst("mov rax, qword ptr [rax]", 3, MAIN_OFFSET + 0, 1),
                Inst("call rax", 2, 0, 0),
                Inst(".l2:", 0, 0, 0),
                Inst("jmp .end", 2, 0, 0),
                Inst(".l3:", 0, 0, 0),
                Inst("mov rax, qword ptr [r14]", 3, MAIN_OFFSET + 0, 1),
                Inst("ret", 1, 0, 0),
                Inst(".end:", 0, 0, 0),
            ],
            backend=self._backend,
        )
        default_input = self._input_builder.get_default_input()

        # The model is built by hand here because the poison value has to be set on it
        # before the test case is loaded
        model = self._get_model("ind", ["cond"], (DATA_BASE, CODE_BASE))
        model.poison_value = POISON_VALUE  # type: ignore
        model.load_test_case(program.to_test_case())

        ctraces = model.trace_test_case([default_input], 1)
        code_start = model.layout.code_start()
        self.assertEqual(len(ctraces), 1)

        expected_trace: List[int] = [
            # Call (src and dest)
            program[5].pc_offset,
            program[13].pc_offset,
            # Ret (src and dest)
            program[14].pc_offset,
            program[6].pc_offset,
            # Second call: this is reachable only if speculation doesn't get rolled-back
            # on the previous faulty load.
            program[9].pc_offset,
            # The call should be trying to jump to the poison value
            model.poison_value - code_start,  # type: ignore
        ]

        # Note: last two rets are inserted by the instrumentation: ignore them
        self.assertEqual(ctraces[0].get_untyped()[:-2], expected_trace)


class X86DRModelTest(_SharedX86Model):
    """Shared x86 model tests bound to the DynamoRIO backend, plus DR-only checks.

    Each test is skipped when the DynamoRIO installation check raises FileNotFoundError.
    """

    def __init__(self, methodName: str) -> None:
        super().__init__(methodName)
        self._backend = "dr"
        self._backend_long = "dynamorio"

    @classmethod
    def setUpClass(cls) -> None:
        cls._configure_class("dynamorio")

    @classmethod
    def tearDownClass(cls) -> None:
        cls._teardown_class()

    def setUp(self) -> None:
        # Bail out before the shared fixture runs if the backend is unavailable
        self._skip_if_not_installed()
        super().setUp()

    def _skip_if_not_installed(self) -> None:
        """Skip the running test when DynamoRIO cannot be found."""
        try:
            DynamoRIOModel._check_if_installed()
        except FileNotFoundError:
            self.skipTest("DynamoRIO is not installed")

    def _get_model(self,
                   obs_clause: str,
                   exec_clause: List[str],
                   data_bases: Tuple[int, int],
                   enable_mismatch_check: bool = False) -> DynamoRIOModel:
        """Write the requested contract into CONF and build a DynamoRIO model from it."""
        CONF.contract_observation_clause = obs_clause
        CONF.contract_execution_clause = exec_clause
        CONF.model_backend = "dynamorio"
        dr_model = get_model(data_bases, enable_mismatch_check_mode=enable_mismatch_check)
        assert isinstance(dr_model, DynamoRIOModel)
        return dr_model

    def test_clause_configuration(self) -> None:
        bases = (DATA_BASE, CODE_BASE)

        # A supported pair of clauses is accepted and recorded on the model
        valid_model = self._get_model("ct", ["seq"], bases)
        self.assertEqual(valid_model._obs_clause_name, "ct")
        self.assertEqual(valid_model._exec_clause_name, "seq")

        # An unknown observation clause is rejected; the message lists a supported one
        with self.assertRaises(ConfigException) as obs_failure:
            self._get_model("invalid", ["seq"], bases)
        obs_message = str(obs_failure.exception)
        self.assertIn("unsupported observation clause", obs_message)
        self.assertIn("- ct", obs_message)

        # Same for an unknown execution clause
        with self.assertRaises(ConfigException) as exec_failure:
            self._get_model("ct", ["invalid"], bases)
        exec_message = str(exec_failure.exception)
        self.assertIn("unsupported execution clause", exec_message)
        self.assertIn("- seq", exec_message)

        # The direct interface on the model raises ValueError for either invalid clause
        direct_model = DynamoRIOModel(bases)
        for bad_obs, bad_exec in (("invalid", "seq"), ("ct", "invalid")):
            with self.assertRaises(ValueError):
                direct_model.configure_clauses(bad_obs, bad_exec)

        self._restore_conf()

    def test_load_test_case(self) -> None:
        model = self._get_model("ct", ["seq"], (DATA_BASE, CODE_BASE))
        program = InstList([Inst("xor rax, rax", 3, 0, 0)], backend=self._backend)
        model.load_test_case(program.to_test_case())

        # Loading must leave behind a non-empty RCBF file
        self.assertIsNotNone(model._files.rcbf)
        assert model._files.rcbf is not None
        with open(model._files.rcbf, "rb") as rcbf_file:
            rcbf_contents = rcbf_file.read()
        self.assertNotEqual(len(rcbf_contents), 0)

        self._restore_conf()

    def test_tc_dispatch(self) -> None:
        # Tracing is expected to produce both an RDBF and an RCBF file
        model = self._get_model("ct", ["seq"], (DATA_BASE, CODE_BASE))
        first_program = InstList([Inst("xor rax, rax", 3, 0, 0)], backend=self._backend)
        model.load_test_case(first_program.to_test_case())
        model.trace_test_case([InputData()], 1)

        # RDBF
        self.assertIsNotNone(model._files.rdbf)
        assert model._files.rdbf is not None
        with open(model._files.rdbf, "rb") as rdbf_file:
            first_rdbf = rdbf_file.read()
        self.assertNotEqual(len(first_rdbf), 0)
        # FIXME: the next two statements should be a part of test_case_data tests
        self.assertEqual(first_rdbf[0], 1)  # number of actors
        self.assertEqual(first_rdbf[8], 1)  # number of inputs

        # RCBF
        self.assertIsNotNone(model._files.rcbf)
        assert model._files.rcbf is not None
        with open(model._files.rcbf, "rb") as rcbf_file:
            first_rcbf = rcbf_file.read()
        self.assertEqual(first_rcbf[0], 1)  # number of actors

        # A different program with a different input must replace the contents of both files
        second_program = InstList(
            [
                Inst("xor rax, rax", 3, 0, 0),
                Inst("jz .l1", 2, 0, 0),
                Inst(".l0:", 0, 0, 0),
                Inst("mov rax, qword ptr [r14]", 3, MAIN_OFFSET + 0, 1),
                Inst(".l1:", 0, 0, 0),
            ],
            backend=self._backend,
        )
        second_tc = second_program.to_test_case()
        second_input = InputData()
        second_input[0]["main"][0] = TEST_MEM_VALUE_A
        model.load_test_case(second_tc)
        model.trace_test_case([second_input], 1)

        with open(model._files.rcbf, "rb") as rcbf_file:
            second_rcbf = rcbf_file.read()
        self.assertNotEqual(len(second_rcbf), 0)
        self.assertNotEqual(first_rcbf, second_rcbf)

        with open(model._files.rdbf, "rb") as rdbf_file:
            second_rdbf = rdbf_file.read()
        self.assertNotEqual(len(second_rdbf), 0)
        self.assertNotEqual(first_rdbf, second_rdbf)

        self._restore_conf()


class UnicornModelTest(_SharedX86Model):  # pylint: disable=too-many-public-methods
    """Shared x86 model tests bound to the Unicorn backend."""

    def __init__(self, methodName: str) -> None:
        super().__init__(methodName)
        self._backend = "uc"
        self._backend_long = "unicorn"

    @classmethod
    def setUpClass(cls) -> None:
        # Class-wide configuration: Unicorn backend with explicit ISA and data generator seed
        cls._configure_class(
            "unicorn",
            {
                'instruction_set': 'x86-64',
                'data_generator_seed': 10,
            },
        )

    @classmethod
    def tearDownClass(cls) -> None:
        cls._teardown_class()

    def _get_model(self,
                   obs_clause: str,
                   exec_clause: List[str],
                   data_bases: Tuple[int, int],
                   enable_mismatch_check: bool = False) -> X86UnicornModel:
        """Write the requested contract into CONF and build a Unicorn model from it."""
        CONF.contract_observation_clause = obs_clause
        CONF.contract_execution_clause = exec_clause
        CONF.model_backend = "unicorn"
        uc_model = get_model(data_bases, enable_mismatch_check_mode=enable_mismatch_check)
        assert isinstance(uc_model, X86UnicornModel)
        return uc_model


# Run the tests of this module when the file is executed directly
if __name__ == '__main__':
    unittest.main()


================================================
FILE: tests/x86_tests/unit_taint_tracker.py
================================================
"""
File: collection of tests for the taint tracking logic in all model backends

Copyright (C) Microsoft Corporation
SPDX-License-Identifier: MIT
"""
# pylint: disable=missing-function-docstring
# pylint: disable=missing-class-docstring
# pylint: disable=too-many-public-methods

import unittest
from abc import ABC
from typing import List, Tuple, Union
from copy import deepcopy

from rvzr.model_unicorn.model import X86UnicornModel
from rvzr.model_dynamorio.model import DynamoRIOModel
from rvzr.tc_components.test_case_data import InputData, InputTaint
from rvzr.traces import CTrace
from rvzr.factory import get_model
from rvzr.config import CONF, Conf
from rvzr.logs import update_logging_after_config_change

from .model_common import Inst, InstList, DATA_BASE, CODE_BASE, Backend, \
    RAX, RBX, RCX, FLAGS, XMM0, InputBuilder


# ==================================================================================================
# Tests
# ==================================================================================================
class _SharedTaintTrackerTest(ABC, unittest.TestCase):
    """Abstract base class for X86 taint tracking tests.

    Every test builds a short instruction sequence, traces it with taint tracking enabled
    (observation clause "ct", execution clause "seq"), and checks which input elements
    are reported as tainted.

    Subclasses must define:
        _backend: Backend type ("dr" or "uc")
        _model_backend_name: Model backend name ("dynamorio" or "unicorn")
    """

    # Snapshot of the global configuration taken in setUpClass and restored in tearDownClass
    _prev_conf: Conf
    _backend: Backend
    _model_backend_name: str

    # Exclude this parent class from test discovery
    @classmethod
    def setUpClass(cls) -> None:
        """Snapshot CONF and configure it for taint tracking tests.

        :raises unittest.SkipTest: when invoked on the abstract base class itself
        :raises TypeError: when a subclass does not define the required class attributes
        """
        if cls is _SharedTaintTrackerTest:
            raise unittest.SkipTest("Skipping base class")
        # Validate that subclass defines required attributes
        if not hasattr(cls, '_backend') or not hasattr(cls, '_model_backend_name'):
            raise TypeError(
                f"{cls.__name__} must define class attributes '_backend' and '_model_backend_name'")
        # Save and configure settings for taint tracking tests
        cls._prev_conf = deepcopy(CONF)
        CONF.instruction_set = "x86-64"
        CONF.model_backend = cls._model_backend_name
        CONF._no_generation = True  # type: ignore
        CONF.logging_modes = []
        update_logging_after_config_change()

    @classmethod
    def tearDownClass(cls) -> None:
        """Restore the configuration saved by setUpClass and re-apply logging to match it."""
        # Restore configuration
        for attr, value in cls._prev_conf.__dict__.items():
            setattr(CONF, attr, value)
        # setUpClass re-applied logging after changing CONF.logging_modes; do the same after
        # the restore so the logging setup used by these tests does not leak into other classes
        update_logging_after_config_change()

    def __init__(self, methodName: str) -> None:
        super().__init__(methodName)
        self._input_builder = InputBuilder()

    def _get_model(self) -> Union[DynamoRIOModel, X86UnicornModel]:
        """Create a model configured for taint tracking."""
        CONF.contract_observation_clause = "ct"
        CONF.contract_execution_clause = ["seq"]
        CONF.model_backend = self._model_backend_name
        model = get_model((DATA_BASE, CODE_BASE), enable_mismatch_check_mode=False)
        assert isinstance(model, (DynamoRIOModel, X86UnicornModel))
        return model

    def _trace_with_taints(self, test_case: InstList,
                           inputs: List[InputData]) -> Tuple[List[CTrace], List[InputTaint]]:
        """Load the test case into a fresh model and trace it with taint tracking.

        :param test_case: Instruction list to convert into a test case and load
        :param inputs: Inputs to trace the test case with
        :return: Contract traces and input taints as returned by the model
        """
        model = self._get_model()
        tc = test_case.to_test_case()
        model.load_test_case(tc)
        ctraces, taints = model.trace_test_case_with_taints(inputs, nesting=1)
        return ctraces, taints

    def _run_taint_test(self, instructions: List[Inst], input_: InputData) -> InputTaint:
        """Run a taint test and return the taint result for the first input.

        :param instructions: List of instructions to execute
        :param input_: Input data to use for the test
        :return: Taint information for the first input
        """
        test_case = InstList(instructions, backend=self._backend)
        _, taints = self._trace_with_taints(test_case, [input_])
        return taints[0]

    def test_basic_taint(self) -> None:
        # RAX is part of the load address, so its input value is expected to be tainted
        instructions = [
            Inst("mov rax, qword ptr [r14 + rax]", 3, 0, 0),
        ]
        input_ = self._input_builder.get_input_with_zeroed_gprs(RAX)
        taint = self._run_taint_test(instructions, input_)
        self.assertTrue(taint[0]['gpr'][RAX])

    def test_reg_to_reg(self) -> None:
        # The load address is RAX + RBX, so both input registers are expected to be tainted
        instructions = [
            Inst("add rax, rbx", 0, 0, 0),
            Inst("mov rax, qword ptr [r14 + rax]", 0, 0, 0),
        ]
        input_ = self._input_builder.get_input_with_zeroed_gprs(RAX, RBX)
        taint = self._run_taint_test(instructions, input_)
        self.assertTrue(taint[0]['gpr'][RAX])
        self.assertTrue(taint[0]['gpr'][RBX])

    def test_mem_to_reg(self) -> None:
        # RAX is overwritten before it is used in an address, so only RBX (address of
        # the first load) and main[0] (value feeding the last address) are expected
        instructions = [
            Inst("mov rbx, qword ptr [r14 + rbx]", 0, 0, 0),  # main[0] -> RBX
            Inst("mov rax, rbx", 0, 0, 0),  # RBX -> RAX
            Inst("and rax, 0b1", 0, 0, 0),
            Inst("mov rax, qword ptr [r14 + rax]", 0, 0, 0),  # RAX tainted
        ]
        input_ = self._input_builder.get_input_with_zeroed_gprs(RAX, RBX)
        taint = self._run_taint_test(instructions, input_)
        self.assertFalse(taint[0]['gpr'][RAX])
        self.assertTrue(taint[0]['gpr'][RBX])
        self.assertTrue(taint[0]['main'][0])

    def test_load_to_store(self) -> None:
        # The stored RAX value is loaded back into RBX and then used as an address:
        # the input RAX is expected to be tainted, the overwritten input RBX is not
        instructions = [
            Inst("mov qword ptr [r14], rax", 0, 0, 0),  # RAX -> main[0]
            Inst("mov rbx, qword ptr [r14]", 0, 0, 0),  # main[0] -> RBX
            Inst("mov rax, qword ptr [r14 + rbx]", 0, 0, 0),  # RBX tainted
        ]
        input_ = self._input_builder.get_input_with_zeroed_gprs(RAX, RBX)
        taint = self._run_taint_test(instructions, input_)
        self.assertTrue(taint[0]['gpr'][RAX])
        self.assertFalse(taint[0]['gpr'][RBX])

    def test_unaligned_memory_access_taints_both_qwords(self) -> None:
        # Memory accesses spanning 8-byte boundaries must taint both qwords
        instructions = [
            Inst("mov rax, qword ptr [r14 + 0x4]", 0, 0, 0),  # main[0:1] -> RAX
            Inst("mov rax, qword ptr [r14 + rax]", 0, 0, 0),  # RAX tainted
        ]
        input_ = self._input_builder.get_input_with_zeroed_memory(main=0)
        input_[0]['main'][1] = 0
        taint = self._run_taint_test(instructions, input_)
        self.assertTrue(taint[0]['main'][0])
        self.assertTrue(taint[0]['main'][1])

    def test_simd_register_dependencies_are_tracked(self) -> None:
        # Taint tracking should work for SIMD (XMM) registers
        instructions = [
            Inst("movaps xmm0, xmm1", 0, 0, 0),  # XMM1 -> XMM0
            Inst("movaps xmmword ptr [r14], xmm0", 0, 0, 0),  # XMM0 -> main[0]
            Inst("mov rax, qword ptr [r14]", 0, 0, 0),  # main[0] -> RAX
            Inst("and rax, 0b1", 0, 0, 0),
            Inst("mov rax, qword ptr [r14 + rax]", 0, 0, 0),  # RAX tainted
        ]
        input_ = InputData()
        taint = self._run_taint_test(instructions, input_)
        self.assertTrue(taint[0]['simd'][XMM0])

    def test_32bit_writes_preserve_64bit_dependencies(self) -> None:
        # Writing to 32-bit registers (eax) should preserve dependencies from 64-bit (rax)
        instructions = [
            Inst("mov rax, rbx", 0, 0, 0),  # RBX -> RAX
            Inst("mov eax, ecx", 0, 0, 0),  # ECX -> EAX (RAX must remain dependent on RBX)
            Inst("mov rax, qword ptr [r14 + rax]", 0, 0, 0),  # RAX tainted
        ]
        input_ = self._input_builder.get_input_with_zeroed_gprs(RAX, RBX, RCX)
        taint = self._run_taint_test(instructions, input_)
        self.assertFalse(taint[0]['gpr'][RAX])
        self.assertTrue(taint[0]['gpr'][RBX])
        self.assertTrue(taint[0]['gpr'][RCX])

    def test_lea_address_computation_propagates_taint(self) -> None:
        # LEA computes addresses; operands used in address calculation should be tainted
        instructions = [
            Inst("lea rax, qword ptr [rbx]", 0, 0, 0),  # RBX -> RAX
            Inst("mov rax, qword ptr [r14 + rax]", 0, 0, 0),  # RAX tainted
        ]
        input_ = self._input_builder.get_input_with_zeroed_gprs(RAX, RBX)
        taint = self._run_taint_test(instructions, input_)
        self.assertFalse(taint[0]['gpr'][RAX])
        self.assertTrue(taint[0]['gpr'][RBX])

    def test_control_flow_dependency_taints_condition(self) -> None:
        # Data used in conditional branches creates control-flow dependencies
        instructions = [
            Inst("mov rax, qword ptr [r14 + 0x0]", 0, 0, 0),  # main[0] -> RAX
            Inst("cmp rax, 0", 0, 0, 0),  # RAX -> flags
            Inst("je .label", 0, 0, 0),  # Conditional branch on flags
            Inst(".label:", 0, 0, 0),
        ]
        input_ = self._input_builder.get_input_with_zeroed_gprs(RAX)
        taint = self._run_taint_test(instructions, input_)
        self.assertTrue(taint[0]['gpr'][FLAGS])
        self.assertTrue(taint[0]['main'][0])
        self.assertFalse(taint[0]['gpr'][RAX])


class X86DRTaintTrackerTest(_SharedTaintTrackerTest):
    """Taint tracking tests executed on the x86 DynamoRIO model backend.

    Each test is skipped when the DynamoRIO installation check raises FileNotFoundError.
    """

    _backend: Backend = "dr"
    _model_backend_name: str = "dynamorio"

    def _skip_if_not_installed(self) -> None:
        """Skip the running test when DynamoRIO cannot be found."""
        try:
            DynamoRIOModel._check_if_installed()  # type: ignore
        except FileNotFoundError:
            self.skipTest("DynamoRIO is not installed")

    def setUp(self) -> None:
        self._skip_if_not_installed()
        # Chain to the parent so any fixture defined higher in the hierarchy still runs
        super().setUp()


class UnicornTaintTrackerTest(_SharedTaintTrackerTest):  # pylint: disable=too-many-public-methods
    """Taint tracking tests executed on the x86 Unicorn model backend."""

    # Values consumed by the shared base class to select the backend
    _backend: Backend = "uc"
    _model_backend_name: str = "unicorn"


# Run the tests of this module when the file is executed directly
if __name__ == '__main__':
    unittest.main()